model_pipeline = Pipeline(steps=[ ("dimension_reduction", PCA(n_components=10)), ("classifiers", RandomForestClassifier()) ]) model_pipeline.fit(train_data.values, train_labels.values) predictions = model_pipeline.predict(predict_data.values)