Commit 6e7adb7

Pushing the docs to dev/ for branch: master, commit 0b6308c2708fe03071cdbf24997eb967403f5965

1 parent: c63e022

File tree: 1,081 files changed (+4,644 -3,641 lines)

-1.5 KB: Binary file not shown.
-1.44 KB: Binary file not shown.
dev/_downloads/column_transformer.ipynb (new file, +54)

@@ -0,0 +1,54 @@
+{
+  "cells": [
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "collapsed": false
+      },
+      "outputs": [],
+      "source": [
+        "%matplotlib inline"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "\n# Column Transformer with Heterogeneous Data Sources\n\n\nDatasets can often contain components that require different feature\nextraction and processing pipelines. This scenario might occur when:\n\n1. Your dataset consists of heterogeneous data types (e.g. raster images and\n text captions)\n2. Your dataset is stored in a Pandas DataFrame and different columns\n require different processing pipelines.\n\nThis example demonstrates how to use\n:class:`sklearn.compose.ColumnTransformer` on a dataset containing\ndifferent types of features. We use the 20-newsgroups dataset and compute\nstandard bag-of-words features for the subject line and body in separate\npipelines as well as ad hoc features on the body. We combine them (with\nweights) using a ColumnTransformer and finally train a classifier on the\ncombined set of features.\n\nThe choice of features is not particularly helpful, but serves to illustrate\nthe technique.\n\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "collapsed": false
+      },
+      "outputs": [],
+      "source": [
+        "# Author: Matt Terry <[email protected]>\n#\n# License: BSD 3 clause\nfrom __future__ import print_function\n\nimport numpy as np\n\nfrom sklearn.base import BaseEstimator, TransformerMixin\nfrom sklearn.datasets import fetch_20newsgroups\nfrom sklearn.datasets.twenty_newsgroups import strip_newsgroup_footer\nfrom sklearn.datasets.twenty_newsgroups import strip_newsgroup_quoting\nfrom sklearn.decomposition import TruncatedSVD\nfrom sklearn.feature_extraction import DictVectorizer\nfrom sklearn.feature_extraction.text import TfidfVectorizer\nfrom sklearn.metrics import classification_report\nfrom sklearn.pipeline import Pipeline\nfrom sklearn.compose import ColumnTransformer\nfrom sklearn.svm import SVC\n\n\nclass TextStats(BaseEstimator, TransformerMixin):\n \"\"\"Extract features from each document for DictVectorizer\"\"\"\n\n def fit(self, x, y=None):\n return self\n\n def transform(self, posts):\n return [{'length': len(text),\n 'num_sentences': text.count('.')}\n for text in posts]\n\n\nclass SubjectBodyExtractor(BaseEstimator, TransformerMixin):\n \"\"\"Extract the subject & body from a usenet post in a single pass.\n\n Takes a sequence of strings and produces a dict of sequences. Keys are\n `subject` and `body`.\n \"\"\"\n def fit(self, x, y=None):\n return self\n\n def transform(self, posts):\n # construct object dtype array with two columns\n # first column = 'subject' and second column = 'body'\n features = np.empty(shape=(len(posts), 2), dtype=object)\n for i, text in enumerate(posts):\n headers, _, bod = text.partition('\\n\\n')\n bod = strip_newsgroup_footer(bod)\n bod = strip_newsgroup_quoting(bod)\n features[i, 1] = bod\n\n prefix = 'Subject:'\n sub = ''\n for line in headers.split('\\n'):\n if line.startswith(prefix):\n sub = line[len(prefix):]\n break\n features[i, 0] = sub\n\n return features\n\n\npipeline = Pipeline([\n # Extract the subject & body\n ('subjectbody', SubjectBodyExtractor()),\n\n # Use ColumnTransformer to combine the features from subject and body\n ('union', ColumnTransformer(\n [\n # Pulling features from the post's subject line (first column)\n ('subject', TfidfVectorizer(min_df=50), 0),\n\n # Pipeline for standard bag-of-words model for body (second column)\n ('body_bow', Pipeline([\n ('tfidf', TfidfVectorizer()),\n ('best', TruncatedSVD(n_components=50)),\n ]), 1),\n\n # Pipeline for pulling ad hoc features from post's body\n ('body_stats', Pipeline([\n ('stats', TextStats()), # returns a list of dicts\n ('vect', DictVectorizer()), # list of dicts -> feature matrix\n ]), 1),\n ],\n\n # weight components in ColumnTransformer\n transformer_weights={\n 'subject': 0.8,\n 'body_bow': 0.5,\n 'body_stats': 1.0,\n }\n )),\n\n # Use a SVC classifier on the combined features\n ('svc', SVC(kernel='linear')),\n])\n\n# limit the list of categories to make running this example faster.\ncategories = ['alt.atheism', 'talk.religion.misc']\ntrain = fetch_20newsgroups(random_state=1,\n subset='train',\n categories=categories,\n )\ntest = fetch_20newsgroups(random_state=1,\n subset='test',\n categories=categories,\n )\n\npipeline.fit(train.data, train.target)\ny = pipeline.predict(test.data)\nprint(classification_report(test.target, y))"
+      ]
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "Python 3",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.6.5"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 0
+}
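The heart of the new example is ColumnTransformer's (name, transformer, column) tuples: a scalar column index hands each transformer a single 1D column of the 2D object array produced by SubjectBodyExtractor. Below is a minimal sketch of that pattern on toy data; the array contents and transformer names are illustrative only, not part of this commit.

# Minimal sketch (illustrative data and names, not from the commit) of the
# ColumnTransformer pattern used in the example above.
import numpy as np

from sklearn.compose import ColumnTransformer
from sklearn.feature_extraction.text import TfidfVectorizer

# Column 0 plays the role of 'subject', column 1 the role of 'body'.
X = np.array([
    ['re: atheism', 'a longer body of text discussing atheism'],
    ['re: religion', 'a longer body of text discussing religion'],
    ['re: atheism', 'yet another post body, rather different'],
], dtype=object)

ct = ColumnTransformer(
    [
        # (name, transformer, column): a scalar column index passes a 1D
        # array of strings, which is what TfidfVectorizer expects.
        ('subject', TfidfVectorizer(), 0),
        ('body', TfidfVectorizer(), 1),
    ],
    # optional per-transformer weights, as in the example above
    transformer_weights={'subject': 0.8, 'body': 0.5},
)

features = ct.fit_transform(X)
print(features.shape)  # (3, n_subject_terms + n_body_terms)

fit_transform horizontally stacks each transformer's output, which is exactly what the 'union' step feeds the SVC in the example.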

dev/_downloads/hetero_feature_union.py renamed to dev/_downloads/column_transformer.py (+22 -67)
@@ -1,7 +1,7 @@
 """
-=============================================
-Feature Union with Heterogeneous Data Sources
-=============================================
+==================================================
+Column Transformer with Heterogeneous Data Sources
+==================================================
 
 Datasets can often contain components that require different feature
 extraction and processing pipelines. This scenario might occur when:
@@ -12,12 +12,12 @@
 require different processing pipelines.
 
 This example demonstrates how to use
-:class:`sklearn.feature_extraction.FeatureUnion` on a dataset containing
+:class:`sklearn.compose.ColumnTransformer` on a dataset containing
 different types of features. We use the 20-newsgroups dataset and compute
 standard bag-of-words features for the subject line and body in separate
 pipelines as well as ad hoc features on the body. We combine them (with
-weights) using a FeatureUnion and finally train a classifier on the combined
-set of features.
+weights) using a ColumnTransformer and finally train a classifier on the
+combined set of features.
 
 The choice of features is not particularly helpful, but serves to illustrate
 the technique.
@@ -38,50 +38,11 @@
 from sklearn.feature_extraction import DictVectorizer
 from sklearn.feature_extraction.text import TfidfVectorizer
 from sklearn.metrics import classification_report
-from sklearn.pipeline import FeatureUnion
 from sklearn.pipeline import Pipeline
+from sklearn.compose import ColumnTransformer
 from sklearn.svm import SVC
 
 
-class ItemSelector(BaseEstimator, TransformerMixin):
-    """For data grouped by feature, select subset of data at a provided key.
-
-    The data is expected to be stored in a 2D data structure, where the first
-    index is over features and the second is over samples. i.e.
-
-    >> len(data[key]) == n_samples
-
-    Please note that this is the opposite convention to scikit-learn feature
-    matrixes (where the first index corresponds to sample).
-
-    ItemSelector only requires that the collection implement getitem
-    (data[key]). Examples include: a dict of lists, 2D numpy array, Pandas
-    DataFrame, numpy record array, etc.
-
-    >> data = {'a': [1, 5, 2, 5, 2, 8],
-               'b': [9, 4, 1, 4, 1, 3]}
-    >> ds = ItemSelector(key='a')
-    >> data['a'] == ds.transform(data)
-
-    ItemSelector is not designed to handle data grouped by sample. (e.g. a
-    list of dicts). If your data is structured this way, consider a
-    transformer along the lines of `sklearn.feature_extraction.DictVectorizer`.
-
-    Parameters
-    ----------
-    key : hashable, required
-        The key corresponding to the desired value in a mappable.
-    """
-    def __init__(self, key):
-        self.key = key
-
-    def fit(self, x, y=None):
-        return self
-
-    def transform(self, data_dict):
-        return data_dict[self.key]
-
-
 class TextStats(BaseEstimator, TransformerMixin):
     """Extract features from each document for DictVectorizer"""
 
@@ -104,21 +65,22 @@ def fit(self, x, y=None):
         return self
 
     def transform(self, posts):
-        features = np.recarray(shape=(len(posts),),
-                               dtype=[('subject', object), ('body', object)])
+        # construct object dtype array with two columns
+        # first column = 'subject' and second column = 'body'
+        features = np.empty(shape=(len(posts), 2), dtype=object)
         for i, text in enumerate(posts):
             headers, _, bod = text.partition('\n\n')
             bod = strip_newsgroup_footer(bod)
             bod = strip_newsgroup_quoting(bod)
-            features['body'][i] = bod
+            features[i, 1] = bod
 
             prefix = 'Subject:'
             sub = ''
             for line in headers.split('\n'):
                 if line.startswith(prefix):
                     sub = line[len(prefix):]
                     break
-            features['subject'][i] = sub
+            features[i, 0] = sub
 
         return features
 
@@ -127,38 +89,31 @@ def transform(self, posts):
     # Extract the subject & body
     ('subjectbody', SubjectBodyExtractor()),
 
-    # Use FeatureUnion to combine the features from subject and body
-    ('union', FeatureUnion(
-        transformer_list=[
+    # Use ColumnTransformer to combine the features from subject and body
+    ('union', ColumnTransformer(
+        [
+            # Pulling features from the post's subject line (first column)
+            ('subject', TfidfVectorizer(min_df=50), 0),
 
-            # Pipeline for pulling features from the post's subject line
-            ('subject', Pipeline([
-                ('selector', ItemSelector(key='subject')),
-                ('tfidf', TfidfVectorizer(min_df=50)),
-            ])),
-
-            # Pipeline for standard bag-of-words model for body
+            # Pipeline for standard bag-of-words model for body (second column)
             ('body_bow', Pipeline([
-                ('selector', ItemSelector(key='body')),
                 ('tfidf', TfidfVectorizer()),
                 ('best', TruncatedSVD(n_components=50)),
-            ])),
+            ]), 1),
 
             # Pipeline for pulling ad hoc features from post's body
            ('body_stats', Pipeline([
-                ('selector', ItemSelector(key='body')),
                 ('stats', TextStats()),  # returns a list of dicts
                 ('vect', DictVectorizer()),  # list of dicts -> feature matrix
-            ])),
-
+            ]), 1),
         ],
 
-        # weight components in FeatureUnion
+        # weight components in ColumnTransformer
        transformer_weights={
             'subject': 0.8,
             'body_bow': 0.5,
             'body_stats': 1.0,
-        },
+        }
     )),
 
     # Use a SVC classifier on the combined features
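For readers migrating similar code, the change in the diff above is mechanical: under FeatureUnion every branch had to start with a selector transformer, whereas ColumnTransformer folds the selection into the (name, transformer, column) triple. The sketch below contrasts the two patterns; ColumnSelector is a hypothetical stand-in for the deleted ItemSelector, not code from the commit.

# Sketch of the migration performed in this diff. ColumnSelector is an
# illustrative stand-in for the removed ItemSelector; it is not in the commit.
from sklearn.base import BaseEstimator, TransformerMixin
from sklearn.compose import ColumnTransformer
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.pipeline import FeatureUnion, Pipeline


class ColumnSelector(BaseEstimator, TransformerMixin):
    """Select one column of a 2D array (hypothetical ItemSelector stand-in)."""

    def __init__(self, col):
        self.col = col

    def fit(self, X, y=None):
        return self

    def transform(self, X):
        return X[:, self.col]


# Before: every FeatureUnion branch needs its own selector step.
union_before = FeatureUnion([
    ('subject', Pipeline([('select', ColumnSelector(0)),
                          ('tfidf', TfidfVectorizer())])),
    ('body', Pipeline([('select', ColumnSelector(1)),
                       ('tfidf', TfidfVectorizer())])),
])

# After: the column index is the third element of each tuple, so the
# selector classes disappear entirely.
union_after = ColumnTransformer([
    ('subject', TfidfVectorizer(), 0),
    ('body', TfidfVectorizer(), 1),
])

On a two-column object array such as SubjectBodyExtractor returns, both produce the same horizontally stacked feature matrix; the ColumnTransformer version simply has fewer moving parts.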

dev/_downloads/hetero_feature_union.ipynb (-54)
This file was deleted.

dev/_downloads/scikit-learn-docs.pdf (-133 KB)
Binary file not shown.

dev/_images/iris.png and other images under dev/_images/ changed (37 small binary size deltas; remaining file names not shown).

0 commit comments