
Commit 89997e7

Pushing the docs to dev/ for branch: master, commit 228109cd5c12c0c3374e37f13b48d7382d15a5a7
1 parent 8258e8a commit 89997e7

1,170 files changed (+3647, -3647 lines)


dev/_downloads/1abc4484d4183963e2039c8c679497eb/plot_sgd_comparison.ipynb

Lines changed: 1 addition & 1 deletion
@@ -26,7 +26,7 @@
 },
 "outputs": [],
 "source": [
-"# Author: Rob Zinkov <rob at zinkov dot com>\n# License: BSD 3 clause\n\nimport numpy as np\nimport matplotlib.pyplot as plt\nfrom sklearn import datasets\n\nfrom sklearn.model_selection import train_test_split\nfrom sklearn.linear_model import SGDClassifier, Perceptron\nfrom sklearn.linear_model import PassiveAggressiveClassifier\nfrom sklearn.linear_model import LogisticRegression\n\nheldout = [0.95, 0.90, 0.75, 0.50, 0.01]\nrounds = 20\nX, y = datasets.load_digits(return_X_y=True)\n\nclassifiers = [\n    (\"SGD\", SGDClassifier(max_iter=100)),\n    (\"ASGD\", SGDClassifier(average=True, max_iter=1000)),\n    (\"Perceptron\", Perceptron(tol=1e-3)),\n    (\"Passive-Aggressive I\", PassiveAggressiveClassifier(loss='hinge',\n                                                         C=1.0, tol=1e-4)),\n    (\"Passive-Aggressive II\", PassiveAggressiveClassifier(loss='squared_hinge',\n                                                          C=1.0, tol=1e-4)),\n    (\"SAG\", LogisticRegression(solver='sag', tol=1e-1, C=1.e4 / X.shape[0]))\n]\n\nxx = 1. - np.array(heldout)\n\nfor name, clf in classifiers:\n    print(\"training %s\" % name)\n    rng = np.random.RandomState(42)\n    yy = []\n    for i in heldout:\n        yy_ = []\n        for r in range(rounds):\n            X_train, X_test, y_train, y_test = \\\n                train_test_split(X, y, test_size=i, random_state=rng)\n            clf.fit(X_train, y_train)\n            y_pred = clf.predict(X_test)\n            yy_.append(1 - np.mean(y_pred == y_test))\n        yy.append(np.mean(yy_))\n    plt.plot(xx, yy, label=name)\n\nplt.legend(loc=\"upper right\")\nplt.xlabel(\"Proportion train\")\nplt.ylabel(\"Test Error Rate\")\nplt.show()"
+"# Author: Rob Zinkov <rob at zinkov dot com>\n# License: BSD 3 clause\n\nimport numpy as np\nimport matplotlib.pyplot as plt\nfrom sklearn import datasets\n\nfrom sklearn.model_selection import train_test_split\nfrom sklearn.linear_model import SGDClassifier, Perceptron\nfrom sklearn.linear_model import PassiveAggressiveClassifier\nfrom sklearn.linear_model import LogisticRegression\n\nheldout = [0.95, 0.90, 0.75, 0.50, 0.01]\nrounds = 20\nX, y = datasets.load_digits(return_X_y=True)\n\nclassifiers = [\n    (\"SGD\", SGDClassifier(max_iter=100)),\n    (\"ASGD\", SGDClassifier(average=True)),\n    (\"Perceptron\", Perceptron()),\n    (\"Passive-Aggressive I\", PassiveAggressiveClassifier(loss='hinge',\n                                                         C=1.0, tol=1e-4)),\n    (\"Passive-Aggressive II\", PassiveAggressiveClassifier(loss='squared_hinge',\n                                                          C=1.0, tol=1e-4)),\n    (\"SAG\", LogisticRegression(solver='sag', tol=1e-1, C=1.e4 / X.shape[0]))\n]\n\nxx = 1. - np.array(heldout)\n\nfor name, clf in classifiers:\n    print(\"training %s\" % name)\n    rng = np.random.RandomState(42)\n    yy = []\n    for i in heldout:\n        yy_ = []\n        for r in range(rounds):\n            X_train, X_test, y_train, y_test = \\\n                train_test_split(X, y, test_size=i, random_state=rng)\n            clf.fit(X_train, y_train)\n            y_pred = clf.predict(X_test)\n            yy_.append(1 - np.mean(y_pred == y_test))\n        yy.append(np.mean(yy_))\n    plt.plot(xx, yy, label=name)\n\nplt.legend(loc=\"upper right\")\nplt.xlabel(\"Proportion train\")\nplt.ylabel(\"Test Error Rate\")\nplt.show()"
 ]
 }
 ],

dev/_downloads/3650884f0a646ba96d2e47df0a6fb935/plot_sgd_comparison.py

Lines changed: 2 additions & 2 deletions
@@ -25,8 +25,8 @@
 
 classifiers = [
     ("SGD", SGDClassifier(max_iter=100)),
-    ("ASGD", SGDClassifier(average=True, max_iter=1000)),
-    ("Perceptron", Perceptron(tol=1e-3)),
+    ("ASGD", SGDClassifier(average=True)),
+    ("Perceptron", Perceptron()),
     ("Passive-Aggressive I", PassiveAggressiveClassifier(loss='hinge',
                                                          C=1.0, tol=1e-4)),
     ("Passive-Aggressive II", PassiveAggressiveClassifier(loss='squared_hinge',

dev/_downloads/388641d133587cc11aa26f2dbef4b950/plot_document_classification_20newsgroups.py

Lines changed: 1 addition & 1 deletion
@@ -247,7 +247,7 @@ def benchmark(clf):
 results = []
 for clf, name in (
         (RidgeClassifier(tol=1e-2, solver="sag"), "Ridge Classifier"),
-        (Perceptron(max_iter=50, tol=1e-3), "Perceptron"),
+        (Perceptron(max_iter=50), "Perceptron"),
         (PassiveAggressiveClassifier(max_iter=50, tol=1e-3),
          "Passive-Aggressive"),
         (KNeighborsClassifier(n_neighbors=10), "kNN"),
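The Perceptron entry above now relies on the default tol. A minimal, self-contained sketch of the same benchmark loop, using the digits dataset in place of 20 newsgroups (illustrative only; the example's benchmark() helper and text pipeline are not reproduced here):

# Toy stand-in for the example's benchmark loop (digits instead of text data).
from sklearn.datasets import load_digits
from sklearn.linear_model import Perceptron, RidgeClassifier
from sklearn.metrics import accuracy_score
from sklearn.model_selection import train_test_split

X, y = load_digits(return_X_y=True)
X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=0)

for clf, name in (
        (RidgeClassifier(tol=1e-2, solver="sag"), "Ridge Classifier"),
        (Perceptron(max_iter=50), "Perceptron"),
):
    clf.fit(X_train, y_train)
    print(name, accuracy_score(y_test, clf.predict(X_test)))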

dev/_downloads/3b31bf37034a6ece04667cd422e5ff79/plot_document_classification_20newsgroups.ipynb

Lines changed: 1 addition & 1 deletion
Large diffs are not rendered by default.

dev/_downloads/80692cf167e9ea27b27e5bd144159c82/plot_out_of_core_classification.py

Lines changed: 1 addition & 1 deletion
@@ -208,7 +208,7 @@ def progress(blocknum, bs, size):
 # Here are some classifiers that support the `partial_fit` method
 partial_fit_classifiers = {
     'SGD': SGDClassifier(max_iter=5),
-    'Perceptron': Perceptron(tol=1e-3),
+    'Perceptron': Perceptron(),
     'NB Multinomial': MultinomialNB(alpha=0.01),
     'Passive-Aggressive': PassiveAggressiveClassifier(tol=1e-3),
 }
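Each of these estimators supports incremental learning via partial_fit, which is why they can be trained on the Reuters stream one mini-batch at a time. A minimal sketch of that pattern with synthetic mini-batches standing in for the Reuters stream (batch sizes and labels here are illustrative):

# Incremental training with partial_fit on synthetic mini-batches.
import numpy as np
from sklearn.linear_model import Perceptron

clf = Perceptron()  # tol defaults to 1e-3 in recent scikit-learn releases
all_classes = np.array([0, 1])  # classes must be declared on the first call
rng = np.random.RandomState(0)

for _ in range(5):
    X_batch = rng.rand(100, 2 ** 8)         # one mini-batch of feature vectors
    y_batch = rng.randint(0, 2, size=100)   # binary labels, as in the example
    clf.partial_fit(X_batch, y_batch, classes=all_classes)

print("classes seen:", clf.classes_)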

dev/_downloads/b86db3a111b621a7beeaa9d099608e5b/plot_out_of_core_classification.ipynb

Lines changed: 1 addition & 1 deletion
@@ -62,7 +62,7 @@
 },
 "outputs": [],
 "source": [
-"vectorizer = HashingVectorizer(decode_error='ignore', n_features=2 ** 18,\n                               alternate_sign=False)\n\n\n# Iterator over parsed Reuters SGML files.\ndata_stream = stream_reuters_documents()\n\n# We learn a binary classification between the \"acq\" class and all the others.\n# \"acq\" was chosen as it is more or less evenly distributed in the Reuters\n# files. For other datasets, one should take care of creating a test set with\n# a realistic portion of positive instances.\nall_classes = np.array([0, 1])\npositive_class = 'acq'\n\n# Here are some classifiers that support the `partial_fit` method\npartial_fit_classifiers = {\n    'SGD': SGDClassifier(max_iter=5),\n    'Perceptron': Perceptron(tol=1e-3),\n    'NB Multinomial': MultinomialNB(alpha=0.01),\n    'Passive-Aggressive': PassiveAggressiveClassifier(tol=1e-3),\n}\n\n\ndef get_minibatch(doc_iter, size, pos_class=positive_class):\n    \"\"\"Extract a minibatch of examples, return a tuple X_text, y.\n\n    Note: size is before excluding invalid docs with no topics assigned.\n\n    \"\"\"\n    data = [('{title}\\n\\n{body}'.format(**doc), pos_class in doc['topics'])\n            for doc in itertools.islice(doc_iter, size)\n            if doc['topics']]\n    if not len(data):\n        return np.asarray([], dtype=int), np.asarray([], dtype=int)\n    X_text, y = zip(*data)\n    return X_text, np.asarray(y, dtype=int)\n\n\ndef iter_minibatches(doc_iter, minibatch_size):\n    \"\"\"Generator of minibatches.\"\"\"\n    X_text, y = get_minibatch(doc_iter, minibatch_size)\n    while len(X_text):\n        yield X_text, y\n        X_text, y = get_minibatch(doc_iter, minibatch_size)\n\n\n# test data statistics\ntest_stats = {'n_test': 0, 'n_test_pos': 0}\n\n# First we hold out a number of examples to estimate accuracy\nn_test_documents = 1000\ntick = time.time()\nX_test_text, y_test = get_minibatch(data_stream, 1000)\nparsing_time = time.time() - tick\ntick = time.time()\nX_test = vectorizer.transform(X_test_text)\nvectorizing_time = time.time() - tick\ntest_stats['n_test'] += len(y_test)\ntest_stats['n_test_pos'] += sum(y_test)\nprint(\"Test set is %d documents (%d positive)\" % (len(y_test), sum(y_test)))\n\n\ndef progress(cls_name, stats):\n    \"\"\"Report progress information, return a string.\"\"\"\n    duration = time.time() - stats['t0']\n    s = \"%20s classifier : \\t\" % cls_name\n    s += \"%(n_train)6d train docs (%(n_train_pos)6d positive) \" % stats\n    s += \"%(n_test)6d test docs (%(n_test_pos)6d positive) \" % test_stats\n    s += \"accuracy: %(accuracy).3f \" % stats\n    s += \"in %.2fs (%5d docs/s)\" % (duration, stats['n_train'] / duration)\n    return s\n\n\ncls_stats = {}\n\nfor cls_name in partial_fit_classifiers:\n    stats = {'n_train': 0, 'n_train_pos': 0,\n             'accuracy': 0.0, 'accuracy_history': [(0, 0)], 't0': time.time(),\n             'runtime_history': [(0, 0)], 'total_fit_time': 0.0}\n    cls_stats[cls_name] = stats\n\nget_minibatch(data_stream, n_test_documents)\n# Discard test set\n\n# We will feed the classifier with mini-batches of 1000 documents; this means\n# we have at most 1000 docs in memory at any time. The smaller the document\n# batch, the bigger the relative overhead of the partial fit methods.\nminibatch_size = 1000\n\n# Create the data_stream that parses Reuters SGML files and iterates on\n# documents as a stream.\nminibatch_iterators = iter_minibatches(data_stream, minibatch_size)\ntotal_vect_time = 0.0\n\n# Main loop : iterate on mini-batches of examples\nfor i, (X_train_text, y_train) in enumerate(minibatch_iterators):\n\n    tick = time.time()\n    X_train = vectorizer.transform(X_train_text)\n    total_vect_time += time.time() - tick\n\n    for cls_name, cls in partial_fit_classifiers.items():\n        tick = time.time()\n        # update estimator with examples in the current mini-batch\n        cls.partial_fit(X_train, y_train, classes=all_classes)\n\n        # accumulate test accuracy stats\n        cls_stats[cls_name]['total_fit_time'] += time.time() - tick\n        cls_stats[cls_name]['n_train'] += X_train.shape[0]\n        cls_stats[cls_name]['n_train_pos'] += sum(y_train)\n        tick = time.time()\n        cls_stats[cls_name]['accuracy'] = cls.score(X_test, y_test)\n        cls_stats[cls_name]['prediction_time'] = time.time() - tick\n        acc_history = (cls_stats[cls_name]['accuracy'],\n                       cls_stats[cls_name]['n_train'])\n        cls_stats[cls_name]['accuracy_history'].append(acc_history)\n        run_history = (cls_stats[cls_name]['accuracy'],\n                       total_vect_time + cls_stats[cls_name]['total_fit_time'])\n        cls_stats[cls_name]['runtime_history'].append(run_history)\n\n        if i % 3 == 0:\n            print(progress(cls_name, cls_stats[cls_name]))\n    if i % 3 == 0:\n        print('\\n')"
+"vectorizer = HashingVectorizer(decode_error='ignore', n_features=2 ** 18,\n                               alternate_sign=False)\n\n\n# Iterator over parsed Reuters SGML files.\ndata_stream = stream_reuters_documents()\n\n# We learn a binary classification between the \"acq\" class and all the others.\n# \"acq\" was chosen as it is more or less evenly distributed in the Reuters\n# files. For other datasets, one should take care of creating a test set with\n# a realistic portion of positive instances.\nall_classes = np.array([0, 1])\npositive_class = 'acq'\n\n# Here are some classifiers that support the `partial_fit` method\npartial_fit_classifiers = {\n    'SGD': SGDClassifier(max_iter=5),\n    'Perceptron': Perceptron(),\n    'NB Multinomial': MultinomialNB(alpha=0.01),\n    'Passive-Aggressive': PassiveAggressiveClassifier(tol=1e-3),\n}\n\n\ndef get_minibatch(doc_iter, size, pos_class=positive_class):\n    \"\"\"Extract a minibatch of examples, return a tuple X_text, y.\n\n    Note: size is before excluding invalid docs with no topics assigned.\n\n    \"\"\"\n    data = [('{title}\\n\\n{body}'.format(**doc), pos_class in doc['topics'])\n            for doc in itertools.islice(doc_iter, size)\n            if doc['topics']]\n    if not len(data):\n        return np.asarray([], dtype=int), np.asarray([], dtype=int)\n    X_text, y = zip(*data)\n    return X_text, np.asarray(y, dtype=int)\n\n\ndef iter_minibatches(doc_iter, minibatch_size):\n    \"\"\"Generator of minibatches.\"\"\"\n    X_text, y = get_minibatch(doc_iter, minibatch_size)\n    while len(X_text):\n        yield X_text, y\n        X_text, y = get_minibatch(doc_iter, minibatch_size)\n\n\n# test data statistics\ntest_stats = {'n_test': 0, 'n_test_pos': 0}\n\n# First we hold out a number of examples to estimate accuracy\nn_test_documents = 1000\ntick = time.time()\nX_test_text, y_test = get_minibatch(data_stream, 1000)\nparsing_time = time.time() - tick\ntick = time.time()\nX_test = vectorizer.transform(X_test_text)\nvectorizing_time = time.time() - tick\ntest_stats['n_test'] += len(y_test)\ntest_stats['n_test_pos'] += sum(y_test)\nprint(\"Test set is %d documents (%d positive)\" % (len(y_test), sum(y_test)))\n\n\ndef progress(cls_name, stats):\n    \"\"\"Report progress information, return a string.\"\"\"\n    duration = time.time() - stats['t0']\n    s = \"%20s classifier : \\t\" % cls_name\n    s += \"%(n_train)6d train docs (%(n_train_pos)6d positive) \" % stats\n    s += \"%(n_test)6d test docs (%(n_test_pos)6d positive) \" % test_stats\n    s += \"accuracy: %(accuracy).3f \" % stats\n    s += \"in %.2fs (%5d docs/s)\" % (duration, stats['n_train'] / duration)\n    return s\n\n\ncls_stats = {}\n\nfor cls_name in partial_fit_classifiers:\n    stats = {'n_train': 0, 'n_train_pos': 0,\n             'accuracy': 0.0, 'accuracy_history': [(0, 0)], 't0': time.time(),\n             'runtime_history': [(0, 0)], 'total_fit_time': 0.0}\n    cls_stats[cls_name] = stats\n\nget_minibatch(data_stream, n_test_documents)\n# Discard test set\n\n# We will feed the classifier with mini-batches of 1000 documents; this means\n# we have at most 1000 docs in memory at any time. The smaller the document\n# batch, the bigger the relative overhead of the partial fit methods.\nminibatch_size = 1000\n\n# Create the data_stream that parses Reuters SGML files and iterates on\n# documents as a stream.\nminibatch_iterators = iter_minibatches(data_stream, minibatch_size)\ntotal_vect_time = 0.0\n\n# Main loop : iterate on mini-batches of examples\nfor i, (X_train_text, y_train) in enumerate(minibatch_iterators):\n\n    tick = time.time()\n    X_train = vectorizer.transform(X_train_text)\n    total_vect_time += time.time() - tick\n\n    for cls_name, cls in partial_fit_classifiers.items():\n        tick = time.time()\n        # update estimator with examples in the current mini-batch\n        cls.partial_fit(X_train, y_train, classes=all_classes)\n\n        # accumulate test accuracy stats\n        cls_stats[cls_name]['total_fit_time'] += time.time() - tick\n        cls_stats[cls_name]['n_train'] += X_train.shape[0]\n        cls_stats[cls_name]['n_train_pos'] += sum(y_train)\n        tick = time.time()\n        cls_stats[cls_name]['accuracy'] = cls.score(X_test, y_test)\n        cls_stats[cls_name]['prediction_time'] = time.time() - tick\n        acc_history = (cls_stats[cls_name]['accuracy'],\n                       cls_stats[cls_name]['n_train'])\n        cls_stats[cls_name]['accuracy_history'].append(acc_history)\n        run_history = (cls_stats[cls_name]['accuracy'],\n                       total_vect_time + cls_stats[cls_name]['total_fit_time'])\n        cls_stats[cls_name]['runtime_history'].append(run_history)\n\n        if i % 3 == 0:\n            print(progress(cls_name, cls_stats[cls_name]))\n    if i % 3 == 0:\n        print('\\n')"
 ]
 },
 {

dev/_downloads/scikit-learn-docs.pdf

3.11 KB
Binary file not shown.

dev/_images/iris.png

Binary file not shown.

dev/_sources/auto_examples/applications/plot_face_recognition.rst.txt

Lines changed: 17 additions & 17 deletions
