automl
diff --git a/‎development/_downloads/bb7d59d9ddc2ff29f0d6eb99747a3347/example_resampling.ipynb
Lines changed: 1 addition & 1 deletion b/‎development/_downloads/bb7d59d9ddc2ff29f0d6eb99747a3347/example_resampling.ipynb
Lines changed: 1 addition & 1 deletion
diff --git a/‎development/_downloads/bc82bea3a5dd7bdba60b65220891d9e5/examples_python.zip
72 Bytes b/‎development/_downloads/bc82bea3a5dd7bdba60b65220891d9e5/examples_python.zip
72 Bytes
diff --git a/‎development/_downloads/c6beb850ad22be83885d2737cca63b33/example_resampling.py
Lines changed: 4 additions & 1 deletion b/‎development/_downloads/c6beb850ad22be83885d2737cca63b33/example_resampling.py
Lines changed: 4 additions & 1 deletion
diff --git a/‎development/_downloads/fb625db3c50d423b1b7881136ffdeec8/examples_jupyter.zip
75 Bytes b/‎development/_downloads/fb625db3c50d423b1b7881136ffdeec8/examples_jupyter.zip
75 Bytes
diff --git a/‎development/_images/sphx_glr_example_inspect_predictions_001.png
-567 Bytes b/‎development/_images/sphx_glr_example_inspect_predictions_001.png
-567 Bytes
diff --git a/‎development/_images/sphx_glr_example_inspect_predictions_002.png
39 KB b/‎development/_images/sphx_glr_example_inspect_predictions_002.png
39 KB
diff --git a/‎development/_images/sphx_glr_example_inspect_predictions_003.png
1.37 KB b/‎development/_images/sphx_glr_example_inspect_predictions_003.png
1.37 KB
diff --git a/‎development/_images/sphx_glr_example_inspect_predictions_thumb.png
-516 Bytes b/‎development/_images/sphx_glr_example_inspect_predictions_thumb.png
-516 Bytes
diff --git a/‎development/_images/sphx_glr_example_pandas_train_test_001.png
699 Bytes b/‎development/_images/sphx_glr_example_pandas_train_test_001.png
699 Bytes
diff --git a/‎development/_images/sphx_glr_example_pandas_train_test_thumb.png
4.22 KB b/‎development/_images/sphx_glr_example_pandas_train_test_thumb.png
4.22 KB
diff --git a/‎development/_images/sphx_glr_example_regression_001.png
0 Bytes b/‎development/_images/sphx_glr_example_regression_001.png
0 Bytes
diff --git a/‎development/_sources/examples/20_basic/example_classification.rst.txt
Lines changed: 111 additions & 39 deletions b/‎development/_sources/examples/20_basic/example_classification.rst.txt
Lines changed: 111 additions & 39 deletions
diff --git a/‎development/_sources/examples/20_basic/example_multilabel_classification.rst.txt
Lines changed: 2 additions & 2 deletions b/‎development/_sources/examples/20_basic/example_multilabel_classification.rst.txt
Lines changed: 2 additions & 2 deletions
diff --git a/‎development/_sources/examples/20_basic/example_multioutput_regression.rst.txt
Lines changed: 4 additions & 4 deletions b/‎development/_sources/examples/20_basic/example_multioutput_regression.rst.txt
Lines changed: 4 additions & 4 deletions
diff --git a/‎development/_sources/examples/20_basic/example_regression.rst.txt
Lines changed: 6 additions & 6 deletions b/‎development/_sources/examples/20_basic/example_regression.rst.txt
Lines changed: 6 additions & 6 deletions
diff --git a/‎development/_sources/examples/20_basic/sg_execution_times.rst.txt
Lines changed: 5 additions & 5 deletions b/‎development/_sources/examples/20_basic/sg_execution_times.rst.txt
Lines changed: 5 additions & 5 deletions
diff --git a/‎development/_sources/examples/40_advanced/example_calc_multiple_metrics.rst.txt
Lines changed: 33 additions & 30 deletions b/‎development/_sources/examples/40_advanced/example_calc_multiple_metrics.rst.txt
Lines changed: 33 additions & 30 deletions
@@ -141,7 +141,7 @@
       },
       "outputs": [],
       "source": [
-        "resampling_strategy = sklearn.model_selection.PredefinedSplit(\n    test_fold=np.where(X_train[:, 0] < np.mean(X_train[:, 0]))[0]\n)\n\nautoml = autosklearn.classification.AutoSklearnClassifier(\n    time_left_for_this_task=120,\n    per_run_time_limit=30,\n    tmp_folder='/tmp/autosklearn_resampling_example_tmp',\n    disable_evaluator_output=False,\n    resampling_strategy=resampling_strategy,\n)\nautoml.fit(X_train, y_train, dataset_name='breast_cancer')"
+        "selected_indices = (X_train[:, 0] < np.mean(X_train[:, 0])).astype(int)\nresampling_strategy = sklearn.model_selection.PredefinedSplit(\n    test_fold=selected_indices\n)\n\nautoml = autosklearn.classification.AutoSklearnClassifier(\n    time_left_for_this_task=120,\n    per_run_time_limit=30,\n    tmp_folder='/tmp/autosklearn_resampling_example_tmp',\n    disable_evaluator_output=False,\n    resampling_strategy=resampling_strategy,\n)\nautoml.fit(X_train, y_train, dataset_name='breast_cancer')\n\nprint(automl.sprint_statistics())"
       ]
     },
     {
 
@@ -98,8 +98,9 @@
 # data by the first feature. In practice, one would use a splitting according
 # to the use case at hand.
 
+selected_indices = (X_train[:, 0] < np.mean(X_train[:, 0])).astype(int)
 resampling_strategy = sklearn.model_selection.PredefinedSplit(
-    test_fold=np.where(X_train[:, 0] < np.mean(X_train[:, 0]))[0]
+    test_fold=selected_indices
 )
 
 automl = autosklearn.classification.AutoSklearnClassifier(
@@ -111,6 +112,8 @@
 )
 automl.fit(X_train, y_train, dataset_name='breast_cancer')
 
+print(automl.sprint_statistics())
+
 ############################################################################
 # For custom resampling strategies (i.e. resampling strategies that are not
 # defined as strings by Auto-sklearn) it is necessary to perform a refit:
 
@@ -154,7 +154,7 @@ View the models found by auto-sklearn
 
               rank  ensemble_weight           type      cost  duration
     model_id                                                          
-    2            1              1.0  random_forest  0.447294  4.619741
+    2            1              1.0  random_forest  0.447294  3.722532
 
 
 
@@ -262,7 +262,7 @@ Get the Score of the final ensemble
 
 .. rst-class:: sphx-glr-timing
 
-   **Total running time of the script:** ( 0 minutes  16.665 seconds)
+   **Total running time of the script:** ( 0 minutes  17.564 seconds)
 
 
 .. _sphx_glr_download_examples_20_basic_example_multilabel_classification.py:
 
@@ -124,7 +124,7 @@ View the models found by auto-sklearn
 
               rank  ensemble_weight              type          cost  duration
     model_id                                                                 
-    11           1              1.0  gaussian_process  1.845174e-09  6.166486
+    20           1              1.0  gaussian_process  2.198749e-08  4.786565
 
 
 
@@ -151,7 +151,7 @@ Print the final ensemble constructed by auto-sklearn
 
  .. code-block:: none
 
-    [(1.000000, SimpleRegressionPipeline({'data_preprocessor:__choice__': 'feature_type', 'feature_preprocessor:__choice__': 'no_preprocessing', 'regressor:__choice__': 'gaussian_process', 'data_preprocessor:feature_type:categorical_transformer:categorical_encoding:__choice__': 'one_hot_encoding', 'data_preprocessor:feature_type:categorical_transformer:category_coalescence:__choice__': 'minority_coalescer', 'data_preprocessor:feature_type:numerical_transformer:imputation:strategy': 'most_frequent', 'data_preprocessor:feature_type:numerical_transformer:rescaling:__choice__': 'robust_scaler', 'regressor:gaussian_process:alpha': 1.6650724498551164e-11, 'regressor:gaussian_process:thetaL': 5.222627524598125e-10, 'regressor:gaussian_process:thetaU': 5801.524168449955, 'data_preprocessor:feature_type:categorical_transformer:category_coalescence:minority_coalescer:minimum_fraction': 0.0809214996879808, 'data_preprocessor:feature_type:numerical_transformer:rescaling:robust_scaler:q_max': 0.9020530113478731, 'data_preprocessor:feature_type:numerical_transformer:rescaling:robust_scaler:q_min': 0.10288728233229412},
+    [(1.000000, SimpleRegressionPipeline({'data_preprocessor:__choice__': 'feature_type', 'feature_preprocessor:__choice__': 'extra_trees_preproc_for_regression', 'regressor:__choice__': 'gaussian_process', 'data_preprocessor:feature_type:categorical_transformer:categorical_encoding:__choice__': 'encoding', 'data_preprocessor:feature_type:categorical_transformer:category_coalescence:__choice__': 'minority_coalescer', 'data_preprocessor:feature_type:numerical_transformer:imputation:strategy': 'mean', 'data_preprocessor:feature_type:numerical_transformer:rescaling:__choice__': 'standardize', 'feature_preprocessor:extra_trees_preproc_for_regression:bootstrap': 'True', 'feature_preprocessor:extra_trees_preproc_for_regression:criterion': 'mae', 'feature_preprocessor:extra_trees_preproc_for_regression:max_depth': 'None', 'feature_preprocessor:extra_trees_preproc_for_regression:max_features': 0.5166678376035129, 'feature_preprocessor:extra_trees_preproc_for_regression:max_leaf_nodes': 'None', 'feature_preprocessor:extra_trees_preproc_for_regression:min_samples_leaf': 1, 'feature_preprocessor:extra_trees_preproc_for_regression:min_samples_split': 9, 'feature_preprocessor:extra_trees_preproc_for_regression:min_weight_fraction_leaf': 0.0, 'feature_preprocessor:extra_trees_preproc_for_regression:n_estimators': 100, 'regressor:gaussian_process:alpha': 4.2478708206859043e-10, 'regressor:gaussian_process:thetaL': 1.158691069519535e-05, 'regressor:gaussian_process:thetaU': 1167.1248238015862, 'data_preprocessor:feature_type:categorical_transformer:category_coalescence:minority_coalescer:minimum_fraction': 0.01017601832778754},
     dataset_properties={
       'task': 5,
       'sparse': False,
@@ -186,7 +186,7 @@ Get the Score of the final ensemble
 
  .. code-block:: none
 
-    R2 score: 0.9999999995848977
+    R2 score: 0.9999999937620259
 
 
 
@@ -409,7 +409,7 @@ Get the configuration space
 
 .. rst-class:: sphx-glr-timing
 
-   **Total running time of the script:** ( 1 minutes  55.688 seconds)
+   **Total running time of the script:** ( 2 minutes  1.233 seconds)
 
 
 .. _sphx_glr_download_examples_20_basic_example_multioutput_regression.py:
 
@@ -121,11 +121,11 @@ View the models found by auto-sklearn
 
               rank  ensemble_weight               type      cost   duration
     model_id                                                               
-    25           1             0.46                sgd  0.436679   0.830493
-    6            2             0.32     ard_regression  0.455042   0.827029
-    27           3             0.14     ard_regression  0.462249   0.856700
-    11           4             0.02      random_forest  0.507400  12.339479
-    7            5             0.06  gradient_boosting  0.518673   1.640017
+    25           1             0.46                sgd  0.436679   0.732215
+    6            2             0.32     ard_regression  0.455042   0.723179
+    27           3             0.14     ard_regression  0.462249   0.728957
+    11           4             0.02      random_forest  0.507400  10.798643
+    7            5             0.06  gradient_boosting  0.518673   1.353502
 
 
 
@@ -267,7 +267,7 @@ the true value).
 
 .. rst-class:: sphx-glr-timing
 
-   **Total running time of the script:** ( 1 minutes  56.297 seconds)
+   **Total running time of the script:** ( 2 minutes  0.468 seconds)
 
 
 .. _sphx_glr_download_examples_20_basic_example_regression.py:
 
@@ -5,14 +5,14 @@
 
 Computation times
 =================
-**06:11.822** total execution time for **examples_20_basic** files:
+**06:21.704** total execution time for **examples_20_basic** files:
 
 +-------------------------------------------------------------------------------------------------------------------+-----------+--------+
-| :ref:`sphx_glr_examples_20_basic_example_classification.py` (``example_classification.py``)                       | 02:03.173 | 0.0 MB |
+| :ref:`sphx_glr_examples_20_basic_example_classification.py` (``example_classification.py``)                       | 02:02.438 | 0.0 MB |
 +-------------------------------------------------------------------------------------------------------------------+-----------+--------+
-| :ref:`sphx_glr_examples_20_basic_example_regression.py` (``example_regression.py``)                               | 01:56.297 | 0.0 MB |
+| :ref:`sphx_glr_examples_20_basic_example_multioutput_regression.py` (``example_multioutput_regression.py``)       | 02:01.233 | 0.0 MB |
 +-------------------------------------------------------------------------------------------------------------------+-----------+--------+
-| :ref:`sphx_glr_examples_20_basic_example_multioutput_regression.py` (``example_multioutput_regression.py``)       | 01:55.688 | 0.0 MB |
+| :ref:`sphx_glr_examples_20_basic_example_regression.py` (``example_regression.py``)                               | 02:00.468 | 0.0 MB |
 +-------------------------------------------------------------------------------------------------------------------+-----------+--------+
-| :ref:`sphx_glr_examples_20_basic_example_multilabel_classification.py` (``example_multilabel_classification.py``) | 00:16.665 | 0.0 MB |
+| :ref:`sphx_glr_examples_20_basic_example_multilabel_classification.py` (``example_multilabel_classification.py``) | 00:17.564 | 0.0 MB |
 +-------------------------------------------------------------------------------------------------------------------+-----------+--------+
@@ -154,46 +154,49 @@ Get the Score of the final ensemble
     ################################################################################
     Metric results
      rank_test_scores param_classifier:__choice__  mean_test_score  metric_balanced_accuracy  metric_precision  metric_recall  metric_f1  metric_custom_error
-                    5               random_forest         0.971631                  0.969533          0.977528       0.977528   0.977528             0.028369
-                    5                         mlp         0.971631                  0.961538          0.956989       1.000000   0.978022             0.028369
-                   27                         mlp         0.943262                  0.935069          0.945055       0.966292   0.955556             0.056738
-                   15               random_forest         0.964539                  0.959918          0.966667       0.977528   0.972067             0.035461
-                    5                         mlp         0.971631                  0.961538          0.956989       1.000000   0.978022             0.028369
+                    4               random_forest         0.971631                  0.969533          0.977528       0.977528   0.977528             0.028369
+                    4                         mlp         0.971631                  0.961538          0.956989       1.000000   0.978022             0.028369
+                   29                         mlp         0.943262                  0.935069          0.945055       0.966292   0.955556             0.056738
+                   18               random_forest         0.964539                  0.959918          0.966667       0.977528   0.972067             0.035461
+                    4                         mlp         0.971631                  0.961538          0.956989       1.000000   0.978022             0.028369
                     1                 extra_trees         0.985816                  0.984767          0.988764       0.988764   0.988764             0.014184
-                   15               random_forest         0.964539                  0.963915          0.977273       0.966292   0.971751             0.035461
-                   20                 extra_trees         0.957447                  0.954300          0.966292       0.966292   0.966292             0.042553
-                    5               random_forest         0.971631                  0.969533          0.977528       0.977528   0.977528             0.028369
-                    5               random_forest         0.971631                  0.969533          0.977528       0.977528   0.977528             0.028369
-                   15           gradient_boosting         0.964539                  0.963915          0.977273       0.966292   0.971751             0.035461
-                    5           gradient_boosting         0.971631                  0.965536          0.967033       0.988764   0.977778             0.028369
-                    5                         mlp         0.971631                  0.965536          0.967033       0.988764   0.977778             0.028369
-                   24                         mlp         0.950355                  0.948682          0.965909       0.955056   0.960452             0.049645
+                   18               random_forest         0.964539                  0.963915          0.977273       0.966292   0.971751             0.035461
+                   24                 extra_trees         0.957447                  0.954300          0.966292       0.966292   0.966292             0.042553
+                    4               random_forest         0.971631                  0.969533          0.977528       0.977528   0.977528             0.028369
+                    4               random_forest         0.971631                  0.969533          0.977528       0.977528   0.977528             0.028369
+                   18           gradient_boosting         0.964539                  0.963915          0.977273       0.966292   0.971751             0.035461
+                    4           gradient_boosting         0.971631                  0.965536          0.967033       0.988764   0.977778             0.028369
+                    4                         mlp         0.971631                  0.965536          0.967033       0.988764   0.977778             0.028369
+                   26                         mlp         0.950355                  0.948682          0.965909       0.955056   0.960452             0.049645
                     2           gradient_boosting         0.978723                  0.975151          0.977778       0.988764   0.983240             0.021277
-                   15           gradient_boosting         0.964539                  0.959918          0.966667       0.977528   0.972067             0.035461
-                   15               random_forest         0.964539                  0.959918          0.966667       0.977528   0.972067             0.035461
-                    5                 extra_trees         0.971631                  0.969533          0.977528       0.977528   0.977528             0.028369
-                   32          passive_aggressive         0.921986                  0.894231          0.890000       1.000000   0.941799             0.078014
+                   18           gradient_boosting         0.964539                  0.959918          0.966667       0.977528   0.972067             0.035461
+                   18               random_forest         0.964539                  0.959918          0.966667       0.977528   0.972067             0.035461
+                    4                 extra_trees         0.971631                  0.969533          0.977528       0.977528   0.977528             0.028369
+                   34          passive_aggressive         0.921986                  0.894231          0.890000       1.000000   0.941799             0.078014
                     2                 extra_trees         0.978723                  0.975151          0.977778       0.988764   0.983240             0.021277
-                    5           gradient_boosting         0.971631                  0.965536          0.967033       0.988764   0.977778             0.028369
-                   24                         mlp         0.950355                  0.940687          0.945652       0.977528   0.961326             0.049645
-                   30               random_forest         0.929078                  0.923833          0.943820       0.943820   0.943820             0.070922
-                   20                    adaboost         0.957447                  0.950303          0.956044       0.977528   0.966667             0.042553
-                    5                 extra_trees         0.971631                  0.965536          0.967033       0.988764   0.977778             0.028369
-                   20                 extra_trees         0.957447                  0.954300          0.966292       0.966292   0.966292             0.042553
-                   30                bernoulli_nb         0.929078                  0.923833          0.943820       0.943820   0.943820             0.070922
-                    2                 extra_trees         0.978723                  0.979149          0.988636       0.977528   0.983051             0.021277
-                   20               liblinear_svc         0.957447                  0.954300          0.966292       0.966292   0.966292             0.042553
-                   27                 gaussian_nb         0.943262                  0.935069          0.945055       0.966292   0.955556             0.056738
-                   24                 extra_trees         0.950355                  0.936690          0.936170       0.988764   0.961749             0.049645
-                   27               random_forest         0.943262                  0.943064          0.965517       0.943820   0.954545             0.056738
+                    4           gradient_boosting         0.971631                  0.965536          0.967033       0.988764   0.977778             0.028369
+                   26                         mlp         0.950355                  0.940687          0.945652       0.977528   0.961326             0.049645
+                   33               random_forest         0.929078                  0.923833          0.943820       0.943820   0.943820             0.070922
+                   24                    adaboost         0.957447                  0.950303          0.956044       0.977528   0.966667             0.042553
+                    4                 extra_trees         0.971631                  0.965536          0.967033       0.988764   0.977778             0.028369
+                    4                 extra_trees         0.971631                  0.969533          0.977528       0.977528   0.977528             0.028369
+                   31                         lda         0.936170                  0.925454          0.934783       0.966292   0.950276             0.063830
+                    4                 extra_trees         0.971631                  0.965536          0.967033       0.988764   0.977778             0.028369
+                    4                         lda         0.971631                  0.961538          0.956989       1.000000   0.978022             0.028369
+                   18               liblinear_svc         0.964539                  0.959918          0.966667       0.977528   0.972067             0.035461
+                    4               liblinear_svc         0.971631                  0.965536          0.967033       0.988764   0.977778             0.028369
+                   29                    adaboost         0.943262                  0.943064          0.965517       0.943820   0.954545             0.056738
+                   31               random_forest         0.936170                  0.937446          0.965116       0.932584   0.948571             0.063830
+                   26                    adaboost         0.950355                  0.952679          0.976744       0.943820   0.960000             0.049645
+                   35                 extra_trees         0.631206                  0.500000          0.631206       1.000000   0.773913             0.368794
 
 
 
 
 
 .. rst-class:: sphx-glr-timing
 
-   **Total running time of the script:** ( 2 minutes  1.880 seconds)
+   **Total running time of the script:** ( 2 minutes  3.281 seconds)
 
 
 .. _sphx_glr_download_examples_40_advanced_example_calc_multiple_metrics.py:
Original file line number	Diff line number	Diff line change
`@@ -141,7 +141,7 @@`
`141`	`141`	`},`
`142`	`142`	`"outputs": [],`
`143`	`143`	`"source": [`
`144`		`- "resampling_strategy = sklearn.model_selection.PredefinedSplit(\n test_fold=np.where(X_train[:, 0] < np.mean(X_train[:, 0]))[0]\n)\n\nautoml = autosklearn.classification.AutoSklearnClassifier(\n time_left_for_this_task=120,\n per_run_time_limit=30,\n tmp_folder='/tmp/autosklearn_resampling_example_tmp',\n disable_evaluator_output=False,\n resampling_strategy=resampling_strategy,\n)\nautoml.fit(X_train, y_train, dataset_name='breast_cancer')"`
	`144`	+ "selected_indices = (X_train[:, 0] < np.mean(X_train[:, 0])).astype(int)\nresampling_strategy = sklearn.model_selection.PredefinedSplit(\n test_fold=selected_indices\n)\n\nautoml = autosklearn.classification.AutoSklearnClassifier(\n time_left_for_this_task=120,\n per_run_time_limit=30,\n tmp_folder='/tmp/autosklearn_resampling_example_tmp',\n disable_evaluator_output=False,\n resampling_strategy=resampling_strategy,\n)\nautoml.fit(X_train, y_train, dataset_name='breast_cancer')\n\nprint(automl.sprint_statistics())"
`145`	`145`	`]`
`146`	`146`	`},`
`147`	`147`	`{`