@@ -1465,7 +1465,7 @@ def test_openml_param_name_to_sklearn(self):
14651465 )
14661466 model = sklearn .pipeline .Pipeline (steps = [("scaler" , scaler ), ("boosting" , boosting )])
14671467 flow = self .extension .model_to_flow (model )
1468- task = openml .tasks .get_task (115 )
1468+ task = openml .tasks .get_task (115 ) # diabetes; crossvalidation
14691469 run = openml .runs .run_flow_on_task (flow , task )
14701470 run = run .publish ()
14711471 TestBase ._mark_entity_for_removal ("run" , run .run_id )
@@ -1561,7 +1561,7 @@ def setUp(self):
15611561 # Test methods for performing runs with this extension module
15621562
15631563 def test_run_model_on_task (self ):
1564- task = openml .tasks .get_task (1 )
1564+ task = openml .tasks .get_task (1 ) # anneal; crossvalidation
15651565 # using most_frequent imputer since dataset has mixed types and to keep things simple
15661566 pipe = sklearn .pipeline .Pipeline (
15671567 [
@@ -1626,7 +1626,7 @@ def test_seed_model_raises(self):
16261626 self .extension .seed_model (model = clf , seed = 42 )
16271627
16281628 def test_run_model_on_fold_classification_1_array (self ):
1629- task = openml .tasks .get_task (1 )
1629+ task = openml .tasks .get_task (1 ) # anneal; crossvalidation
16301630
16311631 X , y = task .get_X_and_y ()
16321632 train_indices , test_indices = task .get_train_test_split_indices (repeat = 0 , fold = 0 , sample = 0 )
@@ -1689,7 +1689,7 @@ def test_run_model_on_fold_classification_1_array(self):
16891689 def test_run_model_on_fold_classification_1_dataframe (self ):
16901690 from sklearn .compose import ColumnTransformer
16911691
1692- task = openml .tasks .get_task (1 )
1692+ task = openml .tasks .get_task (1 ) # anneal; crossvalidation
16931693
16941694 # diff test_run_model_on_fold_classification_1_array()
16951695 X , y = task .get_X_and_y (dataset_format = "dataframe" )
@@ -1753,7 +1753,7 @@ def test_run_model_on_fold_classification_1_dataframe(self):
17531753 )
17541754
17551755 def test_run_model_on_fold_classification_2 (self ):
1756- task = openml .tasks .get_task (7 )
1756+ task = openml .tasks .get_task (7 ) # kr-vs-kp; crossvalidation
17571757
17581758 X , y = task .get_X_and_y ()
17591759 train_indices , test_indices = task .get_train_test_split_indices (repeat = 0 , fold = 0 , sample = 0 )
@@ -1815,7 +1815,11 @@ def predict_proba(*args, **kwargs):
18151815 raise AttributeError ("predict_proba is not available when " "probability=False" )
18161816
18171817 # task 1 (test server) is important: it is a task with an unused class
1818- tasks = [1 , 3 , 115 ]
1818+ tasks = [
1819+ 1 , # anneal; crossvalidation
1820+ 3 , # anneal; crossvalidation
1821+ 115 , # diabetes; crossvalidation
1822+ ]
18191823 flow = unittest .mock .Mock ()
18201824 flow .name = "dummy"
18211825
@@ -1969,7 +1973,7 @@ def test__extract_trace_data(self):
19691973 "max_iter" : [10 , 20 , 40 , 80 ],
19701974 }
19711975 num_iters = 10
1972- task = openml .tasks .get_task (20 )
1976+ task = openml .tasks .get_task (20 ) # balance-scale; crossvalidation
19731977 clf = sklearn .model_selection .RandomizedSearchCV (
19741978 sklearn .neural_network .MLPClassifier (), param_grid , num_iters ,
19751979 )
@@ -2080,8 +2084,8 @@ def test_run_on_model_with_empty_steps(self):
20802084 from sklearn .compose import ColumnTransformer
20812085
20822086 # testing 'drop', 'passthrough', None as non-actionable sklearn estimators
2083- dataset = openml .datasets .get_dataset (128 )
2084- task = openml .tasks .get_task (59 )
2087+ dataset = openml .datasets .get_dataset (128 ) # iris
2088+ task = openml .tasks .get_task (59 ) # mfeat-pixel; crossvalidation
20852089
20862090 X , y , categorical_ind , feature_names = dataset .get_data (
20872091 target = dataset .default_target_attribute , dataset_format = "array"
@@ -2198,7 +2202,7 @@ def test_failed_serialization_of_custom_class(self):
21982202 steps = [("preprocess" , ct ), ("estimator" , sklearn .tree .DecisionTreeClassifier ())]
21992203 ) # build a sklearn classifier
22002204
2201- task = openml .tasks .get_task (253 ) # data with mixed types from test server
2205+ task = openml .tasks .get_task (253 ) # profb; crossvalidation
22022206 try :
22032207 _ = openml .runs .run_model_on_task (clf , task )
22042208 except AttributeError as e :
0 commit comments