@@ -244,6 +244,7 @@ def test_get_datasets(self):
244244 assert len (datasets ) == 2
245245 _assert_datasets_retrieved_successfully ([1 , 2 ])
246246
247+ @pytest .mark .xfail (reason = "failures_issue_1544" )
247248 def test_get_dataset_by_name (self ):
248249 dataset = openml .datasets .get_dataset ("anneal" )
249250 assert type (dataset ) == OpenMLDataset
@@ -262,6 +263,7 @@ def test_get_dataset_download_all_files(self):
262263 # test_get_dataset_lazy
263264 raise NotImplementedError
264265
266+ @pytest .mark .xfail (reason = "failures_issue_1544" )
265267 def test_get_dataset_uint8_dtype (self ):
266268 dataset = openml .datasets .get_dataset (1 )
267269 assert type (dataset ) == OpenMLDataset
@@ -280,6 +282,7 @@ def test_dataset_by_name_cannot_access_private_data(self):
280282 self .use_production_server ()
281283 self .assertRaises (OpenMLPrivateDatasetError , openml .datasets .get_dataset , "NAME_GOES_HERE" )
282284
285+ @pytest .mark .xfail (reason = "failures_issue_1544" )
283286 def test_get_dataset_lazy_all_functions (self ):
284287 """Test that all expected functionality is available without downloading the dataset."""
285288 dataset = openml .datasets .get_dataset (1 )
@@ -309,6 +312,7 @@ def ensure_absence_of_real_data():
309312 assert classes == ["1" , "2" , "3" , "4" , "5" , "U" ]
310313 ensure_absence_of_real_data ()
311314
315+ @pytest .mark .xfail (reason = "failures_issue_1544" )
312316 def test_get_dataset_sparse (self ):
313317 dataset = openml .datasets .get_dataset (102 )
314318 X , * _ = dataset .get_data ()
@@ -327,6 +331,7 @@ def test__get_dataset_description(self):
327331 description_xml_path = os .path .join (self .workdir , "description.xml" )
328332 assert os .path .exists (description_xml_path )
329333
334+ @pytest .mark .xfail (reason = "failures_issue_1544" )
330335 def test__getarff_path_dataset_arff (self ):
331336 openml .config .set_root_cache_directory (self .static_cache_dir )
332337 description = _get_dataset_description (self .workdir , 2 )
@@ -430,12 +435,14 @@ def test__getarff_md5_issue(self):
430435
431436 openml .config .connection_n_retries = n
432437
@pytest.mark.xfail(reason="failures_issue_1544")
def test__get_dataset_features(self):
    """Check that fetching the features file for dataset 2 yields a ``Path``.

    Calls ``_get_dataset_features_file`` with the test working directory and
    dataset id 2, then verifies that ``features.xml`` exists directly under
    ``self.workdir``.

    Marked as an expected failure; the reason string points at issue 1544.
    """
    returned_path = _get_dataset_features_file(self.workdir, 2)
    assert isinstance(returned_path, Path)

    # The helper is expected to have left the XML file in the work directory.
    assert (self.workdir / "features.xml").exists()
438444
445+ @pytest .mark .xfail (reason = "failures_issue_1544" )
439446 def test__get_dataset_qualities (self ):
440447 qualities = _get_dataset_qualities_file (self .workdir , 2 )
441448 assert isinstance (qualities , Path )
@@ -853,6 +860,7 @@ def test_create_invalid_dataset(self):
853860 param ["data" ] = data [0 ]
854861 self .assertRaises (ValueError , create_dataset , ** param )
855862
863+ @pytest .mark .xfail (reason = "failures_issue_1544" )
856864 def test_get_online_dataset_arff (self ):
857865 dataset_id = 100 # Australian
858866 # lazy loading not used as arff file is checked.
@@ -1332,6 +1340,7 @@ def test_list_qualities(self):
13321340 assert isinstance (qualities , list ) is True
13331341 assert all (isinstance (q , str ) for q in qualities ) is True
13341342
1343+ @pytest .mark .xfail (reason = "failures_issue_1544" )
13351344 def test_get_dataset_cache_format_pickle (self ):
13361345 dataset = openml .datasets .get_dataset (1 )
13371346 dataset .get_data ()
@@ -1347,6 +1356,7 @@ def test_get_dataset_cache_format_pickle(self):
13471356 assert len (categorical ) == X .shape [1 ]
13481357 assert len (attribute_names ) == X .shape [1 ]
13491358
1359+ @pytest .mark .xfail (reason = "failures_issue_1544" )
13501360 def test_get_dataset_cache_format_feather (self ):
13511361 # This test crashed due to using the parquet file by default, which is downloaded
13521362 # from minio. However, there is a mismatch between OpenML test server and minio IDs.
@@ -1523,6 +1533,7 @@ def test_list_datasets_with_high_size_parameter(self):
15231533 (None , None , ["wrong" , "sunny" ]),
15241534 ],
15251535)
1536+ @pytest .mark .xfail (reason = "failures_issue_1544" )
15261537def test_invalid_attribute_validations (
15271538 default_target_attribute ,
15281539 row_id_attribute ,
@@ -1584,6 +1595,7 @@ def test_invalid_attribute_validations(
15841595 (None , None , ["outlook" , "windy" ]),
15851596 ],
15861597)
1598+ @pytest .mark .xfail (reason = "failures_issue_1544" )
15871599def test_valid_attribute_validations (default_target_attribute , row_id_attribute , ignore_attribute ):
15881600 data = [
15891601 ["a" , "sunny" , 85.0 , 85.0 , "FALSE" , "no" ],
@@ -1802,6 +1814,7 @@ def test_list_datasets_by_number_instances(all_datasets: pd.DataFrame):
18021814 _assert_datasets_have_id_and_valid_status (small_datasets )
18031815
18041816
1817+ @pytest .mark .xfail (reason = "failures_issue_1544" )
18051818def test_list_datasets_by_number_features (all_datasets : pd .DataFrame ):
18061819 wide_datasets = openml .datasets .list_datasets (number_features = "50..100" )
18071820 assert 8 <= len (wide_datasets ) < len (all_datasets )
@@ -1814,12 +1827,14 @@ def test_list_datasets_by_number_classes(all_datasets: pd.DataFrame):
18141827 _assert_datasets_have_id_and_valid_status (five_class_datasets )
18151828
18161829
@pytest.mark.xfail(reason="failures_issue_1544")
def test_list_datasets_by_number_missing_values(all_datasets: pd.DataFrame):
    """Check listing datasets filtered with ``number_missing_values="5..100"``.

    The filtered listing must contain at least 5 entries and strictly fewer
    entries than the unfiltered ``all_datasets`` fixture, and must pass the
    shared id/status validation helper.

    Marked as an expected failure; the reason string points at issue 1544.
    """
    # NOTE(review): "5..100" presumably denotes an inclusive range - confirm
    # against the list_datasets documentation.
    filtered = openml.datasets.list_datasets(number_missing_values="5..100")

    n_filtered = len(filtered)
    assert n_filtered >= 5
    assert n_filtered < len(all_datasets)

    _assert_datasets_have_id_and_valid_status(filtered)
18211835
18221836
1837+ @pytest .mark .xfail (reason = "failures_issue_1544" )
18231838def test_list_datasets_combined_filters (all_datasets : pd .DataFrame ):
18241839 combined_filter_datasets = openml .datasets .list_datasets (
18251840 tag = "study_14" ,
@@ -1892,6 +1907,7 @@ def isolate_for_test():
18921907 ("with_data" , "with_qualities" , "with_features" ),
18931908 itertools .product ([True , False ], repeat = 3 ),
18941909)
1910+ @pytest .mark .xfail (reason = "failures_issue_1544" )
18951911def test_get_dataset_lazy_behavior (
18961912 isolate_for_test , with_data : bool , with_qualities : bool , with_features : bool
18971913):
0 commit comments