Skip to content

Commit 406205a

Browse files
committed
mark xfail
1 parent 5a840c8 commit 406205a

8 files changed

Lines changed: 37 additions & 0 deletions

File tree

tests/test_datasets/test_dataset_functions.py

Lines changed: 16 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -244,6 +244,7 @@ def test_get_datasets(self):
244244
assert len(datasets) == 2
245245
_assert_datasets_retrieved_successfully([1, 2])
246246

247+
@pytest.mark.xfail(reason="failures_issue_1544")
247248
def test_get_dataset_by_name(self):
248249
dataset = openml.datasets.get_dataset("anneal")
249250
assert type(dataset) == OpenMLDataset
@@ -262,6 +263,7 @@ def test_get_dataset_download_all_files(self):
262263
# test_get_dataset_lazy
263264
raise NotImplementedError
264265

266+
@pytest.mark.xfail(reason="failures_issue_1544")
265267
def test_get_dataset_uint8_dtype(self):
266268
dataset = openml.datasets.get_dataset(1)
267269
assert type(dataset) == OpenMLDataset
@@ -280,6 +282,7 @@ def test_dataset_by_name_cannot_access_private_data(self):
280282
self.use_production_server()
281283
self.assertRaises(OpenMLPrivateDatasetError, openml.datasets.get_dataset, "NAME_GOES_HERE")
282284

285+
@pytest.mark.xfail(reason="failures_issue_1544")
283286
def test_get_dataset_lazy_all_functions(self):
284287
"""Test that all expected functionality is available without downloading the dataset."""
285288
dataset = openml.datasets.get_dataset(1)
@@ -309,6 +312,7 @@ def ensure_absence_of_real_data():
309312
assert classes == ["1", "2", "3", "4", "5", "U"]
310313
ensure_absence_of_real_data()
311314

315+
@pytest.mark.xfail(reason="failures_issue_1544")
312316
def test_get_dataset_sparse(self):
313317
dataset = openml.datasets.get_dataset(102)
314318
X, *_ = dataset.get_data()
@@ -327,6 +331,7 @@ def test__get_dataset_description(self):
327331
description_xml_path = os.path.join(self.workdir, "description.xml")
328332
assert os.path.exists(description_xml_path)
329333

334+
@pytest.mark.xfail(reason="failures_issue_1544")
330335
def test__getarff_path_dataset_arff(self):
331336
openml.config.set_root_cache_directory(self.static_cache_dir)
332337
description = _get_dataset_description(self.workdir, 2)
@@ -430,12 +435,14 @@ def test__getarff_md5_issue(self):
430435

431436
openml.config.connection_n_retries = n
432437

438+
@pytest.mark.xfail(reason="failures_issue_1544")
433439
def test__get_dataset_features(self):
434440
features_file = _get_dataset_features_file(self.workdir, 2)
435441
assert isinstance(features_file, Path)
436442
features_xml_path = self.workdir / "features.xml"
437443
assert features_xml_path.exists()
438444

445+
@pytest.mark.xfail(reason="failures_issue_1544")
439446
def test__get_dataset_qualities(self):
440447
qualities = _get_dataset_qualities_file(self.workdir, 2)
441448
assert isinstance(qualities, Path)
@@ -853,6 +860,7 @@ def test_create_invalid_dataset(self):
853860
param["data"] = data[0]
854861
self.assertRaises(ValueError, create_dataset, **param)
855862

863+
@pytest.mark.xfail(reason="failures_issue_1544")
856864
def test_get_online_dataset_arff(self):
857865
dataset_id = 100 # Australian
858866
# lazy loading not used as arff file is checked.
@@ -1332,6 +1340,7 @@ def test_list_qualities(self):
13321340
assert isinstance(qualities, list) is True
13331341
assert all(isinstance(q, str) for q in qualities) is True
13341342

1343+
@pytest.mark.xfail(reason="failures_issue_1544")
13351344
def test_get_dataset_cache_format_pickle(self):
13361345
dataset = openml.datasets.get_dataset(1)
13371346
dataset.get_data()
@@ -1347,6 +1356,7 @@ def test_get_dataset_cache_format_pickle(self):
13471356
assert len(categorical) == X.shape[1]
13481357
assert len(attribute_names) == X.shape[1]
13491358

1359+
@pytest.mark.xfail(reason="failures_issue_1544")
13501360
def test_get_dataset_cache_format_feather(self):
13511361
# This test crashed due to using the parquet file by default, which is downloaded
13521362
# from minio. However, there is a mismatch between OpenML test server and minio IDs.
@@ -1523,6 +1533,7 @@ def test_list_datasets_with_high_size_parameter(self):
15231533
(None, None, ["wrong", "sunny"]),
15241534
],
15251535
)
1536+
@pytest.mark.xfail(reason="failures_issue_1544")
15261537
def test_invalid_attribute_validations(
15271538
default_target_attribute,
15281539
row_id_attribute,
@@ -1584,6 +1595,7 @@ def test_invalid_attribute_validations(
15841595
(None, None, ["outlook", "windy"]),
15851596
],
15861597
)
1598+
@pytest.mark.xfail(reason="failures_issue_1544")
15871599
def test_valid_attribute_validations(default_target_attribute, row_id_attribute, ignore_attribute):
15881600
data = [
15891601
["a", "sunny", 85.0, 85.0, "FALSE", "no"],
@@ -1802,6 +1814,7 @@ def test_list_datasets_by_number_instances(all_datasets: pd.DataFrame):
18021814
_assert_datasets_have_id_and_valid_status(small_datasets)
18031815

18041816

1817+
@pytest.mark.xfail(reason="failures_issue_1544")
18051818
def test_list_datasets_by_number_features(all_datasets: pd.DataFrame):
18061819
wide_datasets = openml.datasets.list_datasets(number_features="50..100")
18071820
assert 8 <= len(wide_datasets) < len(all_datasets)
@@ -1814,12 +1827,14 @@ def test_list_datasets_by_number_classes(all_datasets: pd.DataFrame):
18141827
_assert_datasets_have_id_and_valid_status(five_class_datasets)
18151828

18161829

1830+
@pytest.mark.xfail(reason="failures_issue_1544")
18171831
def test_list_datasets_by_number_missing_values(all_datasets: pd.DataFrame):
18181832
na_datasets = openml.datasets.list_datasets(number_missing_values="5..100")
18191833
assert 5 <= len(na_datasets) < len(all_datasets)
18201834
_assert_datasets_have_id_and_valid_status(na_datasets)
18211835

18221836

1837+
@pytest.mark.xfail(reason="failures_issue_1544")
18231838
def test_list_datasets_combined_filters(all_datasets: pd.DataFrame):
18241839
combined_filter_datasets = openml.datasets.list_datasets(
18251840
tag="study_14",
@@ -1892,6 +1907,7 @@ def isolate_for_test():
18921907
("with_data", "with_qualities", "with_features"),
18931908
itertools.product([True, False], repeat=3),
18941909
)
1910+
@pytest.mark.xfail(reason="failures_issue_1544")
18951911
def test_get_dataset_lazy_behavior(
18961912
isolate_for_test, with_data: bool, with_qualities: bool, with_features: bool
18971913
):

tests/test_runs/test_run_functions.py

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1695,6 +1695,7 @@ def test_format_prediction_non_supervised(self):
16951695
):
16961696
format_prediction(clustering, *ignored_input)
16971697

1698+
@pytest.mark.xfail(reason="failures_issue_1544")
16981699
def test_format_prediction_classification_no_probabilities(self):
16991700
classification = openml.tasks.get_task(
17001701
self.TEST_SERVER_TASK_SIMPLE["task_id"],
@@ -1704,6 +1705,7 @@ def test_format_prediction_classification_no_probabilities(self):
17041705
with pytest.raises(ValueError, match="`proba` is required for classification task"):
17051706
format_prediction(classification, *ignored_input, proba=None)
17061707

1708+
@pytest.mark.xfail(reason="failures_issue_1544")
17071709
def test_format_prediction_classification_incomplete_probabilities(self):
17081710
classification = openml.tasks.get_task(
17091711
self.TEST_SERVER_TASK_SIMPLE["task_id"],
@@ -1714,6 +1716,7 @@ def test_format_prediction_classification_incomplete_probabilities(self):
17141716
with pytest.raises(ValueError, match="Each class should have a predicted probability"):
17151717
format_prediction(classification, *ignored_input, proba=incomplete_probabilities)
17161718

1719+
@pytest.mark.xfail(reason="failures_issue_1544")
17171720
def test_format_prediction_task_without_classlabels_set(self):
17181721
classification = openml.tasks.get_task(
17191722
self.TEST_SERVER_TASK_SIMPLE["task_id"],
@@ -1724,6 +1727,7 @@ def test_format_prediction_task_without_classlabels_set(self):
17241727
with pytest.raises(ValueError, match="The classification task must have class labels set"):
17251728
format_prediction(classification, *ignored_input, proba={})
17261729

1730+
@pytest.mark.xfail(reason="failures_issue_1544")
17271731
def test_format_prediction_task_learning_curve_sample_not_set(self):
17281732
learning_curve = openml.tasks.get_task(801, download_data=False) # diabetes;crossvalidation
17291733
probabilities = {c: 0.2 for c in learning_curve.class_labels}

tests/test_setups/test_setup_functions.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -166,6 +166,7 @@ def test_list_setups_output_format(self):
166166
assert isinstance(setups, pd.DataFrame)
167167
assert len(setups) == 10
168168

169+
@pytest.mark.xfail(reason="failures_issue_1544")
169170
def test_setuplist_offset(self):
170171
size = 10
171172
setups = openml.setups.list_setups(offset=0, size=size)

tests/test_study/test_study_functions.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -148,6 +148,7 @@ def test_publish_empty_study_implicit(self):
148148
self._test_publish_empty_study_is_allowed(explicit=False)
149149

150150
@pytest.mark.flaky()
151+
@pytest.mark.xfail(reason="failures_issue_1544")
151152
def test_publish_study(self):
152153
# get some random runs to attach
153154
run_list = openml.evaluations.list_evaluations("predictive_accuracy", size=10)
@@ -217,6 +218,7 @@ def test_publish_study(self):
217218
res = openml.study.delete_study(study.id)
218219
assert res
219220

221+
@pytest.mark.xfail(reason="failures_issue_1544")
220222
def test_study_attach_illegal(self):
221223
run_list = openml.runs.list_runs(size=10)
222224
assert len(run_list) == 10

tests/test_tasks/test_classification_task.py

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -18,19 +18,22 @@ def setUp(self, n_levels: int = 1):
1818
self.task_type = TaskType.SUPERVISED_CLASSIFICATION
1919
self.estimation_procedure = 5
2020

21+
@pytest.mark.xfail(reason="failures_issue_1544")
2122
def test_download_task(self):
2223
task = super().test_download_task()
2324
assert task.task_id == self.task_id
2425
assert task.task_type_id == TaskType.SUPERVISED_CLASSIFICATION
2526
assert task.dataset_id == 20
2627
assert task.estimation_procedure_id == self.estimation_procedure
2728

29+
@pytest.mark.xfail(reason="failures_issue_1544")
2830
def test_class_labels(self):
2931
task = get_task(self.task_id)
3032
assert task.class_labels == ["tested_negative", "tested_positive"]
3133

3234

3335
@pytest.mark.server()
36+
@pytest.mark.xfail(reason="failures_issue_1544")
3437
def test_get_X_and_Y():
3538
task = get_task(119)
3639
X, Y = task.get_X_and_y()

tests/test_tasks/test_learning_curve_task.py

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,7 @@
22
from __future__ import annotations
33

44
import pandas as pd
5+
import pytest
56

67
from openml.tasks import TaskType, get_task
78

@@ -17,6 +18,7 @@ def setUp(self, n_levels: int = 1):
1718
self.task_type = TaskType.LEARNING_CURVE
1819
self.estimation_procedure = 13
1920

21+
@pytest.mark.xfail(reason="failures_issue_1544")
2022
def test_get_X_and_Y(self):
2123
X, Y = super().test_get_X_and_Y()
2224
assert X.shape == (768, 8)
@@ -25,12 +27,14 @@ def test_get_X_and_Y(self):
2527
assert isinstance(Y, pd.Series)
2628
assert pd.api.types.is_categorical_dtype(Y)
2729

30+
@pytest.mark.xfail(reason="failures_issue_1544")
2831
def test_download_task(self):
2932
task = super().test_download_task()
3033
assert task.task_id == self.task_id
3134
assert task.task_type_id == TaskType.LEARNING_CURVE
3235
assert task.dataset_id == 20
3336

37+
@pytest.mark.xfail(reason="failures_issue_1544")
3438
def test_class_labels(self):
3539
task = get_task(self.task_id)
3640
assert task.class_labels == ["tested_negative", "tested_positive"]

tests/test_tasks/test_regression_task.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -4,6 +4,7 @@
44
import ast
55

66
import pandas as pd
7+
import pytest
78

89
import openml
910
from openml.exceptions import OpenMLServerException
@@ -48,6 +49,7 @@ def setUp(self, n_levels: int = 1):
4849
self.task_type = TaskType.SUPERVISED_REGRESSION
4950

5051

52+
@pytest.mark.xfail(reason="failures_issue_1544")
5153
def test_get_X_and_Y(self):
5254
X, Y = super().test_get_X_and_Y()
5355
assert X.shape == (194, 32)

tests/test_tasks/test_task_functions.py

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -100,6 +100,7 @@ def test_list_tasks(self):
100100
for task in tasks.to_dict(orient="index").values():
101101
self._check_task(task)
102102

103+
@pytest.mark.xfail(reason="failures_issue_1544")
103104
def test_list_tasks_paginate(self):
104105
size = 10
105106
max = 100
@@ -139,6 +140,7 @@ def test__get_task_live(self):
139140
# https://github.com/openml/openml-python/issues/378
140141
openml.tasks.get_task(34536)
141142

143+
@pytest.mark.xfail(reason="failures_issue_1544")
142144
def test_get_task(self):
143145
task = openml.tasks.get_task(1, download_data=True) # anneal; crossvalidation
144146
assert isinstance(task, OpenMLTask)
@@ -152,6 +154,7 @@ def test_get_task(self):
152154
os.path.join(self.workdir, "org", "openml", "test", "datasets", "1", "dataset.arff")
153155
)
154156

157+
@pytest.mark.xfail(reason="failures_issue_1544")
155158
def test_get_task_lazy(self):
156159
task = openml.tasks.get_task(2, download_data=False) # anneal; crossvalidation
157160
assert isinstance(task, OpenMLTask)
@@ -191,6 +194,7 @@ def assert_and_raise(*args, **kwargs):
191194
# Now the file should no longer exist
192195
assert not os.path.exists(os.path.join(os.getcwd(), "tasks", "1", "tasks.xml"))
193196

197+
@pytest.mark.xfail(reason="failures_issue_1544")
194198
def test_get_task_with_cache(self):
195199
openml.config.set_root_cache_directory(self.static_cache_dir)
196200
task = openml.tasks.get_task(1)
@@ -206,6 +210,7 @@ def test_get_task_different_types(self):
206210
# Issue 538, get_task failing with clustering task.
207211
openml.tasks.functions.get_task(126033)
208212

213+
@pytest.mark.xfail(reason="failures_issue_1544")
209214
def test_download_split(self):
210215
task = openml.tasks.get_task(1) # anneal; crossvalidation
211216
split = task.download_split()

0 commit comments

Comments
 (0)