Skip to content
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
Show all changes
54 commits
Select commit Hold shift + click to select a range
f16ba08
minor fixes to usage.rst (#1090)
mfeurer May 31, 2021
6717e66
Add Windows to Github Action CI matrix (#1095)
PGijsbers Jun 16, 2021
2984403
Add ChunkedError to list of retry exception (#1118)
PGijsbers Oct 27, 2021
a6c0576
Always ignore MaxRetryError but log with warning (#1119)
PGijsbers Oct 27, 2021
b4c868a
Fix/1110 (#1117)
PGijsbers Oct 28, 2021
aed5010
Add AttributeError as suspect for dependency issue (#1121)
PGijsbers Nov 3, 2021
db7bb9a
Add CITATION.cff (#1120)
PGijsbers Jan 11, 2022
493511a
Precommit update (#1129)
PGijsbers Apr 14, 2022
99a62f6
Predictions (#1128)
PGijsbers Apr 19, 2022
c911d6d
Use GET instead of POST for flow exist (#1147)
PGijsbers Jun 28, 2022
c6fab8e
pre-commit update (#1150)
PGijsbers Jul 11, 2022
a8d96d5
Replace removed file with new target for download test (#1158)
PGijsbers Aug 16, 2022
ccb3e8e
Fix outdated docstring for list_tasks function (#1149)
chadmarchand Oct 6, 2022
9ce2a6b
Improve the error message on out-of-sync flow ids (#1171)
PGijsbers Oct 7, 2022
2ed77db
Add scikit-learn 1.0 and 1.1 values for test (#1168)
PGijsbers Oct 7, 2022
2fde8d5
Update Pipeline description for >=1.0 (#1170)
PGijsbers Oct 7, 2022
2ddae0f
Update URL to reflect new endpoint (#1172)
PGijsbers Oct 7, 2022
c17704e
Remove tests which only test scikit-learn functionality (#1169)
PGijsbers Oct 7, 2022
953f84e
fix nonetype error during print for tasks without class labels (#1148)
willcmartin Oct 7, 2022
6da0aac
Flow exists GET is deprecated, use POST (#1173)
PGijsbers Oct 10, 2022
22ee9cd
Test `get_parquet` on production server (#1174)
PGijsbers Oct 11, 2022
5cd6973
Refactor out different test cases to separate tests (#1176)
PGijsbers Oct 18, 2022
e6250fa
Provide clearer error when server provides bad data description XML (…
PGijsbers Oct 24, 2022
75fed8a
Update more sklearn tests (#1175)
PGijsbers Oct 24, 2022
f37ebbe
Remove dtype checking for prediction comparison (#1177)
PGijsbers Nov 24, 2022
a909a0c
feat(minio): Allow for proxies (#1184)
eddiebergman Nov 25, 2022
1dfe398
Update __version__.py (#1189)
PGijsbers Nov 25, 2022
580b536
Download all files (#1188)
PGijsbers Nov 25, 2022
5eb84ce
Skip tests that use arff reading optimization for typecheck (#1185)
PGijsbers Nov 25, 2022
467f6eb
Update configs (#1199)
PGijsbers Feb 20, 2023
dd62f2b
Update tests for sklearn 1.2, server issue (#1200)
PGijsbers Feb 20, 2023
2a7ab17
Version bump to dev and add changelog stub (#1190)
PGijsbers Feb 20, 2023
5f72e2e
Add: dependabot checks for workflow versions (#1155)
eddiebergman Feb 20, 2023
7d069a9
Change the cached file to reflect new standard #1188 (#1203)
PGijsbers Feb 21, 2023
23755bf
Bump actions/checkout from 2 to 3 (#1206)
dependabot[bot] Feb 21, 2023
603fe60
Update docker actions (#1211)
mfeurer Feb 22, 2023
17ff086
Support new numpy (#1215)
mfeurer Feb 23, 2023
d9850be
Allow unknown task types on the server (#1216)
mfeurer Feb 23, 2023
a968288
Mark sklearn tests (#1202)
PGijsbers Feb 23, 2023
beb598c
Bump actions/setup-python from 2 to 4 (#1212)
dependabot[bot] Feb 24, 2023
c590b3a
Make OpenMLTraceIteration a dataclass (#1201)
PGijsbers Feb 24, 2023
bbf09b3
Fix: correctly order the ground truth and prediction for ARFF files i…
LennartPurucker Feb 24, 2023
b84536a
Fix documentation building (#1217)
mfeurer Feb 24, 2023
5730669
Fix CI Python 3.6 (#1218)
mfeurer Feb 24, 2023
5b2ac46
Bump docker/setup-buildx-action from 1 to 2 (#1221)
dependabot[bot] Feb 24, 2023
5dcb7a3
Update run.py (#1194)
v-parmar Feb 24, 2023
687a0f1
Refactor if-statements (#1219)
PGijsbers Mar 1, 2023
c0a75bd
Ci python 38 (#1220)
mfeurer Mar 1, 2023
ce82fd5
Add summary of locally computed metrics to representation of run (#…
LennartPurucker Mar 1, 2023
c177d39
Better Error for Checksum Mismatch (#1225)
LennartPurucker Mar 4, 2023
24cbc5e
Fix coverage (#1226)
PGijsbers Mar 4, 2023
3c00d7b
Issue 1028: public delete functions for run, task, flow and database …
Mirkazemi Mar 21, 2023
7127e9c
Update changelog and version number for new release (#1230)
mfeurer Mar 22, 2023
bb3793d
Merge pull request #1233 from openml/main
mfeurer Mar 22, 2023
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Prev Previous commit
Next Next commit
Provide clearer error when server provides bad data description XML (#…
  • Loading branch information
PGijsbers authored Oct 24, 2022
commit e6250fa6e01b24e71ce1ab3720236fd5cbfc67f2
15 changes: 9 additions & 6 deletions openml/_api_calls.py
Original file line number Diff line number Diff line change
Expand Up @@ -23,6 +23,14 @@
)


def _create_url_from_endpoint(endpoint: str) -> str:
url = config.server
if not url.endswith("/"):
url += "/"
url += endpoint
return url.replace("=", "%3d")


def _perform_api_call(call, request_method, data=None, file_elements=None):
"""
Perform an API call at the OpenML server.
Expand Down Expand Up @@ -50,12 +58,7 @@ def _perform_api_call(call, request_method, data=None, file_elements=None):
return_value : str
Return value of the OpenML server
"""
url = config.server
if not url.endswith("/"):
url += "/"
url += call

url = url.replace("=", "%3d")
url = _create_url_from_endpoint(call)
logging.info("Starting [%s] request for the URL %s", request_method, url)
start = time.time()

Expand Down
12 changes: 9 additions & 3 deletions openml/datasets/functions.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,7 @@
import io
import logging
import os
from pyexpat import ExpatError
from typing import List, Dict, Union, Optional, cast

import numpy as np
Expand All @@ -19,6 +20,7 @@
from .dataset import OpenMLDataset
from ..exceptions import (
OpenMLHashException,
OpenMLServerError,
OpenMLServerException,
OpenMLPrivateDatasetError,
)
Expand Down Expand Up @@ -437,7 +439,7 @@ def get_dataset(
parquet_file = None
remove_dataset_cache = False
except OpenMLServerException as e:
# if there was an exception,
# if there was an exception
# check if the user had access to the dataset
if e.code == 112:
raise OpenMLPrivateDatasetError(e.message) from None
Expand Down Expand Up @@ -949,14 +951,18 @@ def _get_dataset_description(did_cache_dir, dataset_id):
try:
with io.open(description_file, encoding="utf8") as fh:
dataset_xml = fh.read()
description = xmltodict.parse(dataset_xml)["oml:data_set_description"]
except Exception:
url_extension = "data/{}".format(dataset_id)
dataset_xml = openml._api_calls._perform_api_call(url_extension, "get")
try:
description = xmltodict.parse(dataset_xml)["oml:data_set_description"]
except ExpatError as e:
url = openml._api_calls._create_url_from_endpoint(url_extension)
raise OpenMLServerError(f"Dataset description XML at '{url}' is malformed.") from e
with io.open(description_file, "w", encoding="utf8") as fh:
fh.write(dataset_xml)

description = xmltodict.parse(dataset_xml)["oml:data_set_description"]

return description


Expand Down
2 changes: 1 addition & 1 deletion tests/test_datasets/test_dataset_functions.py
Original file line number Diff line number Diff line change
Expand Up @@ -1240,7 +1240,7 @@ def _wait_for_dataset_being_processed(self, dataset_id):
try:
downloaded_dataset = openml.datasets.get_dataset(dataset_id)
break
except Exception as e:
except OpenMLServerException as e:
# returned code 273: Dataset not processed yet
# returned code 362: No qualities found
TestBase.logger.error(
Expand Down