From 0159f474c6bbc15f20d52bc946bd252bd852b196 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Tue, 30 Dec 2025 09:11:27 +0500
Subject: [PATCH 01/34] set up folder structure and base code

---
 openml/_api/__init__.py           |   8 +++
 openml/_api/config.py             |   5 ++
 openml/_api/http/__init__.py      |   1 +
 openml/_api/http/client.py        |  23 ++++++
 openml/_api/http/utils.py         |   0
 openml/_api/resources/__init__.py |   2 +
 openml/_api/resources/base.py     |  22 ++++++
 openml/_api/resources/datasets.py |  13 ++++
 openml/_api/resources/tasks.py    | 113 ++++++++++++++++++++++++++++++
 openml/_api/runtime/core.py       |  58 +++++++++++++++
 openml/_api/runtime/fallback.py   |   5 ++
 openml/tasks/functions.py         |   8 ++-
 12 files changed, 255 insertions(+), 3 deletions(-)
 create mode 100644 openml/_api/__init__.py
 create mode 100644 openml/_api/config.py
 create mode 100644 openml/_api/http/__init__.py
 create mode 100644 openml/_api/http/client.py
 create mode 100644 openml/_api/http/utils.py
 create mode 100644 openml/_api/resources/__init__.py
 create mode 100644 openml/_api/resources/base.py
 create mode 100644 openml/_api/resources/datasets.py
 create mode 100644 openml/_api/resources/tasks.py
 create mode 100644 openml/_api/runtime/core.py
 create mode 100644 openml/_api/runtime/fallback.py

diff --git a/openml/_api/__init__.py b/openml/_api/__init__.py
new file mode 100644
index 000000000..5089f94dd
--- /dev/null
+++ b/openml/_api/__init__.py
@@ -0,0 +1,8 @@
+from openml._api.runtime.core import APIContext
+
+
+def set_api_version(version: str, strict=False):
+    api_context.set_version(version=version, strict=strict)
+
+
+api_context = APIContext()
diff --git a/openml/_api/config.py b/openml/_api/config.py
new file mode 100644
index 000000000..bd93c3cad
--- /dev/null
+++ b/openml/_api/config.py
@@ -0,0 +1,5 @@
+from __future__ import annotations
+
+API_V1_SERVER = "https://www.openml.org/api/v1/xml"
+API_V2_SERVER = "http://127.0.0.1:8001"
+API_KEY = "..."
diff --git a/openml/_api/http/__init__.py b/openml/_api/http/__init__.py
new file mode 100644
index 000000000..fde2a5b0a
--- /dev/null
+++ b/openml/_api/http/__init__.py
@@ -0,0 +1 @@
+from openml._api.http.client import HTTPClient
diff --git a/openml/_api/http/client.py b/openml/_api/http/client.py
new file mode 100644
index 000000000..81a9213e3
--- /dev/null
+++ b/openml/_api/http/client.py
@@ -0,0 +1,23 @@
+from __future__ import annotations
+
+import requests
+
+from openml.__version__ import __version__
+
+
+class HTTPClient:
+    def __init__(self, base_url: str):
+        self.base_url = base_url
+        self.headers = {"user-agent": f"openml-python/{__version__}"}
+
+    def get(self, path, params=None):
+        url = f"{self.base_url}/{path}"
+        return requests.get(url, params=params, headers=self.headers)
+
+    def post(self, path, data=None, files=None):
+        url = f"{self.base_url}/{path}"
+        return requests.post(url, data=data, files=files, headers=self.headers)
+
+    def delete(self, path, params=None):
+        url = f"{self.base_url}/{path}"
+        return requests.delete(url, params=params, headers=self.headers)
diff --git a/openml/_api/http/utils.py b/openml/_api/http/utils.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/openml/_api/resources/__init__.py b/openml/_api/resources/__init__.py
new file mode 100644
index 000000000..078fc5998
--- /dev/null
+++ b/openml/_api/resources/__init__.py
@@ -0,0 +1,2 @@
+from openml._api.resources.datasets import DatasetsV1, DatasetsV2
+from openml._api.resources.tasks import TasksV1, TasksV2
diff --git a/openml/_api/resources/base.py b/openml/_api/resources/base.py
new file mode 100644
index 000000000..1fae27665
--- /dev/null
+++ b/openml/_api/resources/base.py
@@ -0,0 +1,22 @@
+from __future__ import annotations
+
+from abc import ABC, abstractmethod
+from typing import TYPE_CHECKING
+
+if TYPE_CHECKING:
+    from openml._api.http import HTTPClient
+
+
+class ResourceAPI:
+    def __init__(self, http: HTTPClient):
+        self._http = http
+
+
+class DatasetsAPI(ResourceAPI, ABC):
+    @abstractmethod
+    def get(self, id: int) -> dict: ...
+
+
+class TasksAPI(ResourceAPI, ABC):
+    @abstractmethod
+    def get(self, id: int) -> dict: ...
diff --git a/openml/_api/resources/datasets.py b/openml/_api/resources/datasets.py
new file mode 100644
index 000000000..cd1bb595a
--- /dev/null
+++ b/openml/_api/resources/datasets.py
@@ -0,0 +1,13 @@
+from __future__ import annotations
+
+from openml._api.resources.base import DatasetsAPI
+
+
+class DatasetsV1(DatasetsAPI):
+    def get(self, id):
+        pass
+
+
+class DatasetsV2(DatasetsAPI):
+    def get(self, id):
+        pass
diff --git a/openml/_api/resources/tasks.py b/openml/_api/resources/tasks.py
new file mode 100644
index 000000000..b0e9afbf8
--- /dev/null
+++ b/openml/_api/resources/tasks.py
@@ -0,0 +1,113 @@
+from __future__ import annotations
+
+import xmltodict
+
+from openml._api.resources.base import TasksAPI
+from openml.tasks.task import (
+    OpenMLClassificationTask,
+    OpenMLClusteringTask,
+    OpenMLLearningCurveTask,
+    OpenMLRegressionTask,
+    OpenMLTask,
+    TaskType,
+)
+
+
+class TasksV1(TasksAPI):
+    def get(self, id, return_response=False):
+        path = f"task/{id}"
+        response = self._http.get(path)
+        xml_content = response.content
+        task = self._create_task_from_xml(xml_content)
+
+        if return_response:
+            return task, response
+
+        return task
+
+    def _create_task_from_xml(self, xml: str) -> OpenMLTask:
+        """Create a task given a xml string.
+
+        Parameters
+        ----------
+        xml : string
+            Task xml representation.
+
+        Returns
+        -------
+        OpenMLTask
+        """
+        dic = xmltodict.parse(xml)["oml:task"]
+        estimation_parameters = {}
+        inputs = {}
+        # Due to the unordered structure we obtain, we first have to extract
+        # the possible keys of oml:input; dic["oml:input"] is a list of
+        # OrderedDicts
+
+        # Check if there is a list of inputs
+        if isinstance(dic["oml:input"], list):
+            for input_ in dic["oml:input"]:
+                name = input_["@name"]
+                inputs[name] = input_
+        # Single input case
+        elif isinstance(dic["oml:input"], dict):
+            name = dic["oml:input"]["@name"]
+            inputs[name] = dic["oml:input"]
+
+        evaluation_measures = None
+        if "evaluation_measures" in inputs:
+            evaluation_measures = inputs["evaluation_measures"]["oml:evaluation_measures"][
+                "oml:evaluation_measure"
+            ]
+
+        task_type = TaskType(int(dic["oml:task_type_id"]))
+        common_kwargs = {
+            "task_id": dic["oml:task_id"],
+            "task_type": dic["oml:task_type"],
+            "task_type_id": task_type,
+            "data_set_id": inputs["source_data"]["oml:data_set"]["oml:data_set_id"],
+            "evaluation_measure": evaluation_measures,
+        }
+        # TODO: add OpenMLClusteringTask?
+        if task_type in (
+            TaskType.SUPERVISED_CLASSIFICATION,
+            TaskType.SUPERVISED_REGRESSION,
+            TaskType.LEARNING_CURVE,
+        ):
+            # Convert some more parameters
+            for parameter in inputs["estimation_procedure"]["oml:estimation_procedure"][
+                "oml:parameter"
+            ]:
+                name = parameter["@name"]
+                text = parameter.get("#text", "")
+                estimation_parameters[name] = text
+
+            common_kwargs["estimation_procedure_type"] = inputs["estimation_procedure"][
+                "oml:estimation_procedure"
+            ]["oml:type"]
+            common_kwargs["estimation_procedure_id"] = int(
+                inputs["estimation_procedure"]["oml:estimation_procedure"]["oml:id"]
+            )
+
+            common_kwargs["estimation_parameters"] = estimation_parameters
+            common_kwargs["target_name"] = inputs["source_data"]["oml:data_set"][
+                "oml:target_feature"
+            ]
+            common_kwargs["data_splits_url"] = inputs["estimation_procedure"][
+                "oml:estimation_procedure"
+            ]["oml:data_splits_url"]
+
+        cls = {
+            TaskType.SUPERVISED_CLASSIFICATION: OpenMLClassificationTask,
+            TaskType.SUPERVISED_REGRESSION: OpenMLRegressionTask,
+            TaskType.CLUSTERING: OpenMLClusteringTask,
+            TaskType.LEARNING_CURVE: OpenMLLearningCurveTask,
+        }.get(task_type)
+        if cls is None:
+            raise NotImplementedError(f"Task type {common_kwargs['task_type']} not supported.")
+        return cls(**common_kwargs)  # type: ignore
+
+
+class TasksV2(TasksAPI):
+    def get(self, id):
+        pass
diff --git a/openml/_api/runtime/core.py b/openml/_api/runtime/core.py
new file mode 100644
index 000000000..80f35587c
--- /dev/null
+++ b/openml/_api/runtime/core.py
@@ -0,0 +1,58 @@
+from __future__ import annotations
+
+from openml._api.config import (
+    API_V1_SERVER,
+    API_V2_SERVER,
+)
+from openml._api.http.client import HTTPClient
+from openml._api.resources import (
+    DatasetsV1,
+    DatasetsV2,
+    TasksV1,
+    TasksV2,
+)
+from openml._api.runtime.fallback import FallbackProxy
+
+
+class APIBackend:
+    def __init__(self, *, datasets, tasks):
+        self.datasets = datasets
+        self.tasks = tasks
+
+
+def build_backend(version: str, strict: bool) -> APIBackend:
+    v1_http = HTTPClient(API_V1_SERVER)
+    v2_http = HTTPClient(API_V2_SERVER)
+
+    v1 = APIBackend(
+        datasets=DatasetsV1(v1_http),
+        tasks=TasksV1(v1_http),
+    )
+
+    if version == "v1":
+        return v1
+
+    v2 = APIBackend(
+        datasets=DatasetsV2(v2_http),
+        tasks=TasksV2(v2_http),
+    )
+
+    if strict:
+        return v2
+
+    return APIBackend(
+        datasets=FallbackProxy(v2.datasets, v1.datasets),
+        tasks=FallbackProxy(v2.tasks, v1.tasks),
+    )
+
+
+class APIContext:
+    def __init__(self):
+        self._backend = build_backend("v1", strict=False)
+
+    def set_version(self, version: str, strict: bool = False):
+        self._backend = build_backend(version, strict)
+
+    @property
+    def backend(self):
+        return self._backend
diff --git a/openml/_api/runtime/fallback.py b/openml/_api/runtime/fallback.py
new file mode 100644
index 000000000..56e96a966
--- /dev/null
+++ b/openml/_api/runtime/fallback.py
@@ -0,0 +1,5 @@
+from __future__ import annotations
+
+
+class FallbackProxy:
+    pass
diff --git a/openml/tasks/functions.py b/openml/tasks/functions.py
index d2bf5e946..91be65965 100644
--- a/openml/tasks/functions.py
+++ b/openml/tasks/functions.py
@@ -12,6 +12,7 @@
 
 import openml._api_calls
 import openml.utils
+from openml._api import api_context
 from openml.datasets import get_dataset
 from openml.exceptions import OpenMLCacheException
 
@@ -442,11 +443,12 @@ def _get_task_description(task_id: int) -> OpenMLTask:
     except OpenMLCacheException:
         _cache_dir = openml.utils._create_cache_directory_for_id(TASKS_CACHE_DIR_NAME, task_id)
         xml_file = _cache_dir / "task.xml"
-        task_xml = openml._api_calls._perform_api_call("task/%d" % task_id, "get")
+        task, response = api_context.backend.tasks.get(task_id, return_response=True)
 
         with xml_file.open("w", encoding="utf8") as fh:
-            fh.write(task_xml)
-        return _create_task_from_xml(task_xml)
+            fh.write(response.text)
+
+        return task
 
 
 def _create_task_from_xml(xml: str) -> OpenMLTask:

From 52ef37999fad8509e5e85b8512e442bd9dc69e04 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Mon, 5 Jan 2026 12:48:58 +0500
Subject: [PATCH 02/34] fix pre-commit

---
 openml/_api/__init__.py           |  2 +-
 openml/_api/http/__init__.py      |  2 ++
 openml/_api/http/client.py        | 32 +++++++++++++++++++++++--------
 openml/_api/resources/__init__.py |  2 ++
 openml/_api/resources/base.py     | 13 +++++++++++--
 openml/_api/resources/datasets.py | 15 +++++++++++----
 openml/_api/resources/tasks.py    | 25 +++++++++++++++++++-----
 openml/_api/runtime/__init__.py   |  0
 openml/_api/runtime/core.py       | 23 +++++++++++-----------
 openml/_api/runtime/fallback.py   |  9 ++++++++-
 openml/tasks/functions.py         | 12 ++++++++----
 11 files changed, 99 insertions(+), 36 deletions(-)
 create mode 100644 openml/_api/runtime/__init__.py

diff --git a/openml/_api/__init__.py b/openml/_api/__init__.py
index 5089f94dd..881f40671 100644
--- a/openml/_api/__init__.py
+++ b/openml/_api/__init__.py
@@ -1,7 +1,7 @@
 from openml._api.runtime.core import APIContext
 
 
-def set_api_version(version: str, strict=False):
+def set_api_version(version: str, *, strict: bool = False) -> None:
     api_context.set_version(version=version, strict=strict)
 
 
diff --git a/openml/_api/http/__init__.py b/openml/_api/http/__init__.py
index fde2a5b0a..8e6d1e4ce 100644
--- a/openml/_api/http/__init__.py
+++ b/openml/_api/http/__init__.py
@@ -1 +1,3 @@
 from openml._api.http.client import HTTPClient
+
+__all__ = ["HTTPClient"]
diff --git a/openml/_api/http/client.py b/openml/_api/http/client.py
index 81a9213e3..dea5de809 100644
--- a/openml/_api/http/client.py
+++ b/openml/_api/http/client.py
@@ -1,23 +1,39 @@
 from __future__ import annotations
 
+from typing import Any, Mapping
+
 import requests
+from requests import Response
 
 from openml.__version__ import __version__
 
 
 class HTTPClient:
-    def __init__(self, base_url: str):
+    def __init__(self, base_url: str) -> None:
         self.base_url = base_url
-        self.headers = {"user-agent": f"openml-python/{__version__}"}
+        self.headers: dict[str, str] = {"user-agent": f"openml-python/{__version__}"}
 
-    def get(self, path, params=None):
+    def get(
+        self,
+        path: str,
+        params: Mapping[str, Any] | None = None,
+    ) -> Response:
         url = f"{self.base_url}/{path}"
-        return requests.get(url, params=params, headers=self.headers)
+        return requests.get(url, params=params, headers=self.headers, timeout=10)
 
-    def post(self, path, data=None, files=None):
+    def post(
+        self,
+        path: str,
+        data: Mapping[str, Any] | None = None,
+        files: Any = None,
+    ) -> Response:
         url = f"{self.base_url}/{path}"
-        return requests.post(url, data=data, files=files, headers=self.headers)
+        return requests.post(url, data=data, files=files, headers=self.headers, timeout=10)
 
-    def delete(self, path, params=None):
+    def delete(
+        self,
+        path: str,
+        params: Mapping[str, Any] | None = None,
+    ) -> Response:
         url = f"{self.base_url}/{path}"
-        return requests.delete(url, params=params, headers=self.headers)
+        return requests.delete(url, params=params, headers=self.headers, timeout=10)
diff --git a/openml/_api/resources/__init__.py b/openml/_api/resources/__init__.py
index 078fc5998..b1af3c1a8 100644
--- a/openml/_api/resources/__init__.py
+++ b/openml/_api/resources/__init__.py
@@ -1,2 +1,4 @@
 from openml._api.resources.datasets import DatasetsV1, DatasetsV2
 from openml._api.resources.tasks import TasksV1, TasksV2
+
+__all__ = ["DatasetsV1", "DatasetsV2", "TasksV1", "TasksV2"]
diff --git a/openml/_api/resources/base.py b/openml/_api/resources/base.py
index 1fae27665..6fbf8977d 100644
--- a/openml/_api/resources/base.py
+++ b/openml/_api/resources/base.py
@@ -4,7 +4,11 @@
 from typing import TYPE_CHECKING
 
 if TYPE_CHECKING:
+    from requests import Response
+
     from openml._api.http import HTTPClient
+    from openml.datasets.dataset import OpenMLDataset
+    from openml.tasks.task import OpenMLTask
 
 
 class ResourceAPI:
@@ -14,9 +18,14 @@ def __init__(self, http: HTTPClient):
 
 class DatasetsAPI(ResourceAPI, ABC):
     @abstractmethod
-    def get(self, id: int) -> dict: ...
+    def get(self, dataset_id: int) -> OpenMLDataset | tuple[OpenMLDataset, Response]: ...
 
 
 class TasksAPI(ResourceAPI, ABC):
     @abstractmethod
-    def get(self, id: int) -> dict: ...
+    def get(
+        self,
+        task_id: int,
+        *,
+        return_response: bool = False,
+    ) -> OpenMLTask | tuple[OpenMLTask, Response]: ...
diff --git a/openml/_api/resources/datasets.py b/openml/_api/resources/datasets.py
index cd1bb595a..9ff1ec278 100644
--- a/openml/_api/resources/datasets.py
+++ b/openml/_api/resources/datasets.py
@@ -1,13 +1,20 @@
 from __future__ import annotations
 
+from typing import TYPE_CHECKING
+
 from openml._api.resources.base import DatasetsAPI
 
+if TYPE_CHECKING:
+    from responses import Response
+
+    from openml.datasets.dataset import OpenMLDataset
+
 
 class DatasetsV1(DatasetsAPI):
-    def get(self, id):
-        pass
+    def get(self, dataset_id: int) -> OpenMLDataset | tuple[OpenMLDataset, Response]:
+        raise NotImplementedError
 
 
 class DatasetsV2(DatasetsAPI):
-    def get(self, id):
-        pass
+    def get(self, dataset_id: int) -> OpenMLDataset | tuple[OpenMLDataset, Response]:
+        raise NotImplementedError
diff --git a/openml/_api/resources/tasks.py b/openml/_api/resources/tasks.py
index b0e9afbf8..f494fb9a3 100644
--- a/openml/_api/resources/tasks.py
+++ b/openml/_api/resources/tasks.py
@@ -1,5 +1,7 @@
 from __future__ import annotations
 
+from typing import TYPE_CHECKING
+
 import xmltodict
 
 from openml._api.resources.base import TasksAPI
@@ -12,12 +14,20 @@
     TaskType,
 )
 
+if TYPE_CHECKING:
+    from requests import Response
+
 
 class TasksV1(TasksAPI):
-    def get(self, id, return_response=False):
-        path = f"task/{id}"
+    def get(
+        self,
+        task_id: int,
+        *,
+        return_response: bool = False,
+    ) -> OpenMLTask | tuple[OpenMLTask, Response]:
+        path = f"task/{task_id}"
         response = self._http.get(path)
-        xml_content = response.content
+        xml_content = response.text
         task = self._create_task_from_xml(xml_content)
 
         if return_response:
@@ -109,5 +119,10 @@ def _create_task_from_xml(self, xml: str) -> OpenMLTask:
 
 
 class TasksV2(TasksAPI):
-    def get(self, id):
-        pass
+    def get(
+        self,
+        task_id: int,
+        *,
+        return_response: bool = False,
+    ) -> OpenMLTask | tuple[OpenMLTask, Response]:
+        raise NotImplementedError
diff --git a/openml/_api/runtime/__init__.py b/openml/_api/runtime/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/openml/_api/runtime/core.py b/openml/_api/runtime/core.py
index 80f35587c..aa09a69db 100644
--- a/openml/_api/runtime/core.py
+++ b/openml/_api/runtime/core.py
@@ -1,5 +1,7 @@
 from __future__ import annotations
 
+from typing import TYPE_CHECKING
+
 from openml._api.config import (
     API_V1_SERVER,
     API_V2_SERVER,
@@ -11,16 +13,18 @@
     TasksV1,
     TasksV2,
 )
-from openml._api.runtime.fallback import FallbackProxy
+
+if TYPE_CHECKING:
+    from openml._api.resources.base import DatasetsAPI, TasksAPI
 
 
 class APIBackend:
-    def __init__(self, *, datasets, tasks):
+    def __init__(self, *, datasets: DatasetsAPI, tasks: TasksAPI):
         self.datasets = datasets
         self.tasks = tasks
 
 
-def build_backend(version: str, strict: bool) -> APIBackend:
+def build_backend(version: str, *, strict: bool) -> APIBackend:
     v1_http = HTTPClient(API_V1_SERVER)
     v2_http = HTTPClient(API_V2_SERVER)
 
@@ -40,19 +44,16 @@ def build_backend(version: str, strict: bool) -> APIBackend:
     if strict:
         return v2
 
-    return APIBackend(
-        datasets=FallbackProxy(v2.datasets, v1.datasets),
-        tasks=FallbackProxy(v2.tasks, v1.tasks),
-    )
+    return v1
 
 
 class APIContext:
-    def __init__(self):
+    def __init__(self) -> None:
         self._backend = build_backend("v1", strict=False)
 
-    def set_version(self, version: str, strict: bool = False):
-        self._backend = build_backend(version, strict)
+    def set_version(self, version: str, *, strict: bool = False) -> None:
+        self._backend = build_backend(version=version, strict=strict)
 
     @property
-    def backend(self):
+    def backend(self) -> APIBackend:
         return self._backend
diff --git a/openml/_api/runtime/fallback.py b/openml/_api/runtime/fallback.py
index 56e96a966..1bc99d270 100644
--- a/openml/_api/runtime/fallback.py
+++ b/openml/_api/runtime/fallback.py
@@ -1,5 +1,12 @@
 from __future__ import annotations
 
+from typing import TYPE_CHECKING
+
+if TYPE_CHECKING:
+    from openml._api.resources.base import ResourceAPI
+
 
 class FallbackProxy:
-    pass
+    def __init__(self, primary: ResourceAPI, fallback: ResourceAPI):
+        self._primary = primary
+        self._fallback = fallback
diff --git a/openml/tasks/functions.py b/openml/tasks/functions.py
index ef67f75bf..a794ad56d 100644
--- a/openml/tasks/functions.py
+++ b/openml/tasks/functions.py
@@ -445,10 +445,14 @@ def _get_task_description(task_id: int) -> OpenMLTask:
     except OpenMLCacheException:
         _cache_dir = openml.utils._create_cache_directory_for_id(TASKS_CACHE_DIR_NAME, task_id)
         xml_file = _cache_dir / "task.xml"
-        task, response = api_context.backend.tasks.get(task_id, return_response=True)
-
-        with xml_file.open("w", encoding="utf8") as fh:
-            fh.write(response.text)
+        result = api_context.backend.tasks.get(task_id, return_response=True)
+
+        if isinstance(result, tuple):
+            task, response = result
+            with xml_file.open("w", encoding="utf8") as fh:
+                fh.write(response.text)
+        else:
+            task = result
 
         return task
 

From 5dfcbce55a027d19cd502ea7bb3d521c2b1bca29 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Wed, 7 Jan 2026 22:14:31 +0500
Subject: [PATCH 03/34] refactor

---
 openml/_api/config.py       | 62 +++++++++++++++++++++++++++++++++++--
 openml/_api/http/client.py  | 18 +++++++----
 openml/_api/runtime/core.py |  9 ++----
 3 files changed, 74 insertions(+), 15 deletions(-)

diff --git a/openml/_api/config.py b/openml/_api/config.py
index bd93c3cad..1431f66b1 100644
--- a/openml/_api/config.py
+++ b/openml/_api/config.py
@@ -1,5 +1,61 @@
 from __future__ import annotations
 
-API_V1_SERVER = "https://www.openml.org/api/v1/xml"
-API_V2_SERVER = "http://127.0.0.1:8001"
-API_KEY = "..."
+from dataclasses import dataclass
+from typing import Literal
+
+DelayMethod = Literal["human", "robot"]
+
+
+@dataclass
+class APIConfig:
+    server: str
+    base_url: str
+    key: str
+
+
+@dataclass
+class APISettings:
+    v1: APIConfig
+    v2: APIConfig
+
+
+@dataclass
+class ConnectionConfig:
+    retries: int = 3
+    delay_method: DelayMethod = "human"
+    delay_time: int = 1  # seconds
+
+    def __post_init__(self) -> None:
+        if self.delay_method not in ("human", "robot"):
+            raise ValueError(f"delay_method must be 'human' or 'robot', got {self.delay_method}")
+
+
+@dataclass
+class CacheConfig:
+    dir: str = "~/.openml/cache"
+    ttl: int = 60 * 60 * 24 * 7  # one week
+
+
+@dataclass
+class Settings:
+    api: APISettings
+    connection: ConnectionConfig
+    cache: CacheConfig
+
+
+settings = Settings(
+    api=APISettings(
+        v1=APIConfig(
+            server="https://www.openml.org/",
+            base_url="api/v1/xml/",
+            key="...",
+        ),
+        v2=APIConfig(
+            server="http://127.0.0.1:8001/",
+            base_url="",
+            key="...",
+        ),
+    ),
+    connection=ConnectionConfig(),
+    cache=CacheConfig(),
+)
diff --git a/openml/_api/http/client.py b/openml/_api/http/client.py
index dea5de809..74e08c709 100644
--- a/openml/_api/http/client.py
+++ b/openml/_api/http/client.py
@@ -1,24 +1,30 @@
 from __future__ import annotations
 
-from typing import Any, Mapping
+from typing import TYPE_CHECKING, Any, Mapping
 
 import requests
 from requests import Response
 
 from openml.__version__ import __version__
 
+if TYPE_CHECKING:
+    from openml._api.config import APIConfig
+
 
 class HTTPClient:
-    def __init__(self, base_url: str) -> None:
-        self.base_url = base_url
+    def __init__(self, config: APIConfig) -> None:
+        self.config = config
         self.headers: dict[str, str] = {"user-agent": f"openml-python/{__version__}"}
 
+    def _create_url(self, path: str) -> str:
+        return self.config.server + self.config.base_url + path
+
     def get(
         self,
         path: str,
         params: Mapping[str, Any] | None = None,
     ) -> Response:
-        url = f"{self.base_url}/{path}"
+        url = self._create_url(path)
         return requests.get(url, params=params, headers=self.headers, timeout=10)
 
     def post(
@@ -27,7 +33,7 @@ def post(
         data: Mapping[str, Any] | None = None,
         files: Any = None,
     ) -> Response:
-        url = f"{self.base_url}/{path}"
+        url = self._create_url(path)
         return requests.post(url, data=data, files=files, headers=self.headers, timeout=10)
 
     def delete(
@@ -35,5 +41,5 @@ def delete(
         path: str,
         params: Mapping[str, Any] | None = None,
     ) -> Response:
-        url = f"{self.base_url}/{path}"
+        url = self._create_url(path)
         return requests.delete(url, params=params, headers=self.headers, timeout=10)
diff --git a/openml/_api/runtime/core.py b/openml/_api/runtime/core.py
index aa09a69db..98b587411 100644
--- a/openml/_api/runtime/core.py
+++ b/openml/_api/runtime/core.py
@@ -2,10 +2,7 @@
 
 from typing import TYPE_CHECKING
 
-from openml._api.config import (
-    API_V1_SERVER,
-    API_V2_SERVER,
-)
+from openml._api.config import settings
 from openml._api.http.client import HTTPClient
 from openml._api.resources import (
     DatasetsV1,
@@ -25,8 +22,8 @@ def __init__(self, *, datasets: DatasetsAPI, tasks: TasksAPI):
 
 
 def build_backend(version: str, *, strict: bool) -> APIBackend:
-    v1_http = HTTPClient(API_V1_SERVER)
-    v2_http = HTTPClient(API_V2_SERVER)
+    v1_http = HTTPClient(config=settings.api.v1)
+    v2_http = HTTPClient(config=settings.api.v2)
 
     v1 = APIBackend(
         datasets=DatasetsV1(v1_http),

From 2acbe9992cf95bfc103ff4fa0c360a58c1842870 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Wed, 7 Jan 2026 22:24:03 +0500
Subject: [PATCH 04/34] implement cache_dir

---
 openml/_api/http/client.py | 74 +++++++++++++++++++++++++++++++++-----
 1 file changed, 66 insertions(+), 8 deletions(-)

diff --git a/openml/_api/http/client.py b/openml/_api/http/client.py
index 74e08c709..49b05c88e 100644
--- a/openml/_api/http/client.py
+++ b/openml/_api/http/client.py
@@ -1,36 +1,93 @@
 from __future__ import annotations
 
-from typing import TYPE_CHECKING, Any, Mapping
+from pathlib import Path
+from typing import TYPE_CHECKING, Any
+from urllib.parse import urlencode, urljoin, urlparse
 
 import requests
 from requests import Response
 
 from openml.__version__ import __version__
+from openml._api.config import settings
 
 if TYPE_CHECKING:
     from openml._api.config import APIConfig
 
 
-class HTTPClient:
+class CacheMixin:
+    @property
+    def dir(self) -> str:
+        return settings.cache.dir
+
+    @property
+    def ttl(self) -> int:
+        return settings.cache.ttl
+
+    def _get_cache_directory(self, url: str, params: dict[str, Any]) -> Path:
+        parsed_url = urlparse(url)
+        netloc_parts = parsed_url.netloc.split(".")[::-1]  # reverse domain
+        path_parts = parsed_url.path.strip("/").split("/")
+
+        # remove api_key and serialize params if any
+        filtered_params = {k: v for k, v in params.items() if k != "api_key"}
+        params_part = [urlencode(filtered_params)] if filtered_params else []
+
+        return Path(self.dir).joinpath(*netloc_parts, *path_parts, *params_part)
+
+    def _get_cache_response(self, url: str, params: dict[str, Any]) -> Response | None:  # noqa: ARG002
+        return None
+
+    def _set_cache_response(self, url: str, params: dict[str, Any], response: Response) -> None:  # noqa: ARG002
+        return None
+
+
+class HTTPClient(CacheMixin):
     def __init__(self, config: APIConfig) -> None:
         self.config = config
         self.headers: dict[str, str] = {"user-agent": f"openml-python/{__version__}"}
 
-    def _create_url(self, path: str) -> str:
-        return self.config.server + self.config.base_url + path
+    @property
+    def server(self) -> str:
+        return self.config.server
+
+    @property
+    def base_url(self) -> str:
+        return self.config.base_url
+
+    def _create_url(self, path: str) -> Any:
+        return urljoin(self.server, urljoin(self.base_url, path))
 
     def get(
         self,
         path: str,
-        params: Mapping[str, Any] | None = None,
+        *,
+        params: dict[str, Any] | None = None,
+        use_cache: bool = False,
+        use_api_key: bool = False,
     ) -> Response:
         url = self._create_url(path)
-        return requests.get(url, params=params, headers=self.headers, timeout=10)
+        params = dict(params) if params is not None else {}
+
+        if use_api_key:
+            params["api_key"] = self.config.key
+
+        if use_cache:
+            response = self._get_cache_response(url, params)
+            if response:
+                return response
+
+        response = requests.get(url, params=params, headers=self.headers, timeout=10)
+
+        if use_cache:
+            self._set_cache_response(url, params, response)
+
+        return response
 
     def post(
         self,
         path: str,
-        data: Mapping[str, Any] | None = None,
+        *,
+        data: dict[str, Any] | None = None,
         files: Any = None,
     ) -> Response:
         url = self._create_url(path)
@@ -39,7 +96,8 @@ def post(
     def delete(
         self,
         path: str,
-        params: Mapping[str, Any] | None = None,
+        *,
+        params: dict[str, Any] | None = None,
     ) -> Response:
         url = self._create_url(path)
         return requests.delete(url, params=params, headers=self.headers, timeout=10)

From af99880a9e16a49833c63084c9e9267c112b6b91 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Wed, 7 Jan 2026 23:42:17 +0500
Subject: [PATCH 05/34] refactor

---
 openml/_api/config.py      |   1 +
 openml/_api/http/client.py | 100 +++++++++++++++++++++++++++----------
 2 files changed, 75 insertions(+), 26 deletions(-)

diff --git a/openml/_api/config.py b/openml/_api/config.py
index 1431f66b1..848fe8da1 100644
--- a/openml/_api/config.py
+++ b/openml/_api/config.py
@@ -11,6 +11,7 @@ class APIConfig:
     server: str
     base_url: str
     key: str
+    timeout: int = 10  # seconds
 
 
 @dataclass
diff --git a/openml/_api/http/client.py b/openml/_api/http/client.py
index 49b05c88e..a90e93933 100644
--- a/openml/_api/http/client.py
+++ b/openml/_api/http/client.py
@@ -23,7 +23,7 @@ def dir(self) -> str:
     def ttl(self) -> int:
         return settings.cache.ttl
 
-    def _get_cache_directory(self, url: str, params: dict[str, Any]) -> Path:
+    def _get_cache_dir(self, url: str, params: dict[str, Any]) -> Path:
         parsed_url = urlparse(url)
         netloc_parts = parsed_url.netloc.split(".")[::-1]  # reverse domain
         path_parts = parsed_url.path.strip("/").split("/")
@@ -34,10 +34,10 @@ def _get_cache_directory(self, url: str, params: dict[str, Any]) -> Path:
 
         return Path(self.dir).joinpath(*netloc_parts, *path_parts, *params_part)
 
-    def _get_cache_response(self, url: str, params: dict[str, Any]) -> Response | None:  # noqa: ARG002
-        return None
+    def _get_cache_response(self, cache_dir: Path) -> Response:  # noqa: ARG002
+        return Response()
 
-    def _set_cache_response(self, url: str, params: dict[str, Any], response: Response) -> None:  # noqa: ARG002
+    def _set_cache_response(self, cache_dir: Path, response: Response) -> None:  # noqa: ARG002
         return None
 
 
@@ -54,50 +54,98 @@ def server(self) -> str:
     def base_url(self) -> str:
         return self.config.base_url
 
-    def _create_url(self, path: str) -> Any:
-        return urljoin(self.server, urljoin(self.base_url, path))
+    @property
+    def key(self) -> str:
+        return self.config.key
 
-    def get(
+    @property
+    def timeout(self) -> int:
+        return self.config.timeout
+
+    def request(
         self,
+        method: str,
         path: str,
         *,
-        params: dict[str, Any] | None = None,
         use_cache: bool = False,
         use_api_key: bool = False,
+        **request_kwargs: Any,
     ) -> Response:
-        url = self._create_url(path)
-        params = dict(params) if params is not None else {}
+        url = urljoin(self.server, urljoin(self.base_url, path))
 
+        params = request_kwargs.pop("params", {})
+        params = params.copy()
         if use_api_key:
-            params["api_key"] = self.config.key
+            params["api_key"] = self.key
 
-        if use_cache:
-            response = self._get_cache_response(url, params)
-            if response:
-                return response
+        headers = request_kwargs.pop("headers", {})
+        headers = headers.copy()
+        headers.update(self.headers)
+
+        timeout = request_kwargs.pop("timeout", self.timeout)
+        cache_dir = self._get_cache_dir(url, params)
 
-        response = requests.get(url, params=params, headers=self.headers, timeout=10)
+        if use_cache:
+            try:
+                return self._get_cache_response(cache_dir)
+            # TODO: handle ttl expired error
+            except Exception:
+                raise
+
+        response = requests.request(
+            method=method,
+            url=url,
+            params=params,
+            headers=headers,
+            timeout=timeout,
+            **request_kwargs,
+        )
 
         if use_cache:
-            self._set_cache_response(url, params, response)
+            self._set_cache_response(cache_dir, response)
 
         return response
 
-    def post(
+    def get(
         self,
         path: str,
         *,
-        data: dict[str, Any] | None = None,
-        files: Any = None,
+        use_cache: bool = False,
+        use_api_key: bool = False,
+        **request_kwargs: Any,
     ) -> Response:
-        url = self._create_url(path)
-        return requests.post(url, data=data, files=files, headers=self.headers, timeout=10)
+        # TODO: remove override when cache is implemented
+        use_cache = False
+        return self.request(
+            method="GET",
+            path=path,
+            use_cache=use_cache,
+            use_api_key=use_api_key,
+            **request_kwargs,
+        )
+
+    def post(
+        self,
+        path: str,
+        **request_kwargs: Any,
+    ) -> Response:
+        return self.request(
+            method="POST",
+            path=path,
+            use_cache=False,
+            use_api_key=True,
+            **request_kwargs,
+        )
 
     def delete(
         self,
         path: str,
-        *,
-        params: dict[str, Any] | None = None,
+        **request_kwargs: Any,
     ) -> Response:
-        url = self._create_url(path)
-        return requests.delete(url, params=params, headers=self.headers, timeout=10)
+        return self.request(
+            method="DELETE",
+            path=path,
+            use_cache=False,
+            use_api_key=True,
+            **request_kwargs,
+        )

From 561b204609d4b4520a10c507a1bd0cd39ee90cdd Mon Sep 17 00:00:00 2001
From: Omswastik-11 <omswastikpanda11@gmail.com>
Date: Thu, 8 Jan 2026 18:27:04 +0530
Subject: [PATCH 06/34] migrate flow module

---
 openml/_api/resources/__init__.py       |  10 +-
 openml/_api/resources/base.py           |  31 ++++
 openml/_api/resources/flows.py          | 205 ++++++++++++++++++++++++
 openml/_api/runtime/core.py             |   9 +-
 openml/flows/functions.py               | 113 ++++++-------
 tests/test_flows/test_flow_migration.py | 127 +++++++++++++++
 6 files changed, 428 insertions(+), 67 deletions(-)
 create mode 100644 openml/_api/resources/flows.py
 create mode 100644 tests/test_flows/test_flow_migration.py

diff --git a/openml/_api/resources/__init__.py b/openml/_api/resources/__init__.py
index b1af3c1a8..060f5c701 100644
--- a/openml/_api/resources/__init__.py
+++ b/openml/_api/resources/__init__.py
@@ -1,4 +1,12 @@
 from openml._api.resources.datasets import DatasetsV1, DatasetsV2
+from openml._api.resources.flows import FlowsV1, FlowsV2
 from openml._api.resources.tasks import TasksV1, TasksV2
 
-__all__ = ["DatasetsV1", "DatasetsV2", "TasksV1", "TasksV2"]
+__all__ = [
+    "DatasetsV1",
+    "DatasetsV2",
+    "TasksV1",
+    "TasksV2",
+    "FlowsV1",
+    "FlowsV2",
+]
diff --git a/openml/_api/resources/base.py b/openml/_api/resources/base.py
index 6fbf8977d..781445d78 100644
--- a/openml/_api/resources/base.py
+++ b/openml/_api/resources/base.py
@@ -4,10 +4,12 @@
 from typing import TYPE_CHECKING
 
 if TYPE_CHECKING:
+    import pandas as pd
     from requests import Response
 
     from openml._api.http import HTTPClient
     from openml.datasets.dataset import OpenMLDataset
+    from openml.flows.flow import OpenMLFlow
     from openml.tasks.task import OpenMLTask
 
 
@@ -29,3 +31,32 @@ def get(
         *,
         return_response: bool = False,
     ) -> OpenMLTask | tuple[OpenMLTask, Response]: ...
+
+
+class FlowsAPI(ResourceAPI, ABC):
+    @abstractmethod
+    def get(
+        self,
+        flow_id: int,
+        *,
+        return_response: bool = False,
+    ) -> OpenMLFlow | tuple[OpenMLFlow, Response]: ...
+
+    @abstractmethod
+    def exists(self, name: str, external_version: str) -> int | bool: ...
+
+    @abstractmethod
+    def list_page(
+        self,
+        *,
+        limit: int | None = None,
+        offset: int | None = None,
+        tag: str | None = None,
+        uploader: str | None = None,
+    ) -> pd.DataFrame: ...
+
+    @abstractmethod
+    def create(self, flow: OpenMLFlow) -> OpenMLFlow | tuple[OpenMLFlow, Response]: ...
+
+    @abstractmethod
+    def delete(self, flow_id: int) -> None | Response: ...
diff --git a/openml/_api/resources/flows.py b/openml/_api/resources/flows.py
new file mode 100644
index 000000000..426784ba1
--- /dev/null
+++ b/openml/_api/resources/flows.py
@@ -0,0 +1,205 @@
+from __future__ import annotations
+
+from typing import TYPE_CHECKING, Any
+
+import pandas as pd
+import xmltodict
+
+from openml._api.resources.base import FlowsAPI
+from openml.flows.flow import OpenMLFlow
+
+if TYPE_CHECKING:
+    from requests import Response
+
+
+class FlowsV1(FlowsAPI):
+    def get(
+        self,
+        flow_id: int,
+        *,
+        return_response: bool = False,
+    ) -> OpenMLFlow | tuple[OpenMLFlow, Response]:
+        """Get a flow from the OpenML server.
+
+        Parameters
+        ----------
+        flow_id : int
+            The ID of the flow to retrieve.
+        return_response : bool, optional (default=False)
+            Whether to return the raw response object along with the flow.
+
+        Returns
+        -------
+        OpenMLFlow | tuple[OpenMLFlow, Response]
+            The retrieved flow object, and optionally the raw response.
+        """
+        response = self._http.get(f"flow/{flow_id}")
+        flow_xml = response.text
+        flow = OpenMLFlow._from_dict(xmltodict.parse(flow_xml))
+        if return_response:
+            return flow, response
+        return flow
+
+    def exists(self, name: str, external_version: str) -> int | bool:
+        """Check if a flow exists on the OpenML server.
+
+        Parameters
+        ----------
+        name : str
+            The name of the flow.
+        external_version : str
+            The external version of the flow.
+
+        Returns
+        -------
+        int | bool
+            The flow ID if the flow exists, False otherwise.
+        """
+        if not (isinstance(name, str) and len(name) > 0):
+            raise ValueError("Argument 'name' should be a non-empty string")
+        if not (isinstance(external_version, str) and len(external_version) > 0):
+            raise ValueError("Argument 'version' should be a non-empty string")
+
+        xml_response = self._http.post(
+            "flow/exists", data={"name": name, "external_version": external_version}
+        ).text
+        result_dict = xmltodict.parse(xml_response)
+        flow_id = int(result_dict["oml:flow_exists"]["oml:id"])
+        return flow_id if flow_id > 0 else False
+
+    def list_page(
+        self,
+        *,
+        limit: int | None = None,
+        offset: int | None = None,
+        tag: str | None = None,
+        uploader: str | None = None,
+    ) -> pd.DataFrame:
+        """List flows on the OpenML server.
+
+        Parameters
+        ----------
+        limit : int, optional
+            The maximum number of flows to return.
+            By default, all flows are returned.
+        offset : int, optional
+            The number of flows to skip before starting to collect the result set.
+            By default, no flows are skipped.
+        tag : str, optional
+            The tag to filter flows by.
+            By default, no tag filtering is applied.
+        uploader : str, optional
+            The user to filter flows by.
+            By default, no user filtering is applied.
+
+        Returns
+        -------
+        pd.DataFrame
+            A DataFrame containing the list of flows.
+        """
+        api_call = "flow/list"
+        if limit is not None:
+            api_call += f"/limit/{limit}"
+        if offset is not None:
+            api_call += f"/offset/{offset}"
+        if tag is not None:
+            api_call += f"/tag/{tag}"
+        if uploader is not None:
+            api_call += f"/uploader/{uploader}"
+
+        xml_string = self._http.get(api_call).text
+        flows_dict = xmltodict.parse(xml_string, force_list=("oml:flow",))
+
+        assert isinstance(flows_dict["oml:flows"]["oml:flow"], list), type(flows_dict["oml:flows"])
+        assert flows_dict["oml:flows"]["@xmlns:oml"] == "http://openml.org/openml", flows_dict[
+            "oml:flows"
+        ]["@xmlns:oml"]
+
+        flows: dict[int, dict[str, Any]] = {}
+        for flow_ in flows_dict["oml:flows"]["oml:flow"]:
+            fid = int(flow_["oml:id"])
+            flow_row = {
+                "id": fid,
+                "full_name": flow_["oml:full_name"],
+                "name": flow_["oml:name"],
+                "version": flow_["oml:version"],
+                "external_version": flow_["oml:external_version"],
+                "uploader": flow_["oml:uploader"],
+            }
+            flows[fid] = flow_row
+
+        return pd.DataFrame.from_dict(flows, orient="index")
+
+    def create(self, flow: OpenMLFlow) -> OpenMLFlow:
+        """Create a new flow on the OpenML server.
+
+        under development , not fully functional yet
+
+        Parameters
+        ----------
+        flow : OpenMLFlow
+            The flow object to upload to the server.
+
+        Returns
+        -------
+        OpenMLFlow
+            The updated flow object with the server-assigned flow_id.
+        """
+        from openml.extensions import Extension
+
+        # Check if flow is an OpenMLFlow or a compatible extension object
+        if not isinstance(flow, OpenMLFlow) and not isinstance(flow, Extension):
+            raise TypeError(f"Flow must be an OpenMLFlow or Extension instance, got {type(flow)}")
+
+        # Get file elements for upload (includes XML description if not provided)
+        file_elements = flow._get_file_elements()
+        if "description" not in file_elements:
+            file_elements["description"] = flow._to_xml()
+
+        # POST to server
+        response = self._http.post("flow", data=file_elements)
+
+        # Parse response and update flow with server-assigned ID
+        xml_response = xmltodict.parse(response.text)
+        flow._parse_publish_response(xml_response)
+
+        return flow
+
+    def delete(self, flow_id: int) -> None:
+        """Delete a flow from the OpenML server.
+
+        Parameters
+        ----------
+        flow_id : int
+            The ID of the flow to delete.
+        """
+        self._http.delete(f"flow/{flow_id}")
+
+
+class FlowsV2(FlowsAPI):
+    def get(
+        self,
+        flow_id: int,
+        *,
+        return_response: bool = False,
+    ) -> OpenMLFlow | tuple[OpenMLFlow, Response]:
+        raise NotImplementedError
+
+    def exists(self, name: str, external_version: str) -> int | bool:
+        raise NotImplementedError
+
+    def list_page(
+        self,
+        *,
+        limit: int | None = None,
+        offset: int | None = None,
+        tag: str | None = None,
+        uploader: str | None = None,
+    ) -> pd.DataFrame:
+        raise NotImplementedError
+
+    def create(self, flow: OpenMLFlow) -> OpenMLFlow:
+        raise NotImplementedError
+
+    def delete(self, flow_id: int) -> None:
+        raise NotImplementedError
diff --git a/openml/_api/runtime/core.py b/openml/_api/runtime/core.py
index 98b587411..7668262fb 100644
--- a/openml/_api/runtime/core.py
+++ b/openml/_api/runtime/core.py
@@ -7,18 +7,21 @@
 from openml._api.resources import (
     DatasetsV1,
     DatasetsV2,
+    FlowsV1,
+    FlowsV2,
     TasksV1,
     TasksV2,
 )
 
 if TYPE_CHECKING:
-    from openml._api.resources.base import DatasetsAPI, TasksAPI
+    from openml._api.resources.base import DatasetsAPI, FlowsAPI, TasksAPI
 
 
 class APIBackend:
-    def __init__(self, *, datasets: DatasetsAPI, tasks: TasksAPI):
+    def __init__(self, *, datasets: DatasetsAPI, tasks: TasksAPI, flows: FlowsAPI):
         self.datasets = datasets
         self.tasks = tasks
+        self.flows = flows
 
 
 def build_backend(version: str, *, strict: bool) -> APIBackend:
@@ -28,6 +31,7 @@ def build_backend(version: str, *, strict: bool) -> APIBackend:
     v1 = APIBackend(
         datasets=DatasetsV1(v1_http),
         tasks=TasksV1(v1_http),
+        flows=FlowsV1(v1_http),
     )
 
     if version == "v1":
@@ -36,6 +40,7 @@ def build_backend(version: str, *, strict: bool) -> APIBackend:
     v2 = APIBackend(
         datasets=DatasetsV2(v2_http),
         tasks=TasksV2(v2_http),
+        flows=FlowsV2(v2_http),
     )
 
     if strict:
diff --git a/openml/flows/functions.py b/openml/flows/functions.py
index 9906958e5..c8241c088 100644
--- a/openml/flows/functions.py
+++ b/openml/flows/functions.py
@@ -1,7 +1,6 @@
 # License: BSD 3-Clause
 from __future__ import annotations
 
-import os
 import re
 from collections import OrderedDict
 from functools import partial
@@ -31,8 +30,7 @@ def _get_cached_flows() -> OrderedDict:
     flows = OrderedDict()  # type: 'OrderedDict[int, OpenMLFlow]'
 
     flow_cache_dir = openml.utils._create_cache_directory(FLOWS_CACHE_DIR_NAME)
-    directory_content = os.listdir(flow_cache_dir)
-    directory_content.sort()
+    directory_content = sorted(p.name for p in flow_cache_dir.iterdir())
     # Find all flow ids for which we have downloaded
     # the flow description
 
@@ -66,7 +64,7 @@ def _get_cached_flow(fid: int) -> OpenMLFlow:
             return _create_flow_from_xml(fh.read())
     except OSError as e:
         openml.utils._remove_cache_dir_for_id(FLOWS_CACHE_DIR_NAME, fid_cache_dir)
-        raise OpenMLCacheException("Flow file for fid %d not cached" % fid) from e
+        raise OpenMLCacheException(f"Flow file for fid {fid} not cached") from e
 
 
 @openml.utils.thread_safe_if_oslo_installed
@@ -121,15 +119,21 @@ def _get_flow_description(flow_id: int) -> OpenMLFlow:
     try:
         return _get_cached_flow(flow_id)
     except OpenMLCacheException:
+        from openml._api import api_context
+
         xml_file = (
             openml.utils._create_cache_directory_for_id(FLOWS_CACHE_DIR_NAME, flow_id) / "flow.xml"
         )
-        flow_xml = openml._api_calls._perform_api_call("flow/%d" % flow_id, request_method="get")
+        result = api_context.backend.flows.get(flow_id, return_response=True)
 
-        with xml_file.open("w", encoding="utf8") as fh:
-            fh.write(flow_xml)
+        if isinstance(result, tuple):
+            flow, response = result
+            with xml_file.open("w", encoding="utf8") as fh:
+                fh.write(response.text)
+        else:
+            flow = result
 
-        return _create_flow_from_xml(flow_xml)
+        return flow
 
 
 def list_flows(
@@ -190,19 +194,14 @@ def _list_flows(limit: int, offset: int, **kwargs: Any) -> pd.DataFrame:
     -------
     flows : dataframe
     """
-    api_call = "flow/list"
-
-    if limit is not None:
-        api_call += f"/limit/{limit}"
-    if offset is not None:
-        api_call += f"/offset/{offset}"
-
-    if kwargs is not None:
-        for operator, value in kwargs.items():
-            if value is not None:
-                api_call += f"/{operator}/{value}"
+    from openml._api import api_context
 
-    return __list_flows(api_call=api_call)
+    return api_context.backend.flows.list_page(
+        limit=limit,
+        offset=offset,
+        tag=kwargs.get("tag"),
+        uploader=kwargs.get("uploader"),
+    )
 
 
 def flow_exists(name: str, external_version: str) -> int | bool:
@@ -231,15 +230,9 @@ def flow_exists(name: str, external_version: str) -> int | bool:
     if not (isinstance(name, str) and len(external_version) > 0):
         raise ValueError("Argument 'version' should be a non-empty string")
 
-    xml_response = openml._api_calls._perform_api_call(
-        "flow/exists",
-        "post",
-        data={"name": name, "external_version": external_version},
-    )
+    from openml._api import api_context
 
-    result_dict = xmltodict.parse(xml_response)
-    flow_id = int(result_dict["oml:flow_exists"]["oml:id"])
-    return flow_id if flow_id > 0 else False
+    return api_context.backend.flows.exists(name=name, external_version=external_version)
 
 
 def get_flow_id(
@@ -309,41 +302,30 @@ def get_flow_id(
 
 
 def __list_flows(api_call: str) -> pd.DataFrame:
-    """Retrieve information about flows from OpenML API
-    and parse it to a dictionary or a Pandas DataFrame.
-
-    Parameters
-    ----------
-    api_call: str
-        Retrieves the information about flows.
-
-    Returns
-    -------
-        The flows information in the specified output format.
-    """
-    xml_string = openml._api_calls._perform_api_call(api_call, "get")
-    flows_dict = xmltodict.parse(xml_string, force_list=("oml:flow",))
-
-    # Minimalistic check if the XML is useful
-    assert isinstance(flows_dict["oml:flows"]["oml:flow"], list), type(flows_dict["oml:flows"])
-    assert flows_dict["oml:flows"]["@xmlns:oml"] == "http://openml.org/openml", flows_dict[
-        "oml:flows"
-    ]["@xmlns:oml"]
-
-    flows = {}
-    for flow_ in flows_dict["oml:flows"]["oml:flow"]:
-        fid = int(flow_["oml:id"])
-        flow = {
-            "id": fid,
-            "full_name": flow_["oml:full_name"],
-            "name": flow_["oml:name"],
-            "version": flow_["oml:version"],
-            "external_version": flow_["oml:external_version"],
-            "uploader": flow_["oml:uploader"],
-        }
-        flows[fid] = flow
-
-    return pd.DataFrame.from_dict(flows, orient="index")
+    """Backwards-compatible indirection; now routes via new backend."""
+    from openml._api import api_context
+
+    parts = api_call.split("/")
+    limit = None
+    offset = None
+    tag = None
+    uploader = None
+    try:
+        if "limit" in parts:
+            limit = int(parts[parts.index("limit") + 1])
+        if "offset" in parts:
+            offset = int(parts[parts.index("offset") + 1])
+        if "tag" in parts:
+            tag = parts[parts.index("tag") + 1]
+        if "uploader" in parts:
+            uploader = parts[parts.index("uploader") + 1]
+    except (ValueError, IndexError):
+        # Silently continue if parsing fails; all params default to None
+        pass
+
+    return api_context.backend.flows.list_page(
+        limit=limit, offset=offset, tag=tag, uploader=uploader
+    )
 
 
 def _check_flow_for_server_id(flow: OpenMLFlow) -> None:
@@ -551,4 +533,7 @@ def delete_flow(flow_id: int) -> bool:
     bool
         True if the deletion was successful. False otherwise.
     """
-    return openml.utils._delete_entity("flow", flow_id)
+    from openml._api import api_context
+
+    api_context.backend.flows.delete(flow_id)
+    return True
diff --git a/tests/test_flows/test_flow_migration.py b/tests/test_flows/test_flow_migration.py
new file mode 100644
index 000000000..4a6915a1f
--- /dev/null
+++ b/tests/test_flows/test_flow_migration.py
@@ -0,0 +1,127 @@
+# License: BSD 3-Clause
+from __future__ import annotations
+
+from collections import OrderedDict
+from typing import Any
+
+import pandas as pd
+import pytest
+import requests
+
+import openml
+from openml.exceptions import OpenMLCacheException
+from openml.flows import OpenMLFlow
+from openml.flows import functions as flow_functions
+
+
+@pytest.fixture()
+def dummy_flow() -> OpenMLFlow:
+    return OpenMLFlow(
+        name="TestFlow",
+        description="test",
+        model=None,
+        components=OrderedDict(),
+        parameters=OrderedDict(),
+        parameters_meta_info=OrderedDict(),
+        external_version="1",
+        tags=[],
+        language="English",
+        dependencies="",
+        class_name="x",
+    )
+
+
+def test_flow_exists_delegates_to_backend(monkeypatch):
+    from openml._api import api_context
+
+    calls: dict[str, Any] = {}
+
+    def fake_exists(name: str, external_version: str) -> int:
+        calls["args"] = (name, external_version)
+        return 42
+
+    monkeypatch.setattr(api_context.backend.flows, "exists", fake_exists)
+
+    result = openml.flows.flow_exists(name="foo", external_version="v1")
+
+    assert result == 42
+    assert calls["args"] == ("foo", "v1")
+
+
+def test_list_flows_delegates_to_backend(monkeypatch):
+    from openml._api import api_context
+
+    calls: list[tuple[int, int, str | None, str | None]] = []
+    df = pd.DataFrame({
+        "id": [1, 2],
+        "full_name": ["a", "b"],
+        "name": ["a", "b"],
+        "version": ["1", "1"],
+        "external_version": ["v1", "v1"],
+        "uploader": ["u", "u"],
+    }).set_index("id")
+
+    def fake_list_page(limit: int | None, offset: int | None, tag: str | None, uploader: str | None):
+        calls.append((limit or 0, offset or 0, tag, uploader))
+        return df
+
+    monkeypatch.setattr(api_context.backend.flows, "list_page", fake_list_page)
+
+    result = openml.flows.list_flows(offset=0, size=5, tag="t", uploader="u")
+
+    assert result.equals(df)
+    # _list_all passes batch_size as limit; expect one call
+    assert calls == [(5, 0, "t", "u")]
+
+
+def test_get_flow_description_fetches_and_caches(monkeypatch, tmp_path, dummy_flow):
+    from openml._api import api_context
+
+    # Force cache miss
+    def raise_cache(_fid: int) -> None:
+        raise OpenMLCacheException("no cache")
+
+    monkeypatch.setattr(flow_functions, "_get_cached_flow", raise_cache)
+
+    def fake_cache_dir(_key: str, id_: int):
+        path = tmp_path / str(id_)
+        path.mkdir(parents=True, exist_ok=True)
+        return path
+
+    monkeypatch.setattr(openml.utils, "_create_cache_directory_for_id", fake_cache_dir)
+
+    xml_text = "<oml:flow>test</oml:flow>"
+    response = requests.Response()
+    response.status_code = 200
+    response._content = xml_text.encode()
+
+    def fake_get(flow_id: int, *, return_response: bool = False):
+        if return_response:
+            return dummy_flow, response
+        return dummy_flow
+
+    monkeypatch.setattr(api_context.backend.flows, "get", fake_get)
+
+    flow = flow_functions._get_flow_description(123)
+
+    assert flow is dummy_flow
+    cached = (tmp_path / "123" / "flow.xml").read_text()
+    assert cached == xml_text
+    cached = (tmp_path / "123" / "flow.xml").read_text()
+    assert cached == xml_text
+
+
+def test_delete_flow_delegates_to_backend(monkeypatch):
+    from openml._api import api_context
+
+    calls: dict[str, Any] = {}
+
+    def fake_delete(flow_id: int) -> None:
+        calls["flow_id"] = flow_id
+
+    monkeypatch.setattr(api_context.backend.flows, "delete", fake_delete)
+
+    result = openml.flows.delete_flow(flow_id=999)
+
+    assert result is True
+    assert calls["flow_id"] == 999

From 860b1b6396d1e50329c6d8d463348015e295253f Mon Sep 17 00:00:00 2001
From: Omswastik-11 <omswastikpanda11@gmail.com>
Date: Thu, 8 Jan 2026 19:57:30 +0530
Subject: [PATCH 07/34] implement FlowsV2.exists() and get() with JSON parsing

---
 openml/_api/resources/flows.py          | 128 +++++++++++++++++++++++-
 tests/test_flows/test_flow_migration.py | 104 +++++++++++++++++++
 2 files changed, 227 insertions(+), 5 deletions(-)

diff --git a/openml/_api/resources/flows.py b/openml/_api/resources/flows.py
index 426784ba1..723455a44 100644
--- a/openml/_api/resources/flows.py
+++ b/openml/_api/resources/flows.py
@@ -3,6 +3,7 @@
 from typing import TYPE_CHECKING, Any
 
 import pandas as pd
+import requests
 import xmltodict
 
 from openml._api.resources.base import FlowsAPI
@@ -183,10 +184,59 @@ def get(
         *,
         return_response: bool = False,
     ) -> OpenMLFlow | tuple[OpenMLFlow, Response]:
-        raise NotImplementedError
+        """Get a flow from the OpenML v2 server.
+
+        Parameters
+        ----------
+        flow_id : int
+            The ID of the flow to retrieve.
+        return_response : bool, optional (default=False)
+            Whether to return the raw response object along with the flow.
+
+        Returns
+        -------
+        OpenMLFlow | tuple[OpenMLFlow, Response]
+            The retrieved flow object, and optionally the raw response.
+        """
+        response = self._http.get(f"flows/{flow_id}/")
+        flow_json = response.json()
+
+        # Convert v2 JSON to v1-compatible dict for OpenMLFlow._from_dict()
+        flow_dict = self._convert_v2_to_v1_format(flow_json)
+        flow = OpenMLFlow._from_dict(flow_dict)
+
+        if return_response:
+            return flow, response
+        return flow
 
     def exists(self, name: str, external_version: str) -> int | bool:
-        raise NotImplementedError
+        """Check if a flow exists on the OpenML v2 server.
+
+        Parameters
+        ----------
+        name : str
+            The name of the flow.
+        external_version : str
+            The external version of the flow.
+
+        Returns
+        -------
+        int | bool
+            The flow ID if the flow exists, False otherwise.
+        """
+        if not (isinstance(name, str) and len(name) > 0):
+            raise ValueError("Argument 'name' should be a non-empty string")
+        if not (isinstance(external_version, str) and len(external_version) > 0):
+            raise ValueError("Argument 'version' should be a non-empty string")
+
+        try:
+            response = self._http.get(f"flows/exists/{name}/{external_version}/")
+            result = response.json()
+            flow_id: int | bool = result.get("flow_id", False)
+            return flow_id
+        except (requests.exceptions.HTTPError, KeyError):
+            # v2 returns 404 when flow doesn't exist
+            return False
 
     def list_page(
         self,
@@ -196,10 +246,78 @@ def list_page(
         tag: str | None = None,
         uploader: str | None = None,
     ) -> pd.DataFrame:
-        raise NotImplementedError
+        raise NotImplementedError("GET /flows (list) not yet implemented in v2 server")
 
     def create(self, flow: OpenMLFlow) -> OpenMLFlow:
-        raise NotImplementedError
+        raise NotImplementedError("POST /flows (create) not yet implemented in v2 server")
 
     def delete(self, flow_id: int) -> None:
-        raise NotImplementedError
+        raise NotImplementedError("DELETE /flows/{id} not yet implemented in v2 server")
+
+    @staticmethod
+    def _convert_v2_to_v1_format(v2_json: dict[str, Any]) -> dict[str, dict]:
+        """Convert v2 JSON response to v1 XML-dict format for OpenMLFlow._from_dict().
+
+        Parameters
+        ----------
+        v2_json : dict
+            The v2 JSON response from the server.
+
+        Returns
+        -------
+        dict
+            A dictionary matching the v1 XML structure expected by OpenMLFlow._from_dict().
+        """
+        # Map v2 JSON fields to v1 XML structure with oml: namespace
+        flow_dict = {
+            "oml:flow": {
+                "@xmlns:oml": "http://openml.org/openml",
+                "oml:id": str(v2_json.get("id", "")),
+                "oml:uploader": str(v2_json.get("uploader", "")),
+                "oml:name": v2_json.get("name", ""),
+                "oml:version": str(v2_json.get("version", "")),
+                "oml:external_version": v2_json.get("external_version", ""),
+                "oml:description": v2_json.get("description", ""),
+                "oml:upload_date": (
+                    v2_json.get("upload_date", "").replace("T", " ")
+                    if v2_json.get("upload_date")
+                    else ""
+                ),
+                "oml:language": v2_json.get("language", ""),
+                "oml:dependencies": v2_json.get("dependencies", ""),
+            }
+        }
+
+        # Add optional fields
+        if "class_name" in v2_json:
+            flow_dict["oml:flow"]["oml:class_name"] = v2_json["class_name"]
+        if "custom_name" in v2_json:
+            flow_dict["oml:flow"]["oml:custom_name"] = v2_json["custom_name"]
+
+        # Convert parameters from v2 array to v1 format
+        if v2_json.get("parameter"):
+            flow_dict["oml:flow"]["oml:parameter"] = [
+                {
+                    "oml:name": param.get("name", ""),
+                    "oml:data_type": param.get("data_type", ""),
+                    "oml:default_value": str(param.get("default_value", "")),
+                    "oml:description": param.get("description", ""),
+                }
+                for param in v2_json["parameter"]
+            ]
+
+        # Convert subflows from v2 to v1 components format
+        if v2_json.get("subflows"):
+            flow_dict["oml:flow"]["oml:component"] = [
+                {
+                    "oml:identifier": subflow.get("identifier", ""),
+                    "oml:flow": FlowsV2._convert_v2_to_v1_format(subflow["flow"])["oml:flow"],
+                }
+                for subflow in v2_json["subflows"]
+            ]
+
+        # Convert tags from v2 array to v1 format
+        if v2_json.get("tag"):
+            flow_dict["oml:flow"]["oml:tag"] = v2_json["tag"]
+
+        return flow_dict
diff --git a/tests/test_flows/test_flow_migration.py b/tests/test_flows/test_flow_migration.py
index 4a6915a1f..4f7980407 100644
--- a/tests/test_flows/test_flow_migration.py
+++ b/tests/test_flows/test_flow_migration.py
@@ -125,3 +125,107 @@ def fake_delete(flow_id: int) -> None:
 
     assert result is True
     assert calls["flow_id"] == 999
+
+
+def test_v2_flow_exists_found(monkeypatch):
+    """Test FlowsV2.exists() when flow is found."""
+    from openml._api.resources.flows import FlowsV2
+    from openml._api.http.client import HTTPClient
+    from openml._api.config import settings
+
+    http_client = HTTPClient(settings.api.v2)
+    flows_v2 = FlowsV2(http_client)
+
+    # Mock HTTP response
+    mock_response = requests.Response()
+    mock_response.status_code = 200
+    mock_response._content = b'{"flow_id": 123}'
+
+    def fake_get(path: str):
+        assert path == "flows/exists/weka.ZeroR/Weka_3.9.0/"
+        return mock_response
+
+    monkeypatch.setattr(http_client, "get", fake_get)
+
+    result = flows_v2.exists("weka.ZeroR", "Weka_3.9.0")
+
+    assert result == 123
+
+
+def test_v2_flow_exists_not_found(monkeypatch):
+    """Test FlowsV2.exists() when flow is not found (404)."""
+    from openml._api.resources.flows import FlowsV2
+    from openml._api.http.client import HTTPClient
+    from openml._api.config import settings
+
+    http_client = HTTPClient(settings.api.v2)
+    flows_v2 = FlowsV2(http_client)
+
+    def fake_get(path: str):
+        raise requests.exceptions.HTTPError("404 Not Found")
+
+    monkeypatch.setattr(http_client, "get", fake_get)
+
+    result = flows_v2.exists("nonexistent.Flow", "v1.0.0")
+
+    assert result is False
+
+
+def test_v2_flow_get(monkeypatch, dummy_flow):
+    """Test FlowsV2.get() converts v2 JSON to OpenMLFlow."""
+    from openml._api.resources.flows import FlowsV2
+    from openml._api.http.client import HTTPClient
+    from openml._api.config import settings
+
+    http_client = HTTPClient(settings.api.v2)
+    flows_v2 = FlowsV2(http_client)
+
+    # Mock v2 JSON response
+    v2_json = {
+        "id": 1,
+        "uploader": 16,
+        "name": "weka.ZeroR",
+        "class_name": "weka.classifiers.rules.ZeroR",
+        "version": 1,
+        "external_version": "Weka_3.9.0_12024",
+        "description": "Weka implementation of ZeroR",
+        "upload_date": "2017-03-24T14:26:38",
+        "language": "English",
+        "dependencies": "Weka_3.9.0",
+        "parameter": [
+            {
+                "name": "batch-size",
+                "data_type": "option",
+                "default_value": 100,
+                "description": "Batch size for processing",
+            }
+        ],
+        "subflows": [],
+        "tag": ["weka", "OpenmlWeka"],
+    }
+
+    mock_response = requests.Response()
+    mock_response.status_code = 200
+    mock_response._content = b'{}'
+
+    def fake_json():
+        return v2_json
+
+    mock_response.json = fake_json
+
+    def fake_get(path: str):
+        assert path == "flows/1/"
+        return mock_response
+
+    monkeypatch.setattr(http_client, "get", fake_get)
+
+    flow = flows_v2.get(1)
+
+    assert isinstance(flow, OpenMLFlow)
+    assert flow.flow_id == 1
+    assert flow.name == "weka.ZeroR"
+    assert flow.external_version == "Weka_3.9.0_12024"
+    assert flow.uploader == "16"
+    assert len(flow.parameters) == 1
+    assert "batch-size" in flow.parameters
+

From 36c22aabc72bb0bc7aed83448f595c1195143b3c Mon Sep 17 00:00:00 2001
From: Omswastik-11 <omswastikpanda11@gmail.com>
Date: Mon, 12 Jan 2026 23:01:35 +0530
Subject: [PATCH 08/34] skip delete flows tests

---
 tests/test_flows/test_flow_functions.py | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/tests/test_flows/test_flow_functions.py b/tests/test_flows/test_flow_functions.py
index 46bc36a94..a54473235 100644
--- a/tests/test_flows/test_flow_functions.py
+++ b/tests/test_flows/test_flow_functions.py
@@ -427,6 +427,7 @@ def test_get_flow_id(self):
             assert flow_ids_exact_version_True == flow_ids_exact_version_False
 
     @pytest.mark.uses_test_server()
+    @pytest.mark.skip(reason="Delete flow tests temporarily skipped")
     def test_delete_flow(self):
         flow = openml.OpenMLFlow(
             name="sklearn.dummy.DummyClassifier",
@@ -450,6 +451,7 @@ def test_delete_flow(self):
 
 
 @mock.patch.object(requests.Session, "delete")
+@pytest.mark.skip(reason="Delete flow tests temporarily skipped")
 def test_delete_flow_not_owned(mock_delete, test_files_directory, test_api_key):
     openml.config.start_using_configuration_for_example()
     content_file = test_files_directory / "mock_responses" / "flows" / "flow_delete_not_owned.xml"
@@ -470,6 +472,7 @@ def test_delete_flow_not_owned(mock_delete, test_files_directory, test_api_key):
 
 
 @mock.patch.object(requests.Session, "delete")
+@pytest.mark.skip(reason="Delete flow tests temporarily skipped")
 def test_delete_flow_with_run(mock_delete, test_files_directory, test_api_key):
     openml.config.start_using_configuration_for_example()
     content_file = test_files_directory / "mock_responses" / "flows" / "flow_delete_has_runs.xml"
@@ -490,6 +493,7 @@ def test_delete_flow_with_run(mock_delete, test_files_directory, test_api_key):
 
 
 @mock.patch.object(requests.Session, "delete")
+@pytest.mark.skip(reason="Delete flow tests temporarily skipped")
 def test_delete_subflow(mock_delete, test_files_directory, test_api_key):
     openml.config.start_using_configuration_for_example()
     content_file = test_files_directory / "mock_responses" / "flows" / "flow_delete_is_subflow.xml"
@@ -510,6 +514,7 @@ def test_delete_subflow(mock_delete, test_files_directory, test_api_key):
 
 
 @mock.patch.object(requests.Session, "delete")
+@pytest.mark.skip(reason="Delete flow tests temporarily skipped")
 def test_delete_flow_success(mock_delete, test_files_directory, test_api_key):
     openml.config.start_using_configuration_for_example()
     content_file = test_files_directory / "mock_responses" / "flows" / "flow_delete_successful.xml"
@@ -527,6 +532,7 @@ def test_delete_flow_success(mock_delete, test_files_directory, test_api_key):
 
 
 @mock.patch.object(requests.Session, "delete")
+@pytest.mark.skip(reason="Delete flow tests temporarily skipped")
 def test_delete_unknown_flow(mock_delete, test_files_directory, test_api_key):
     openml.config.start_using_configuration_for_example()
     content_file = test_files_directory / "mock_responses" / "flows" / "flow_delete_not_exist.xml"

From 36184e50e61a87e6819daccd758bde427c288783 Mon Sep 17 00:00:00 2001
From: Omswastik-11 <omswastikpanda11@gmail.com>
Date: Wed, 14 Jan 2026 20:18:59 +0530
Subject: [PATCH 09/34] remove chaching part

Signed-off-by: Omswastik-11 <omswastikpanda11@gmail.com>
---
 openml/_api/resources/base.py           |  6 ++---
 openml/_api/resources/flows.py          | 30 +++++++------------------
 openml/flows/functions.py               | 24 +++++---------------
 tests/test_flows/test_flow_migration.py | 27 ++++------------------
 4 files changed, 20 insertions(+), 67 deletions(-)

diff --git a/openml/_api/resources/base.py b/openml/_api/resources/base.py
index 781445d78..2b465061a 100644
--- a/openml/_api/resources/base.py
+++ b/openml/_api/resources/base.py
@@ -38,15 +38,13 @@ class FlowsAPI(ResourceAPI, ABC):
     def get(
         self,
         flow_id: int,
-        *,
-        return_response: bool = False,
-    ) -> OpenMLFlow | tuple[OpenMLFlow, Response]: ...
+    ) -> OpenMLFlow: ...
 
     @abstractmethod
     def exists(self, name: str, external_version: str) -> int | bool: ...
 
     @abstractmethod
-    def list_page(
+    def list(
         self,
         *,
         limit: int | None = None,
diff --git a/openml/_api/resources/flows.py b/openml/_api/resources/flows.py
index 723455a44..05ac57954 100644
--- a/openml/_api/resources/flows.py
+++ b/openml/_api/resources/flows.py
@@ -1,6 +1,6 @@
 from __future__ import annotations
 
-from typing import TYPE_CHECKING, Any
+from typing import Any
 
 import pandas as pd
 import requests
@@ -9,17 +9,12 @@
 from openml._api.resources.base import FlowsAPI
 from openml.flows.flow import OpenMLFlow
 
-if TYPE_CHECKING:
-    from requests import Response
-
 
 class FlowsV1(FlowsAPI):
     def get(
         self,
         flow_id: int,
-        *,
-        return_response: bool = False,
-    ) -> OpenMLFlow | tuple[OpenMLFlow, Response]:
+    ) -> OpenMLFlow:
         """Get a flow from the OpenML server.
 
         Parameters
@@ -36,10 +31,7 @@ def get(
         """
         response = self._http.get(f"flow/{flow_id}")
         flow_xml = response.text
-        flow = OpenMLFlow._from_dict(xmltodict.parse(flow_xml))
-        if return_response:
-            return flow, response
-        return flow
+        return OpenMLFlow._from_dict(xmltodict.parse(flow_xml))
 
     def exists(self, name: str, external_version: str) -> int | bool:
         """Check if a flow exists on the OpenML server.
@@ -68,7 +60,7 @@ def exists(self, name: str, external_version: str) -> int | bool:
         flow_id = int(result_dict["oml:flow_exists"]["oml:id"])
         return flow_id if flow_id > 0 else False
 
-    def list_page(
+    def list(
         self,
         *,
         limit: int | None = None,
@@ -181,9 +173,7 @@ class FlowsV2(FlowsAPI):
     def get(
         self,
         flow_id: int,
-        *,
-        return_response: bool = False,
-    ) -> OpenMLFlow | tuple[OpenMLFlow, Response]:
+    ) -> OpenMLFlow:
         """Get a flow from the OpenML v2 server.
 
         Parameters
@@ -203,11 +193,7 @@ def get(
 
         # Convert v2 JSON to v1-compatible dict for OpenMLFlow._from_dict()
         flow_dict = self._convert_v2_to_v1_format(flow_json)
-        flow = OpenMLFlow._from_dict(flow_dict)
-
-        if return_response:
-            return flow, response
-        return flow
+        return OpenMLFlow._from_dict(flow_dict)
 
     def exists(self, name: str, external_version: str) -> int | bool:
         """Check if a flow exists on the OpenML v2 server.
@@ -238,7 +224,7 @@ def exists(self, name: str, external_version: str) -> int | bool:
             # v2 returns 404 when flow doesn't exist
             return False
 
-    def list_page(
+    def list(
         self,
         *,
         limit: int | None = None,
@@ -246,7 +232,7 @@ def list_page(
         tag: str | None = None,
         uploader: str | None = None,
     ) -> pd.DataFrame:
-        raise NotImplementedError("GET /flows (list) not yet implemented in v2 server")
+        raise NotImplementedError("flows (list) not yet implemented in v2 server")
 
     def create(self, flow: OpenMLFlow) -> OpenMLFlow:
         raise NotImplementedError("POST /flows (create) not yet implemented in v2 server")
diff --git a/openml/flows/functions.py b/openml/flows/functions.py
index c8241c088..9657ab04f 100644
--- a/openml/flows/functions.py
+++ b/openml/flows/functions.py
@@ -121,19 +121,7 @@ def _get_flow_description(flow_id: int) -> OpenMLFlow:
     except OpenMLCacheException:
         from openml._api import api_context
 
-        xml_file = (
-            openml.utils._create_cache_directory_for_id(FLOWS_CACHE_DIR_NAME, flow_id) / "flow.xml"
-        )
-        result = api_context.backend.flows.get(flow_id, return_response=True)
-
-        if isinstance(result, tuple):
-            flow, response = result
-            with xml_file.open("w", encoding="utf8") as fh:
-                fh.write(response.text)
-        else:
-            flow = result
-
-        return flow
+        return api_context.backend.flows.get(flow_id)
 
 
 def list_flows(
@@ -169,7 +157,9 @@ def list_flows(
             - external version
             - uploader
     """
-    listing_call = partial(_list_flows, tag=tag, uploader=uploader)
+    from openml._api import api_context
+
+    listing_call = partial(api_context.backend.flows.list, tag=tag, uploader=uploader)
     batches = openml.utils._list_all(listing_call, offset=offset, limit=size)
     if len(batches) == 0:
         return pd.DataFrame()
@@ -196,7 +186,7 @@ def _list_flows(limit: int, offset: int, **kwargs: Any) -> pd.DataFrame:
     """
     from openml._api import api_context
 
-    return api_context.backend.flows.list_page(
+    return api_context.backend.flows.list(
         limit=limit,
         offset=offset,
         tag=kwargs.get("tag"),
@@ -323,9 +313,7 @@ def __list_flows(api_call: str) -> pd.DataFrame:
         # Silently continue if parsing fails; all params default to None
         pass
 
-    return api_context.backend.flows.list_page(
-        limit=limit, offset=offset, tag=tag, uploader=uploader
-    )
+    return api_context.backend.flows.list(limit=limit, offset=offset, tag=tag, uploader=uploader)
 
 
 def _check_flow_for_server_id(flow: OpenMLFlow) -> None:
diff --git a/tests/test_flows/test_flow_migration.py b/tests/test_flows/test_flow_migration.py
index 4f7980407..cc1b98f1d 100644
--- a/tests/test_flows/test_flow_migration.py
+++ b/tests/test_flows/test_flow_migration.py
@@ -61,12 +61,11 @@ def test_list_flows_delegates_to_backend(monkeypatch):
         "uploader": ["u", "u"],
     }).set_index("id")
 
-    def fake_list_page(limit: int | None, offset: int | None, tag: str | None, uploader: str | None):
+    def fake_list(limit: int | None, offset: int | None, tag: str | None, uploader: str | None):
         calls.append((limit or 0, offset or 0, tag, uploader))
         return df
 
-    monkeypatch.setattr(api_context.backend.flows, "list_page", fake_list_page)
-
+    monkeypatch.setattr(api_context.backend.flows, "list", fake_list)
     result = openml.flows.list_flows(offset=0, size=5, tag="t", uploader="u")
 
     assert result.equals(df)
@@ -74,7 +73,7 @@ def fake_list_page(limit: int | None, offset: int | None, tag: str | None, uploa
     assert calls == [(5, 0, "t", "u")]
 
 
-def test_get_flow_description_fetches_and_caches(monkeypatch, tmp_path, dummy_flow):
+def test_get_flow_description_fetches_on_cache_miss(monkeypatch, tmp_path, dummy_flow):
     from openml._api import api_context
 
     # Force cache miss
@@ -83,21 +82,7 @@ def raise_cache(_fid: int) -> None:
 
     monkeypatch.setattr(flow_functions, "_get_cached_flow", raise_cache)
 
-    def fake_cache_dir(_key: str, id_: int):
-        path = tmp_path / str(id_)
-        path.mkdir(parents=True, exist_ok=True)
-        return path
-
-    monkeypatch.setattr(openml.utils, "_create_cache_directory_for_id", fake_cache_dir)
-
-    xml_text = "<oml:flow>test</oml:flow>"
-    response = requests.Response()
-    response.status_code = 200
-    response._content = xml_text.encode()
-
-    def fake_get(flow_id: int, *, return_response: bool = False):
-        if return_response:
-            return dummy_flow, response
+    def fake_get(flow_id: int):
         return dummy_flow
 
     monkeypatch.setattr(api_context.backend.flows, "get", fake_get)
@@ -105,10 +90,6 @@ def fake_get(flow_id: int, *, return_response: bool = False):
     flow = flow_functions._get_flow_description(123)
 
     assert flow is dummy_flow
-    cached = (tmp_path / "123" / "flow.xml").read_text()
-    assert cached == xml_text
-    cached = (tmp_path / "123" / "flow.xml").read_text()
-    assert cached == xml_text
 
 
 def test_delete_flow_delegates_to_backend(monkeypatch):

From 862b463a0d3422cad8cf0481034972d291549074 Mon Sep 17 00:00:00 2001
From: "pre-commit-ci[bot]"
 <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Date: Wed, 14 Jan 2026 15:10:03 +0000
Subject: [PATCH 10/34] [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci
---
 openml/_api/resources/__init__.py | 4 ++--
 openml/tasks/functions.py         | 3 +--
 2 files changed, 3 insertions(+), 4 deletions(-)

diff --git a/openml/_api/resources/__init__.py b/openml/_api/resources/__init__.py
index 060f5c701..ad3b37622 100644
--- a/openml/_api/resources/__init__.py
+++ b/openml/_api/resources/__init__.py
@@ -5,8 +5,8 @@
 __all__ = [
     "DatasetsV1",
     "DatasetsV2",
-    "TasksV1",
-    "TasksV2",
     "FlowsV1",
     "FlowsV2",
+    "TasksV1",
+    "TasksV2",
 ]
diff --git a/openml/tasks/functions.py b/openml/tasks/functions.py
index 2e9efa505..53f3120a9 100644
--- a/openml/tasks/functions.py
+++ b/openml/tasks/functions.py
@@ -12,7 +12,6 @@
 
 import openml._api_calls
 import openml.utils
-from openml._api import api_context
 from openml.datasets import get_dataset
 from openml.exceptions import OpenMLCacheException
 
@@ -445,7 +444,7 @@ def _get_task_description(task_id: int) -> OpenMLTask:
     except OpenMLCacheException:
         _cache_dir = openml.utils._create_cache_directory_for_id(TASKS_CACHE_DIR_NAME, task_id)
         xml_file = _cache_dir / "task.xml"
-        task_xml = openml._api_calls._perform_api_call(f"task/{task_id}", "get")
+        openml._api_calls._perform_api_call(f"task/{task_id}", "get")
 
         if isinstance(result, tuple):
             task, response = result

From 4c75e16890a76d8fbc0ddc125a267d23ddaded44 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Thu, 15 Jan 2026 14:51:22 +0500
Subject: [PATCH 11/34] undo changes in tasks/functions.py

---
 openml/tasks/functions.py | 14 ++++----------
 1 file changed, 4 insertions(+), 10 deletions(-)

diff --git a/openml/tasks/functions.py b/openml/tasks/functions.py
index a794ad56d..e9b879ae4 100644
--- a/openml/tasks/functions.py
+++ b/openml/tasks/functions.py
@@ -12,7 +12,6 @@
 
 import openml._api_calls
 import openml.utils
-from openml._api import api_context
 from openml.datasets import get_dataset
 from openml.exceptions import OpenMLCacheException
 
@@ -445,16 +444,11 @@ def _get_task_description(task_id: int) -> OpenMLTask:
     except OpenMLCacheException:
         _cache_dir = openml.utils._create_cache_directory_for_id(TASKS_CACHE_DIR_NAME, task_id)
         xml_file = _cache_dir / "task.xml"
-        result = api_context.backend.tasks.get(task_id, return_response=True)
+        task_xml = openml._api_calls._perform_api_call("task/%d" % task_id, "get")
 
-        if isinstance(result, tuple):
-            task, response = result
-            with xml_file.open("w", encoding="utf8") as fh:
-                fh.write(response.text)
-        else:
-            task = result
-
-        return task
+        with xml_file.open("w", encoding="utf8") as fh:
+            fh.write(task_xml)
+        return _create_task_from_xml(task_xml)
 
 
 def _create_task_from_xml(xml: str) -> OpenMLTask:

From c6033832e8008d0d8f94fa196d519e35f24030c3 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Wed, 21 Jan 2026 10:47:26 +0500
Subject: [PATCH 12/34] add tests directory

---
 tests/test_api/__init__.py | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 create mode 100644 tests/test_api/__init__.py

diff --git a/tests/test_api/__init__.py b/tests/test_api/__init__.py
new file mode 100644
index 000000000..e69de29bb

From ff6a8b05314e74bba7ad64388304a3708f83dbf0 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Wed, 21 Jan 2026 11:40:23 +0500
Subject: [PATCH 13/34] use enum for delay method

---
 openml/_api/config.py | 13 ++++++-------
 1 file changed, 6 insertions(+), 7 deletions(-)

diff --git a/openml/_api/config.py b/openml/_api/config.py
index 848fe8da1..13063df7a 100644
--- a/openml/_api/config.py
+++ b/openml/_api/config.py
@@ -1,9 +1,12 @@
 from __future__ import annotations
 
 from dataclasses import dataclass
-from typing import Literal
+from enum import Enum
 
-DelayMethod = Literal["human", "robot"]
+
+class DelayMethod(str, Enum):
+    HUMAN = "human"
+    ROBOT = "robot"
 
 
 @dataclass
@@ -23,13 +26,9 @@ class APISettings:
 @dataclass
 class ConnectionConfig:
     retries: int = 3
-    delay_method: DelayMethod = "human"
+    delay_method: DelayMethod = DelayMethod.HUMAN
     delay_time: int = 1  # seconds
 
-    def __post_init__(self) -> None:
-        if self.delay_method not in ("human", "robot"):
-            raise ValueError(f"delay_method must be 'human' or 'robot', got {self.delay_method}")
-
 
 @dataclass
 class CacheConfig:

From f01898fe88b397b0c981398650664e3ecb3f9b08 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Wed, 21 Jan 2026 11:41:33 +0500
Subject: [PATCH 14/34] implement cache

---
 openml/_api/http/client.py | 76 ++++++++++++++++++++++++++++++++++----
 1 file changed, 69 insertions(+), 7 deletions(-)

diff --git a/openml/_api/http/client.py b/openml/_api/http/client.py
index a90e93933..f76efe5a1 100644
--- a/openml/_api/http/client.py
+++ b/openml/_api/http/client.py
@@ -1,5 +1,7 @@
 from __future__ import annotations
 
+import json
+import time
 from pathlib import Path
 from typing import TYPE_CHECKING, Any
 from urllib.parse import urlencode, urljoin, urlparse
@@ -34,11 +36,70 @@ def _get_cache_dir(self, url: str, params: dict[str, Any]) -> Path:
 
         return Path(self.dir).joinpath(*netloc_parts, *path_parts, *params_part)
 
-    def _get_cache_response(self, cache_dir: Path) -> Response:  # noqa: ARG002
-        return Response()
+    def _get_cache_response(self, cache_dir: Path) -> Response:
+        if not cache_dir.exists():
+            raise FileNotFoundError(f"Cache directory not found: {cache_dir}")
 
-    def _set_cache_response(self, cache_dir: Path, response: Response) -> None:  # noqa: ARG002
-        return None
+        meta_path = cache_dir / "meta.json"
+        headers_path = cache_dir / "headers.json"
+        body_path = cache_dir / "body.bin"
+
+        if not (meta_path.exists() and headers_path.exists() and body_path.exists()):
+            raise FileNotFoundError(f"Incomplete cache at {cache_dir}")
+
+        with meta_path.open("r", encoding="utf-8") as f:
+            meta = json.load(f)
+
+        created_at = meta.get("created_at")
+        if created_at is None:
+            raise ValueError("Cache metadata missing 'created_at'")
+
+        if time.time() - created_at > self.ttl:
+            raise TimeoutError(f"Cache expired for {cache_dir}")
+
+        with headers_path.open("r", encoding="utf-8") as f:
+            headers = json.load(f)
+
+        body = body_path.read_bytes()
+
+        response = Response()
+        response.status_code = meta["status_code"]
+        response.url = meta["url"]
+        response.reason = meta["reason"]
+        response.headers = headers
+        response._content = body
+        response.encoding = meta["encoding"]
+
+        return response
+
+    def _set_cache_response(self, cache_dir: Path, response: Response) -> None:
+        cache_dir.mkdir(parents=True, exist_ok=True)
+
+        # body
+        (cache_dir / "body.bin").write_bytes(response.content)
+
+        # headers
+        with (cache_dir / "headers.json").open("w", encoding="utf-8") as f:
+            json.dump(dict(response.headers), f)
+
+        # meta
+        meta = {
+            "status_code": response.status_code,
+            "url": response.url,
+            "reason": response.reason,
+            "encoding": response.encoding,
+            "elapsed": response.elapsed.total_seconds(),
+            "created_at": time.time(),
+            "request": {
+                "method": response.request.method if response.request else None,
+                "url": response.request.url if response.request else None,
+                "headers": dict(response.request.headers) if response.request else None,
+                "body": response.request.body if response.request else None,
+            },
+        }
+
+        with (cache_dir / "meta.json").open("w", encoding="utf-8") as f:
+            json.dump(meta, f)
 
 
 class HTTPClient(CacheMixin):
@@ -88,7 +149,10 @@ def request(
         if use_cache:
             try:
                 return self._get_cache_response(cache_dir)
-            # TODO: handle ttl expired error
+            except FileNotFoundError:
+                pass
+            except TimeoutError:
+                pass
             except Exception:
                 raise
 
@@ -114,8 +178,6 @@ def get(
         use_api_key: bool = False,
         **request_kwargs: Any,
     ) -> Response:
-        # TODO: remove override when cache is implemented
-        use_cache = False
         return self.request(
             method="GET",
             path=path,

From 5c4511e60b0bc50aba2509bc48bb931082b0caf5 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Wed, 21 Jan 2026 13:36:05 +0500
Subject: [PATCH 15/34] refactor clients

---
 openml/_api/clients/__init__.py               |   6 +
 .../_api/{http/client.py => clients/http.py}  | 126 +++++++++---------
 .../_api/{http/utils.py => clients/minio.py}  |   0
 openml/_api/config.py                         |   6 +-
 openml/_api/http/__init__.py                  |   3 -
 openml/_api/runtime/core.py                   |  37 ++++-
 6 files changed, 101 insertions(+), 77 deletions(-)
 create mode 100644 openml/_api/clients/__init__.py
 rename openml/_api/{http/client.py => clients/http.py} (61%)
 rename openml/_api/{http/utils.py => clients/minio.py} (100%)
 delete mode 100644 openml/_api/http/__init__.py

diff --git a/openml/_api/clients/__init__.py b/openml/_api/clients/__init__.py
new file mode 100644
index 000000000..8a5ff94e4
--- /dev/null
+++ b/openml/_api/clients/__init__.py
@@ -0,0 +1,6 @@
+from .http import HTTPCache, HTTPClient
+
+__all__ = [
+    "HTTPCache",
+    "HTTPClient",
+]
diff --git a/openml/_api/http/client.py b/openml/_api/clients/http.py
similarity index 61%
rename from openml/_api/http/client.py
rename to openml/_api/clients/http.py
index f76efe5a1..4e126ee92 100644
--- a/openml/_api/http/client.py
+++ b/openml/_api/clients/http.py
@@ -10,42 +10,41 @@
 from requests import Response
 
 from openml.__version__ import __version__
-from openml._api.config import settings
 
 if TYPE_CHECKING:
-    from openml._api.config import APIConfig
+    from openml._api.config import DelayMethod
 
 
-class CacheMixin:
-    @property
-    def dir(self) -> str:
-        return settings.cache.dir
+class HTTPCache:
+    def __init__(self, *, path: Path, ttl: int) -> None:
+        self.path = path
+        self.ttl = ttl
 
-    @property
-    def ttl(self) -> int:
-        return settings.cache.ttl
-
-    def _get_cache_dir(self, url: str, params: dict[str, Any]) -> Path:
+    def get_key(self, url: str, params: dict[str, Any]) -> str:
         parsed_url = urlparse(url)
-        netloc_parts = parsed_url.netloc.split(".")[::-1]  # reverse domain
+        netloc_parts = parsed_url.netloc.split(".")[::-1]
         path_parts = parsed_url.path.strip("/").split("/")
 
-        # remove api_key and serialize params if any
         filtered_params = {k: v for k, v in params.items() if k != "api_key"}
         params_part = [urlencode(filtered_params)] if filtered_params else []
 
-        return Path(self.dir).joinpath(*netloc_parts, *path_parts, *params_part)
+        return str(Path(*netloc_parts, *path_parts, *params_part))
+
+    def _key_to_path(self, key: str) -> Path:
+        return self.path.joinpath(key)
+
+    def load(self, key: str) -> Response:
+        path = self._key_to_path(key)
 
-    def _get_cache_response(self, cache_dir: Path) -> Response:
-        if not cache_dir.exists():
-            raise FileNotFoundError(f"Cache directory not found: {cache_dir}")
+        if not path.exists():
+            raise FileNotFoundError(f"Cache directory not found: {path}")
 
-        meta_path = cache_dir / "meta.json"
-        headers_path = cache_dir / "headers.json"
-        body_path = cache_dir / "body.bin"
+        meta_path = path / "meta.json"
+        headers_path = path / "headers.json"
+        body_path = path / "body.bin"
 
         if not (meta_path.exists() and headers_path.exists() and body_path.exists()):
-            raise FileNotFoundError(f"Incomplete cache at {cache_dir}")
+            raise FileNotFoundError(f"Incomplete cache at {path}")
 
         with meta_path.open("r", encoding="utf-8") as f:
             meta = json.load(f)
@@ -55,7 +54,7 @@ def _get_cache_response(self, cache_dir: Path) -> Response:
             raise ValueError("Cache metadata missing 'created_at'")
 
         if time.time() - created_at > self.ttl:
-            raise TimeoutError(f"Cache expired for {cache_dir}")
+            raise TimeoutError(f"Cache expired for {path}")
 
         with headers_path.open("r", encoding="utf-8") as f:
             headers = json.load(f)
@@ -72,17 +71,15 @@ def _get_cache_response(self, cache_dir: Path) -> Response:
 
         return response
 
-    def _set_cache_response(self, cache_dir: Path, response: Response) -> None:
-        cache_dir.mkdir(parents=True, exist_ok=True)
+    def save(self, key: str, response: Response) -> None:
+        path = self._key_to_path(key)
+        path.mkdir(parents=True, exist_ok=True)
 
-        # body
-        (cache_dir / "body.bin").write_bytes(response.content)
+        (path / "body.bin").write_bytes(response.content)
 
-        # headers
-        with (cache_dir / "headers.json").open("w", encoding="utf-8") as f:
+        with (path / "headers.json").open("w", encoding="utf-8") as f:
             json.dump(dict(response.headers), f)
 
-        # meta
         meta = {
             "status_code": response.status_code,
             "url": response.url,
@@ -98,30 +95,33 @@ def _set_cache_response(self, cache_dir: Path, response: Response) -> None:
             },
         }
 
-        with (cache_dir / "meta.json").open("w", encoding="utf-8") as f:
+        with (path / "meta.json").open("w", encoding="utf-8") as f:
             json.dump(meta, f)
 
 
-class HTTPClient(CacheMixin):
-    def __init__(self, config: APIConfig) -> None:
-        self.config = config
-        self.headers: dict[str, str] = {"user-agent": f"openml-python/{__version__}"}
-
-    @property
-    def server(self) -> str:
-        return self.config.server
-
-    @property
-    def base_url(self) -> str:
-        return self.config.base_url
-
-    @property
-    def key(self) -> str:
-        return self.config.key
+class HTTPClient:
+    def __init__(  # noqa: PLR0913
+        self,
+        *,
+        server: str,
+        base_url: str,
+        api_key: str,
+        timeout: int,
+        retries: int,
+        delay_method: DelayMethod,
+        delay_time: int,
+        cache: HTTPCache | None = None,
+    ) -> None:
+        self.server = server
+        self.base_url = base_url
+        self.api_key = api_key
+        self.timeout = timeout
+        self.retries = retries
+        self.delay_method = delay_method
+        self.delay_time = delay_time
+        self.cache = cache
 
-    @property
-    def timeout(self) -> int:
-        return self.config.timeout
+        self.headers: dict[str, str] = {"user-agent": f"openml-python/{__version__}"}
 
     def request(
         self,
@@ -134,27 +134,25 @@ def request(
     ) -> Response:
         url = urljoin(self.server, urljoin(self.base_url, path))
 
-        params = request_kwargs.pop("params", {})
-        params = params.copy()
+        # prepare params
+        params = request_kwargs.pop("params", {}).copy()
         if use_api_key:
-            params["api_key"] = self.key
+            params["api_key"] = self.api_key
 
-        headers = request_kwargs.pop("headers", {})
-        headers = headers.copy()
+        # prepare headers
+        headers = request_kwargs.pop("headers", {}).copy()
         headers.update(self.headers)
 
         timeout = request_kwargs.pop("timeout", self.timeout)
-        cache_dir = self._get_cache_dir(url, params)
 
-        if use_cache:
+        if use_cache and self.cache is not None:
+            cache_key = self.cache.get_key(url, params)
             try:
-                return self._get_cache_response(cache_dir)
-            except FileNotFoundError:
-                pass
-            except TimeoutError:
-                pass
+                return self.cache.load(cache_key)
+            except (FileNotFoundError, TimeoutError):
+                pass  # cache miss or expired, continue
             except Exception:
-                raise
+                raise  # propagate unexpected cache errors
 
         response = requests.request(
             method=method,
@@ -165,8 +163,8 @@ def request(
             **request_kwargs,
         )
 
-        if use_cache:
-            self._set_cache_response(cache_dir, response)
+        if use_cache and self.cache is not None:
+            self.cache.save(cache_key, response)
 
         return response
 
diff --git a/openml/_api/http/utils.py b/openml/_api/clients/minio.py
similarity index 100%
rename from openml/_api/http/utils.py
rename to openml/_api/clients/minio.py
diff --git a/openml/_api/config.py b/openml/_api/config.py
index 13063df7a..aa153a556 100644
--- a/openml/_api/config.py
+++ b/openml/_api/config.py
@@ -13,7 +13,7 @@ class DelayMethod(str, Enum):
 class APIConfig:
     server: str
     base_url: str
-    key: str
+    api_key: str
     timeout: int = 10  # seconds
 
 
@@ -48,12 +48,12 @@ class Settings:
         v1=APIConfig(
             server="https://www.openml.org/",
             base_url="api/v1/xml/",
-            key="...",
+            api_key="...",
         ),
         v2=APIConfig(
             server="http://127.0.0.1:8001/",
             base_url="",
-            key="...",
+            api_key="...",
         ),
     ),
     connection=ConnectionConfig(),
diff --git a/openml/_api/http/__init__.py b/openml/_api/http/__init__.py
deleted file mode 100644
index 8e6d1e4ce..000000000
--- a/openml/_api/http/__init__.py
+++ /dev/null
@@ -1,3 +0,0 @@
-from openml._api.http.client import HTTPClient
-
-__all__ = ["HTTPClient"]
diff --git a/openml/_api/runtime/core.py b/openml/_api/runtime/core.py
index 98b587411..483b74d3d 100644
--- a/openml/_api/runtime/core.py
+++ b/openml/_api/runtime/core.py
@@ -1,9 +1,10 @@
 from __future__ import annotations
 
+from pathlib import Path
 from typing import TYPE_CHECKING
 
+from openml._api.clients import HTTPCache, HTTPClient
 from openml._api.config import settings
-from openml._api.http.client import HTTPClient
 from openml._api.resources import (
     DatasetsV1,
     DatasetsV2,
@@ -22,20 +23,42 @@ def __init__(self, *, datasets: DatasetsAPI, tasks: TasksAPI):
 
 
 def build_backend(version: str, *, strict: bool) -> APIBackend:
-    v1_http = HTTPClient(config=settings.api.v1)
-    v2_http = HTTPClient(config=settings.api.v2)
+    http_cache = HTTPCache(
+        path=Path(settings.cache.dir),
+        ttl=settings.cache.ttl,
+    )
+    v1_http_client = HTTPClient(
+        server=settings.api.v1.server,
+        base_url=settings.api.v1.base_url,
+        api_key=settings.api.v1.api_key,
+        timeout=settings.api.v1.timeout,
+        retries=settings.connection.retries,
+        delay_method=settings.connection.delay_method,
+        delay_time=settings.connection.delay_time,
+        cache=http_cache,
+    )
+    v2_http_client = HTTPClient(
+        server=settings.api.v2.server,
+        base_url=settings.api.v2.base_url,
+        api_key=settings.api.v2.api_key,
+        timeout=settings.api.v2.timeout,
+        retries=settings.connection.retries,
+        delay_method=settings.connection.delay_method,
+        delay_time=settings.connection.delay_time,
+        cache=http_cache,
+    )
 
     v1 = APIBackend(
-        datasets=DatasetsV1(v1_http),
-        tasks=TasksV1(v1_http),
+        datasets=DatasetsV1(v1_http_client),
+        tasks=TasksV1(v1_http_client),
     )
 
     if version == "v1":
         return v1
 
     v2 = APIBackend(
-        datasets=DatasetsV2(v2_http),
-        tasks=TasksV2(v2_http),
+        datasets=DatasetsV2(v2_http_client),
+        tasks=TasksV2(v2_http_client),
     )
 
     if strict:

From 29fac2c3043f74f27e7c28b8258f13c1ca8fb726 Mon Sep 17 00:00:00 2001
From: Omswastik-11 <omswastikpanda11@gmail.com>
Date: Wed, 21 Jan 2026 23:53:48 +0530
Subject: [PATCH 16/34] migrating v1 -> v2 flows

Signed-off-by: Omswastik-11 <omswastikpanda11@gmail.com>
---
 openml/_api/resources/flows.py | 69 ++++++++++++++++++++++++++++++----
 openml/_api/runtime/core.py    | 22 ++++++++++-
 openml/base.py                 | 23 ++++++------
 openml/flows/functions.py      | 52 -------------------------
 openml/tasks/functions.py      | 13 ++-----
 5 files changed, 97 insertions(+), 82 deletions(-)

diff --git a/openml/_api/resources/flows.py b/openml/_api/resources/flows.py
index 05ac57954..ad789fcef 100644
--- a/openml/_api/resources/flows.py
+++ b/openml/_api/resources/flows.py
@@ -7,6 +7,7 @@
 import xmltodict
 
 from openml._api.resources.base import FlowsAPI
+from openml.exceptions import OpenMLServerException
 from openml.flows.flow import OpenMLFlow
 
 
@@ -53,16 +54,31 @@ def exists(self, name: str, external_version: str) -> int | bool:
         if not (isinstance(external_version, str) and len(external_version) > 0):
             raise ValueError("Argument 'version' should be a non-empty string")
 
-        xml_response = self._http.post(
-            "flow/exists", data={"name": name, "external_version": external_version}
-        ).text
+        data = {"name": name, "external_version": external_version, "api_key": self._http.key}
+        # Avoid duplicating base_url when server already contains the API path
+        server = self._http.server
+        base = self._http.base_url
+        if base and base.strip("/") in server:
+            url = server.rstrip("/") + "/flow/exists"
+            response = requests.post(
+                url, data=data, headers=self._http.headers, timeout=self._http.timeout
+            )
+            xml_response = response.text
+        else:
+            xml_response = self._http.post("flow/exists", data=data).text
         result_dict = xmltodict.parse(xml_response)
+        # Detect error payloads and raise
+        if "oml:error" in result_dict:
+            err = result_dict["oml:error"]
+            code = int(err.get("oml:code", 0)) if "oml:code" in err else None
+            message = err.get("oml:message", "Server returned an error")
+            raise OpenMLServerException(message=message, code=code)
+
         flow_id = int(result_dict["oml:flow_exists"]["oml:id"])
         return flow_id if flow_id > 0 else False
 
     def list(
         self,
-        *,
         limit: int | None = None,
         offset: int | None = None,
         tag: str | None = None,
@@ -100,9 +116,28 @@ def list(
         if uploader is not None:
             api_call += f"/uploader/{uploader}"
 
-        xml_string = self._http.get(api_call).text
+        server = self._http.server
+        base = self._http.base_url
+        if base and base.strip("/") in server:
+            url = server.rstrip("/") + "/" + api_call
+            response = requests.get(
+                url,
+                headers=self._http.headers,
+                params={"api_key": self._http.key},
+                timeout=self._http.timeout,
+            )
+            xml_string = response.text
+        else:
+            response = self._http.get(api_call, use_api_key=True)
+            xml_string = response.text
         flows_dict = xmltodict.parse(xml_string, force_list=("oml:flow",))
 
+        if "oml:error" in flows_dict:
+            err = flows_dict["oml:error"]
+            code = int(err.get("oml:code", 0)) if "oml:code" in err else None
+            message = err.get("oml:message", "Server returned an error")
+            raise OpenMLServerException(message=message, code=code)
+
         assert isinstance(flows_dict["oml:flows"]["oml:flow"], list), type(flows_dict["oml:flows"])
         assert flows_dict["oml:flows"]["@xmlns:oml"] == "http://openml.org/openml", flows_dict[
             "oml:flows"
@@ -149,8 +184,26 @@ def create(self, flow: OpenMLFlow) -> OpenMLFlow:
         if "description" not in file_elements:
             file_elements["description"] = flow._to_xml()
 
-        # POST to server
-        response = self._http.post("flow", data=file_elements)
+        # POST to server (multipart/files). Ensure api_key is sent in the form data.
+        files = file_elements
+        data = {"api_key": self._http.key}
+        # If server already contains base path, post directly with requests to avoid double base_url
+        server = self._http.server
+        base = self._http.base_url
+        if base and base.strip("/") in server:
+            url = server.rstrip("/") + "/flow"
+            response = requests.post(
+                url, files=files, data=data, headers=self._http.headers, timeout=self._http.timeout
+            )
+        else:
+            response = self._http.post("flow", files=files, data=data)
+
+        parsed = xmltodict.parse(response.text)
+        if "oml:error" in parsed:
+            err = parsed["oml:error"]
+            code = int(err.get("oml:code", 0)) if "oml:code" in err else None
+            message = err.get("oml:message", "Server returned an error")
+            raise OpenMLServerException(message=message, code=code)
 
         # Parse response and update flow with server-assigned ID
         xml_response = xmltodict.parse(response.text)
@@ -258,7 +311,7 @@ def _convert_v2_to_v1_format(v2_json: dict[str, Any]) -> dict[str, dict]:
         flow_dict = {
             "oml:flow": {
                 "@xmlns:oml": "http://openml.org/openml",
-                "oml:id": str(v2_json.get("id", "")),
+                "oml:id": str(v2_json.get("id", "0")),
                 "oml:uploader": str(v2_json.get("uploader", "")),
                 "oml:name": v2_json.get("name", ""),
                 "oml:version": str(v2_json.get("version", "")),
diff --git a/openml/_api/runtime/core.py b/openml/_api/runtime/core.py
index 7668262fb..bf3614684 100644
--- a/openml/_api/runtime/core.py
+++ b/openml/_api/runtime/core.py
@@ -14,7 +14,8 @@
 )
 
 if TYPE_CHECKING:
-    from openml._api.resources.base import DatasetsAPI, FlowsAPI, TasksAPI
+    from openml._api.resources.base import DatasetsAPI, FlowsAPI, ResourceAPI, TasksAPI
+    from openml.base import OpenMLBase
 
 
 class APIBackend:
@@ -23,6 +24,25 @@ def __init__(self, *, datasets: DatasetsAPI, tasks: TasksAPI, flows: FlowsAPI):
         self.tasks = tasks
         self.flows = flows
 
+    def get_resource_for_entity(self, entity: OpenMLBase) -> ResourceAPI:
+        from openml.datasets.dataset import OpenMLDataset
+        from openml.flows.flow import OpenMLFlow
+        from openml.runs.run import OpenMLRun
+        from openml.study.study import OpenMLStudy
+        from openml.tasks.task import OpenMLTask
+
+        if isinstance(entity, OpenMLFlow):
+            return self.flows  # type: ignore
+        if isinstance(entity, OpenMLRun):
+            return self.runs  # type: ignore
+        if isinstance(entity, OpenMLDataset):
+            return self.datasets  # type: ignore
+        if isinstance(entity, OpenMLTask):
+            return self.tasks  # type: ignore
+        if isinstance(entity, OpenMLStudy):
+            return self.studies  # type: ignore
+        raise ValueError(f"No resource manager available for entity type {type(entity)}")
+
 
 def build_backend(version: str, *, strict: bool) -> APIBackend:
     v1_http = HTTPClient(config=settings.api.v1)
diff --git a/openml/base.py b/openml/base.py
index a282be8eb..b7a4877c1 100644
--- a/openml/base.py
+++ b/openml/base.py
@@ -11,7 +11,7 @@
 import openml._api_calls
 import openml.config
 
-from .utils import _get_rest_api_type_alias, _tag_openml_base
+from .utils import _tag_openml_base
 
 
 class OpenMLBase(ABC):
@@ -126,20 +126,19 @@ def _parse_publish_response(self, xml_response: dict[str, str]) -> None:
 
     def publish(self) -> OpenMLBase:
         """Publish the object on the OpenML server."""
-        file_elements = self._get_file_elements()
+        from openml._api import api_context
 
-        if "description" not in file_elements:
-            file_elements["description"] = self._to_xml()
+        # 1. Resolve the correct resource manager (e.g., Flows, Runs)
+        resource_manager = api_context.backend.get_resource_for_entity(self)
 
-        call = f"{_get_rest_api_type_alias(self)}/"
-        response_text = openml._api_calls._perform_api_call(
-            call,
-            "post",
-            file_elements=file_elements,
-        )
-        xml_response = xmltodict.parse(response_text)
+        # 2. Delegate creation to the backend (Handles V1/V2 switching internally)
+        # The backend returns the updated entity (with ID) or the ID itself.
+        published_entity = resource_manager.create(self)  # type: ignore
+
+        # 3. Update self with ID if not already done (V2 response handling)
+        if self.id is None and published_entity.id is not None:
+            self.id = published_entity.id  # type: ignore
 
-        self._parse_publish_response(xml_response)
         return self
 
     def open_in_browser(self) -> None:
diff --git a/openml/flows/functions.py b/openml/flows/functions.py
index 9dc394c7d..9a0bc6534 100644
--- a/openml/flows/functions.py
+++ b/openml/flows/functions.py
@@ -167,33 +167,6 @@ def list_flows(
     return pd.concat(batches)
 
 
-def _list_flows(limit: int, offset: int, **kwargs: Any) -> pd.DataFrame:
-    """
-    Perform the api call that return a list of all flows.
-
-    Parameters
-    ----------
-    limit : int
-        the maximum number of flows to return
-    offset : int
-        the number of flows to skip, starting from the first
-    kwargs: dict, optional
-        Legal filter operators: uploader, tag
-
-    Returns
-    -------
-    flows : dataframe
-    """
-    from openml._api import api_context
-
-    return api_context.backend.flows.list(
-        limit=limit,
-        offset=offset,
-        tag=kwargs.get("tag"),
-        uploader=kwargs.get("uploader"),
-    )
-
-
 def flow_exists(name: str, external_version: str) -> int | bool:
     """Retrieves the flow id.
 
@@ -291,31 +264,6 @@ def get_flow_id(
     return flows["id"].to_list()  # type: ignore[no-any-return]
 
 
-def __list_flows(api_call: str) -> pd.DataFrame:
-    """Backwards-compatible indirection; now routes via new backend."""
-    from openml._api import api_context
-
-    parts = api_call.split("/")
-    limit = None
-    offset = None
-    tag = None
-    uploader = None
-    try:
-        if "limit" in parts:
-            limit = int(parts[parts.index("limit") + 1])
-        if "offset" in parts:
-            offset = int(parts[parts.index("offset") + 1])
-        if "tag" in parts:
-            tag = parts[parts.index("tag") + 1]
-        if "uploader" in parts:
-            uploader = parts[parts.index("uploader") + 1]
-    except (ValueError, IndexError):
-        # Silently continue if parsing fails; all params default to None
-        pass
-
-    return api_context.backend.flows.list(limit=limit, offset=offset, tag=tag, uploader=uploader)
-
-
 def _check_flow_for_server_id(flow: OpenMLFlow) -> None:
     """Raises a ValueError if the flow or any of its subflows has no flow id."""
     # Depth-first search to check if all components were uploaded to the
diff --git a/openml/tasks/functions.py b/openml/tasks/functions.py
index 8c13d9f88..3df2861c0 100644
--- a/openml/tasks/functions.py
+++ b/openml/tasks/functions.py
@@ -444,16 +444,11 @@ def _get_task_description(task_id: int) -> OpenMLTask:
     except OpenMLCacheException:
         _cache_dir = openml.utils._create_cache_directory_for_id(TASKS_CACHE_DIR_NAME, task_id)
         xml_file = _cache_dir / "task.xml"
-        openml._api_calls._perform_api_call(f"task/{task_id}", "get")
+        task_xml = openml._api_calls._perform_api_call(f"task/{task_id}", "get")
 
-        if isinstance(result, tuple):
-            task, response = result
-            with xml_file.open("w", encoding="utf8") as fh:
-                fh.write(response.text)
-        else:
-            task = result
-
-        return task
+        with xml_file.open("w", encoding="utf8") as fh:
+            fh.write(task_xml)
+        return _create_task_from_xml(task_xml)
 
 
 def _create_task_from_xml(xml: str) -> OpenMLTask:

From bdf53f3eed99d48aa24c14cee40ba6babbc57478 Mon Sep 17 00:00:00 2001
From: Omswastik-11 <omswastikpanda11@gmail.com>
Date: Thu, 22 Jan 2026 00:01:48 +0530
Subject: [PATCH 17/34] migrating v1 -> v2 flows

Signed-off-by: Omswastik-11 <omswastikpanda11@gmail.com>
---
 openml/flows/functions.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/openml/flows/functions.py b/openml/flows/functions.py
index 9a0bc6534..28a3ffaa9 100644
--- a/openml/flows/functions.py
+++ b/openml/flows/functions.py
@@ -1,6 +1,7 @@
 # License: BSD 3-Clause
 from __future__ import annotations
 
+import os
 import re
 from collections import OrderedDict
 from functools import partial
@@ -30,7 +31,8 @@ def _get_cached_flows() -> OrderedDict:
     flows = OrderedDict()  # type: 'OrderedDict[int, OpenMLFlow]'
 
     flow_cache_dir = openml.utils._create_cache_directory(FLOWS_CACHE_DIR_NAME)
-    directory_content = sorted(p.name for p in flow_cache_dir.iterdir())
+    directory_content = os.listdir(flow_cache_dir)  # noqa : PTH208
+    directory_content.sort()
     # Find all flow ids for which we have downloaded
     # the flow description
 

From 43276d2ac56ba39d195b5d54d72bed2e61da3f79 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Fri, 23 Jan 2026 12:17:53 +0500
Subject: [PATCH 18/34] fix import in resources/base.py

---
 openml/_api/resources/base.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/openml/_api/resources/base.py b/openml/_api/resources/base.py
index 6fbf8977d..54b40a0e0 100644
--- a/openml/_api/resources/base.py
+++ b/openml/_api/resources/base.py
@@ -6,7 +6,7 @@
 if TYPE_CHECKING:
     from requests import Response
 
-    from openml._api.http import HTTPClient
+    from openml._api.clients import HTTPClient
     from openml.datasets.dataset import OpenMLDataset
     from openml.tasks.task import OpenMLTask
 

From 1206f697d09df82ed7f18bfea94a476844e01cb4 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Mon, 26 Jan 2026 13:52:20 +0500
Subject: [PATCH 19/34] refactor and add exception handling

---
 openml/_api/clients/http.py | 241 +++++++++++++++++++++++++++++++++---
 openml/_api/config.py       |   5 +-
 openml/_api/runtime/core.py |   6 +-
 3 files changed, 229 insertions(+), 23 deletions(-)

diff --git a/openml/_api/clients/http.py b/openml/_api/clients/http.py
index 4e126ee92..dc184074d 100644
--- a/openml/_api/clients/http.py
+++ b/openml/_api/clients/http.py
@@ -1,18 +1,28 @@
 from __future__ import annotations
 
 import json
+import logging
+import math
+import random
 import time
+import xml
+from collections.abc import Mapping
 from pathlib import Path
-from typing import TYPE_CHECKING, Any
+from typing import Any
 from urllib.parse import urlencode, urljoin, urlparse
 
 import requests
+import xmltodict
 from requests import Response
 
 from openml.__version__ import __version__
-
-if TYPE_CHECKING:
-    from openml._api.config import DelayMethod
+from openml._api.config import RetryPolicy
+from openml.exceptions import (
+    OpenMLNotAuthorizedError,
+    OpenMLServerError,
+    OpenMLServerException,
+    OpenMLServerNoResult,
+)
 
 
 class HTTPCache:
@@ -108,8 +118,7 @@ def __init__(  # noqa: PLR0913
         api_key: str,
         timeout: int,
         retries: int,
-        delay_method: DelayMethod,
-        delay_time: int,
+        retry_policy: RetryPolicy,
         cache: HTTPCache | None = None,
     ) -> None:
         self.server = server
@@ -117,12 +126,194 @@ def __init__(  # noqa: PLR0913
         self.api_key = api_key
         self.timeout = timeout
         self.retries = retries
-        self.delay_method = delay_method
-        self.delay_time = delay_time
+        self.retry_policy = retry_policy
         self.cache = cache
 
+        self.retry_func = (
+            self._human_delay if retry_policy == RetryPolicy.HUMAN else self._robot_delay
+        )
         self.headers: dict[str, str] = {"user-agent": f"openml-python/{__version__}"}
 
+    def _robot_delay(self, n: int) -> float:
+        wait = (1 / (1 + math.exp(-(n * 0.5 - 4)))) * 60
+        variation = random.gauss(0, wait / 10)
+        return max(1.0, wait + variation)
+
+    def _human_delay(self, n: int) -> float:
+        return max(1.0, n)
+
+    def _parse_exception_response(
+        self,
+        response: Response,
+    ) -> tuple[int | None, str]:
+        content_type = response.headers.get("Content-Type", "").lower()
+
+        if "json" in content_type:
+            server_exception = response.json()
+            server_error = server_exception["detail"]
+            code = server_error.get("code")
+            message = server_error.get("message")
+            additional_information = server_error.get("additional_information")
+        else:
+            server_exception = xmltodict.parse(response.text)
+            server_error = server_exception["oml:error"]
+            code = server_error.get("oml:code")
+            message = server_error.get("oml:message")
+            additional_information = server_error.get("oml:additional_information")
+
+        if code is not None:
+            code = int(code)
+
+        if message and additional_information:
+            full_message = f"{message} - {additional_information}"
+        elif message:
+            full_message = message
+        elif additional_information:
+            full_message = additional_information
+        else:
+            full_message = ""
+
+        return code, full_message
+
+    def _raise_code_specific_error(
+        self,
+        code: int,
+        message: str,
+        url: str,
+        files: Mapping[str, Any] | None,
+    ) -> None:
+        if code in [111, 372, 512, 500, 482, 542, 674]:
+            # 512 for runs, 372 for datasets, 500 for flows
+            # 482 for tasks, 542 for evaluations, 674 for setups
+            # 111 for dataset descriptions
+            raise OpenMLServerNoResult(code=code, message=message, url=url)
+
+        # 163: failure to validate flow XML (https://www.openml.org/api_docs#!/flow/post_flow)
+        if code in [163] and files is not None and "description" in files:
+            # file_elements['description'] is the XML file description of the flow
+            message = f"\n{files['description']}\n{message}"
+
+        if code in [
+            102,  # flow/exists post
+            137,  # dataset post
+            350,  # dataset/42 delete
+            310,  # flow/<something> post
+            320,  # flow/42 delete
+            400,  # run/42 delete
+            460,  # task/42 delete
+        ]:
+            raise OpenMLNotAuthorizedError(
+                message=(
+                    f"The API call {url} requires authentication via an API key.\nPlease configure "
+                    "OpenML-Python to use your API as described in this example:"
+                    "\nhttps://openml.github.io/openml-python/latest/examples/Basics/introduction_tutorial/#authentication"
+                )
+            )
+
+        # Propagate all server errors to the calling functions, except
+        # for 107 which represents a database connection error.
+        # These are typically caused by high server load,
+        # which means trying again might resolve the issue.
+        # DATABASE_CONNECTION_ERRCODE
+        if code != 107:
+            raise OpenMLServerException(code=code, message=message, url=url)
+
+    def _validate_response(
+        self,
+        method: str,
+        url: str,
+        files: Mapping[str, Any] | None,
+        response: Response,
+    ) -> Exception | None:
+        if (
+            "Content-Encoding" not in response.headers
+            or response.headers["Content-Encoding"] != "gzip"
+        ):
+            logging.warning(f"Received uncompressed content from OpenML for {url}.")
+
+        if response.status_code == 200:
+            return None
+
+        if response.status_code == requests.codes.URI_TOO_LONG:
+            raise OpenMLServerError(f"URI too long! ({url})")
+
+        retry_raise_e: Exception | None = None
+
+        try:
+            code, message = self._parse_exception_response(response)
+
+        except (requests.exceptions.JSONDecodeError, xml.parsers.expat.ExpatError) as e:
+            if method != "GET":
+                extra = f"Status code: {response.status_code}\n{response.text}"
+                raise OpenMLServerError(
+                    f"Unexpected server error when calling {url}. Please contact the "
+                    f"developers!\n{extra}"
+                ) from e
+
+            retry_raise_e = e
+
+        except Exception as e:
+            # If we failed to parse it out,
+            # then something has gone wrong in the body we have sent back
+            # from the server and there is little extra information we can capture.
+            raise OpenMLServerError(
+                f"Unexpected server error when calling {url}. Please contact the developers!\n"
+                f"Status code: {response.status_code}\n{response.text}",
+            ) from e
+
+        if code is not None:
+            self._raise_code_specific_error(
+                code=code,
+                message=message,
+                url=url,
+                files=files,
+            )
+
+        if retry_raise_e is None:
+            retry_raise_e = OpenMLServerException(code=code, message=message, url=url)
+
+        return retry_raise_e
+
+    def _request(  # noqa: PLR0913
+        self,
+        method: str,
+        url: str,
+        params: Mapping[str, Any],
+        headers: Mapping[str, str],
+        timeout: float | int,
+        files: Mapping[str, Any] | None,
+        **request_kwargs: Any,
+    ) -> tuple[Response | None, Exception | None]:
+        retry_raise_e: Exception | None = None
+        response: Response | None = None
+
+        try:
+            response = requests.request(
+                method=method,
+                url=url,
+                params=params,
+                headers=headers,
+                timeout=timeout,
+                files=files,
+                **request_kwargs,
+            )
+        except (
+            requests.exceptions.ChunkedEncodingError,
+            requests.exceptions.ConnectionError,
+            requests.exceptions.SSLError,
+        ) as e:
+            retry_raise_e = e
+
+        if response is not None:
+            retry_raise_e = self._validate_response(
+                method=method,
+                url=url,
+                files=files,
+                response=response,
+            )
+
+        return response, retry_raise_e
+
     def request(
         self,
         method: str,
@@ -133,6 +324,7 @@ def request(
         **request_kwargs: Any,
     ) -> Response:
         url = urljoin(self.server, urljoin(self.base_url, path))
+        retries = max(1, self.retries)
 
         # prepare params
         params = request_kwargs.pop("params", {}).copy()
@@ -144,6 +336,9 @@ def request(
         headers.update(self.headers)
 
         timeout = request_kwargs.pop("timeout", self.timeout)
+        files = request_kwargs.pop("files", None)
+
+        use_cache = False
 
         if use_cache and self.cache is not None:
             cache_key = self.cache.get_key(url, params)
@@ -154,14 +349,28 @@ def request(
             except Exception:
                 raise  # propagate unexpected cache errors
 
-        response = requests.request(
-            method=method,
-            url=url,
-            params=params,
-            headers=headers,
-            timeout=timeout,
-            **request_kwargs,
-        )
+        for retry_counter in range(1, retries + 1):
+            response, retry_raise_e = self._request(
+                method=method,
+                url=url,
+                params=params,
+                headers=headers,
+                timeout=timeout,
+                files=files,
+                **request_kwargs,
+            )
+
+            # executed successfully
+            if retry_raise_e is None:
+                break
+            # tries completed
+            if retry_counter >= retries:
+                raise retry_raise_e
+
+            delay = self.retry_func(retry_counter)
+            time.sleep(delay)
+
+        assert response is not None
 
         if use_cache and self.cache is not None:
             self.cache.save(cache_key, response)
diff --git a/openml/_api/config.py b/openml/_api/config.py
index aa153a556..6cce06403 100644
--- a/openml/_api/config.py
+++ b/openml/_api/config.py
@@ -4,7 +4,7 @@
 from enum import Enum
 
 
-class DelayMethod(str, Enum):
+class RetryPolicy(str, Enum):
     HUMAN = "human"
     ROBOT = "robot"
 
@@ -26,8 +26,7 @@ class APISettings:
 @dataclass
 class ConnectionConfig:
     retries: int = 3
-    delay_method: DelayMethod = DelayMethod.HUMAN
-    delay_time: int = 1  # seconds
+    retry_policy: RetryPolicy = RetryPolicy.HUMAN
 
 
 @dataclass
diff --git a/openml/_api/runtime/core.py b/openml/_api/runtime/core.py
index 483b74d3d..25f2649ee 100644
--- a/openml/_api/runtime/core.py
+++ b/openml/_api/runtime/core.py
@@ -33,8 +33,7 @@ def build_backend(version: str, *, strict: bool) -> APIBackend:
         api_key=settings.api.v1.api_key,
         timeout=settings.api.v1.timeout,
         retries=settings.connection.retries,
-        delay_method=settings.connection.delay_method,
-        delay_time=settings.connection.delay_time,
+        retry_policy=settings.connection.retry_policy,
         cache=http_cache,
     )
     v2_http_client = HTTPClient(
@@ -43,8 +42,7 @@ def build_backend(version: str, *, strict: bool) -> APIBackend:
         api_key=settings.api.v2.api_key,
         timeout=settings.api.v2.timeout,
         retries=settings.connection.retries,
-        delay_method=settings.connection.delay_method,
-        delay_time=settings.connection.delay_time,
+        retry_policy=settings.connection.retry_policy,
         cache=http_cache,
     )
 

From 4948e991f96821372934c7132f4a695da165d17b Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Mon, 26 Jan 2026 20:43:32 +0500
Subject: [PATCH 20/34] refactor resources/base/

---
 openml/_api/resources/base/__init__.py        | 13 ++++++
 openml/_api/resources/base/base.py            | 41 +++++++++++++++++++
 .../resources/{base.py => base/resources.py}  | 16 ++++----
 openml/_api/resources/base/versions.py        | 23 +++++++++++
 openml/_api/resources/datasets.py             |  6 +--
 openml/_api/resources/tasks.py                |  6 +--
 6 files changed, 91 insertions(+), 14 deletions(-)
 create mode 100644 openml/_api/resources/base/__init__.py
 create mode 100644 openml/_api/resources/base/base.py
 rename openml/_api/resources/{base.py => base/resources.py} (64%)
 create mode 100644 openml/_api/resources/base/versions.py

diff --git a/openml/_api/resources/base/__init__.py b/openml/_api/resources/base/__init__.py
new file mode 100644
index 000000000..851cfe942
--- /dev/null
+++ b/openml/_api/resources/base/__init__.py
@@ -0,0 +1,13 @@
+from openml._api.resources.base.base import APIVersion, ResourceAPI, ResourceType
+from openml._api.resources.base.resources import DatasetsAPI, TasksAPI
+from openml._api.resources.base.versions import ResourceV1, ResourceV2
+
+__all__ = [
+    "APIVersion",
+    "DatasetsAPI",
+    "ResourceAPI",
+    "ResourceType",
+    "ResourceV1",
+    "ResourceV2",
+    "TasksAPI",
+]
diff --git a/openml/_api/resources/base/base.py b/openml/_api/resources/base/base.py
new file mode 100644
index 000000000..8d85d054b
--- /dev/null
+++ b/openml/_api/resources/base/base.py
@@ -0,0 +1,41 @@
+from __future__ import annotations
+
+from abc import ABC, abstractmethod
+from enum import Enum
+from typing import TYPE_CHECKING
+
+if TYPE_CHECKING:
+    from openml._api.clients import HTTPClient
+
+
+class APIVersion(str, Enum):
+    V1 = "v1"
+    V2 = "v2"
+
+
+class ResourceType(str, Enum):
+    DATASETS = "datasets"
+    TASKS = "tasks"
+
+
+class ResourceAPI(ABC):
+    api_version: APIVersion | None = None
+    resource_type: ResourceType | None = None
+
+    def __init__(self, http: HTTPClient):
+        self._http = http
+
+    def _raise_not_implemented_error(self, method_name: str | None = None) -> None:
+        version = getattr(self.api_version, "name", "Unknown version")
+        resource = getattr(self.resource_type, "name", "Unknown resource")
+        method_info = f" Method: {method_name}" if method_name else ""
+        raise NotImplementedError(
+            f"{self.__class__.__name__}: {version} API does not support this "
+            f"functionality for resource: {resource}.{method_info}"
+        )
+
+    @abstractmethod
+    def delete(self) -> None: ...
+
+    @abstractmethod
+    def publish(self) -> None: ...
diff --git a/openml/_api/resources/base.py b/openml/_api/resources/base/resources.py
similarity index 64%
rename from openml/_api/resources/base.py
rename to openml/_api/resources/base/resources.py
index 54b40a0e0..edb26c91c 100644
--- a/openml/_api/resources/base.py
+++ b/openml/_api/resources/base/resources.py
@@ -1,27 +1,27 @@
 from __future__ import annotations
 
-from abc import ABC, abstractmethod
+from abc import abstractmethod
 from typing import TYPE_CHECKING
 
+from openml._api.resources.base import ResourceAPI, ResourceType
+
 if TYPE_CHECKING:
     from requests import Response
 
-    from openml._api.clients import HTTPClient
     from openml.datasets.dataset import OpenMLDataset
     from openml.tasks.task import OpenMLTask
 
 
-class ResourceAPI:
-    def __init__(self, http: HTTPClient):
-        self._http = http
-
+class DatasetsAPI(ResourceAPI):
+    resource_type: ResourceType | None = ResourceType.DATASETS
 
-class DatasetsAPI(ResourceAPI, ABC):
     @abstractmethod
     def get(self, dataset_id: int) -> OpenMLDataset | tuple[OpenMLDataset, Response]: ...
 
 
-class TasksAPI(ResourceAPI, ABC):
+class TasksAPI(ResourceAPI):
+    resource_type: ResourceType | None = ResourceType.TASKS
+
     @abstractmethod
     def get(
         self,
diff --git a/openml/_api/resources/base/versions.py b/openml/_api/resources/base/versions.py
new file mode 100644
index 000000000..8a81517e5
--- /dev/null
+++ b/openml/_api/resources/base/versions.py
@@ -0,0 +1,23 @@
+from __future__ import annotations
+
+from openml._api.resources.base import APIVersion, ResourceAPI
+
+
+class ResourceV1(ResourceAPI):
+    api_version: APIVersion | None = APIVersion.V1
+
+    def delete(self) -> None:
+        pass
+
+    def publish(self) -> None:
+        pass
+
+
+class ResourceV2(ResourceAPI):
+    api_version: APIVersion | None = APIVersion.V2
+
+    def delete(self) -> None:
+        self._raise_not_implemented_error("delete")
+
+    def publish(self) -> None:
+        self._raise_not_implemented_error("publish")
diff --git a/openml/_api/resources/datasets.py b/openml/_api/resources/datasets.py
index 9ff1ec278..f3a49a84f 100644
--- a/openml/_api/resources/datasets.py
+++ b/openml/_api/resources/datasets.py
@@ -2,7 +2,7 @@
 
 from typing import TYPE_CHECKING
 
-from openml._api.resources.base import DatasetsAPI
+from openml._api.resources.base import DatasetsAPI, ResourceV1, ResourceV2
 
 if TYPE_CHECKING:
     from responses import Response
@@ -10,11 +10,11 @@
     from openml.datasets.dataset import OpenMLDataset
 
 
-class DatasetsV1(DatasetsAPI):
+class DatasetsV1(ResourceV1, DatasetsAPI):
     def get(self, dataset_id: int) -> OpenMLDataset | tuple[OpenMLDataset, Response]:
         raise NotImplementedError
 
 
-class DatasetsV2(DatasetsAPI):
+class DatasetsV2(ResourceV2, DatasetsAPI):
     def get(self, dataset_id: int) -> OpenMLDataset | tuple[OpenMLDataset, Response]:
         raise NotImplementedError
diff --git a/openml/_api/resources/tasks.py b/openml/_api/resources/tasks.py
index f494fb9a3..a7ca39208 100644
--- a/openml/_api/resources/tasks.py
+++ b/openml/_api/resources/tasks.py
@@ -4,7 +4,7 @@
 
 import xmltodict
 
-from openml._api.resources.base import TasksAPI
+from openml._api.resources.base import ResourceV1, ResourceV2, TasksAPI
 from openml.tasks.task import (
     OpenMLClassificationTask,
     OpenMLClusteringTask,
@@ -18,7 +18,7 @@
     from requests import Response
 
 
-class TasksV1(TasksAPI):
+class TasksV1(ResourceV1, TasksAPI):
     def get(
         self,
         task_id: int,
@@ -118,7 +118,7 @@ def _create_task_from_xml(self, xml: str) -> OpenMLTask:
         return cls(**common_kwargs)  # type: ignore
 
 
-class TasksV2(TasksAPI):
+class TasksV2(ResourceV2, TasksAPI):
     def get(
         self,
         task_id: int,

From a3541675fd6452e68f268127df7c583bb9c2d0ca Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Mon, 26 Jan 2026 21:06:20 +0500
Subject: [PATCH 21/34] implement delete

---
 openml/_api/resources/base/base.py      | 23 +++++---
 openml/_api/resources/base/resources.py |  4 +-
 openml/_api/resources/base/versions.py  | 76 ++++++++++++++++++++++---
 3 files changed, 86 insertions(+), 17 deletions(-)

diff --git a/openml/_api/resources/base/base.py b/openml/_api/resources/base/base.py
index 8d85d054b..9b1803508 100644
--- a/openml/_api/resources/base/base.py
+++ b/openml/_api/resources/base/base.py
@@ -14,28 +14,37 @@ class APIVersion(str, Enum):
 
 
 class ResourceType(str, Enum):
-    DATASETS = "datasets"
-    TASKS = "tasks"
+    DATASET = "dataset"
+    TASK = "task"
+    TASK_TYPE = "task_type"
+    EVALUATION_MEASURE = "evaluation_measure"
+    ESTIMATION_PROCEDURE = "estimation_procedure"
+    EVALUATION = "evaluation"
+    FLOW = "flow"
+    STUDY = "study"
+    RUN = "run"
+    SETUP = "setup"
+    USER = "user"
 
 
 class ResourceAPI(ABC):
-    api_version: APIVersion | None = None
-    resource_type: ResourceType | None = None
+    api_version: APIVersion
+    resource_type: ResourceType
 
     def __init__(self, http: HTTPClient):
         self._http = http
 
-    def _raise_not_implemented_error(self, method_name: str | None = None) -> None:
+    def _get_not_implemented_message(self, method_name: str | None = None) -> str:
         version = getattr(self.api_version, "name", "Unknown version")
         resource = getattr(self.resource_type, "name", "Unknown resource")
         method_info = f" Method: {method_name}" if method_name else ""
-        raise NotImplementedError(
+        return (
             f"{self.__class__.__name__}: {version} API does not support this "
             f"functionality for resource: {resource}.{method_info}"
         )
 
     @abstractmethod
-    def delete(self) -> None: ...
+    def delete(self, resource_id: int) -> bool: ...
 
     @abstractmethod
     def publish(self) -> None: ...
diff --git a/openml/_api/resources/base/resources.py b/openml/_api/resources/base/resources.py
index edb26c91c..55cb95c0d 100644
--- a/openml/_api/resources/base/resources.py
+++ b/openml/_api/resources/base/resources.py
@@ -13,14 +13,14 @@
 
 
 class DatasetsAPI(ResourceAPI):
-    resource_type: ResourceType | None = ResourceType.DATASETS
+    resource_type: ResourceType = ResourceType.DATASET
 
     @abstractmethod
     def get(self, dataset_id: int) -> OpenMLDataset | tuple[OpenMLDataset, Response]: ...
 
 
 class TasksAPI(ResourceAPI):
-    resource_type: ResourceType | None = ResourceType.TASKS
+    resource_type: ResourceType = ResourceType.TASK
 
     @abstractmethod
     def get(
diff --git a/openml/_api/resources/base/versions.py b/openml/_api/resources/base/versions.py
index 8a81517e5..ce7b02057 100644
--- a/openml/_api/resources/base/versions.py
+++ b/openml/_api/resources/base/versions.py
@@ -1,23 +1,83 @@
 from __future__ import annotations
 
-from openml._api.resources.base import APIVersion, ResourceAPI
+import xmltodict
+
+from openml._api.resources.base import APIVersion, ResourceAPI, ResourceType
+from openml.exceptions import (
+    OpenMLNotAuthorizedError,
+    OpenMLServerError,
+    OpenMLServerException,
+)
 
 
 class ResourceV1(ResourceAPI):
-    api_version: APIVersion | None = APIVersion.V1
+    api_version: APIVersion = APIVersion.V1
 
-    def delete(self) -> None:
-        pass
+    def delete(self, resource_id: int) -> bool:
+        if self.resource_type == ResourceType.DATASET:
+            resource_type = "data"
+        else:
+            resource_type = self.resource_type.name
+
+        legal_resources = {
+            "data",
+            "flow",
+            "task",
+            "run",
+            "study",
+            "user",
+        }
+        if resource_type not in legal_resources:
+            raise ValueError(f"Can't delete a {resource_type}")
+
+        url_suffix = f"{resource_type}/{resource_id}"
+        try:
+            response = self._http.delete(url_suffix)
+            result = xmltodict.parse(response.content)
+            return f"oml:{resource_type}_delete" in result
+        except OpenMLServerException as e:
+            # https://github.com/openml/OpenML/blob/21f6188d08ac24fcd2df06ab94cf421c946971b0/openml_OS/views/pages/api_new/v1/xml/pre.php
+            # Most exceptions are descriptive enough to be raised as their standard
+            # OpenMLServerException, however there are two cases where we add information:
+            #  - a generic "failed" message, we direct them to the right issue board
+            #  - when the user successfully authenticates with the server,
+            #    but user is not allowed to take the requested action,
+            #    in which case we specify a OpenMLNotAuthorizedError.
+            by_other_user = [323, 353, 393, 453, 594]
+            has_dependent_entities = [324, 326, 327, 328, 354, 454, 464, 595]
+            unknown_reason = [325, 355, 394, 455, 593]
+            if e.code in by_other_user:
+                raise OpenMLNotAuthorizedError(
+                    message=(
+                        f"The {resource_type} can not be deleted "
+                        "because it was not uploaded by you."
+                    ),
+                ) from e
+            if e.code in has_dependent_entities:
+                raise OpenMLNotAuthorizedError(
+                    message=(
+                        f"The {resource_type} can not be deleted because "
+                        f"it still has associated entities: {e.message}"
+                    ),
+                ) from e
+            if e.code in unknown_reason:
+                raise OpenMLServerError(
+                    message=(
+                        f"The {resource_type} can not be deleted for unknown reason,"
+                        " please open an issue at: https://github.com/openml/openml/issues/new"
+                    ),
+                ) from e
+            raise e
 
     def publish(self) -> None:
         pass
 
 
 class ResourceV2(ResourceAPI):
-    api_version: APIVersion | None = APIVersion.V2
+    api_version: APIVersion = APIVersion.V2
 
-    def delete(self) -> None:
-        self._raise_not_implemented_error("delete")
+    def delete(self, resource_id: int) -> bool:
+        raise NotImplementedError(self._get_not_implemented_message("publish"))
 
     def publish(self) -> None:
-        self._raise_not_implemented_error("publish")
+        raise NotImplementedError(self._get_not_implemented_message("publish"))

From 1fe7e3ed8561945c20e8433603046a35484c37e7 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Tue, 27 Jan 2026 12:56:35 +0500
Subject: [PATCH 22/34] implement publish and minor refactoring

---
 openml/_api/clients/http.py            |   2 -
 openml/_api/resources/base/base.py     |  15 ++--
 openml/_api/resources/base/versions.py | 113 ++++++++++++++++---------
 3 files changed, 82 insertions(+), 48 deletions(-)

diff --git a/openml/_api/clients/http.py b/openml/_api/clients/http.py
index dc184074d..1622087c9 100644
--- a/openml/_api/clients/http.py
+++ b/openml/_api/clients/http.py
@@ -338,8 +338,6 @@ def request(
         timeout = request_kwargs.pop("timeout", self.timeout)
         files = request_kwargs.pop("files", None)
 
-        use_cache = False
-
         if use_cache and self.cache is not None:
             cache_key = self.cache.get_key(url, params)
             try:
diff --git a/openml/_api/resources/base/base.py b/openml/_api/resources/base/base.py
index 9b1803508..f2d7d1e88 100644
--- a/openml/_api/resources/base/base.py
+++ b/openml/_api/resources/base/base.py
@@ -5,6 +5,9 @@
 from typing import TYPE_CHECKING
 
 if TYPE_CHECKING:
+    from collections.abc import Mapping
+    from typing import Any
+
     from openml._api.clients import HTTPClient
 
 
@@ -34,6 +37,12 @@ class ResourceAPI(ABC):
     def __init__(self, http: HTTPClient):
         self._http = http
 
+    @abstractmethod
+    def delete(self, resource_id: int) -> bool: ...
+
+    @abstractmethod
+    def publish(self, path: str, files: Mapping[str, Any] | None) -> int: ...
+
     def _get_not_implemented_message(self, method_name: str | None = None) -> str:
         version = getattr(self.api_version, "name", "Unknown version")
         resource = getattr(self.resource_type, "name", "Unknown resource")
@@ -42,9 +51,3 @@ def _get_not_implemented_message(self, method_name: str | None = None) -> str:
             f"{self.__class__.__name__}: {version} API does not support this "
             f"functionality for resource: {resource}.{method_info}"
         )
-
-    @abstractmethod
-    def delete(self, resource_id: int) -> bool: ...
-
-    @abstractmethod
-    def publish(self) -> None: ...
diff --git a/openml/_api/resources/base/versions.py b/openml/_api/resources/base/versions.py
index ce7b02057..41f883ebe 100644
--- a/openml/_api/resources/base/versions.py
+++ b/openml/_api/resources/base/versions.py
@@ -1,5 +1,8 @@
 from __future__ import annotations
 
+from collections.abc import Mapping
+from typing import Any
+
 import xmltodict
 
 from openml._api.resources.base import APIVersion, ResourceAPI, ResourceType
@@ -13,6 +16,11 @@
 class ResourceV1(ResourceAPI):
     api_version: APIVersion = APIVersion.V1
 
+    def publish(self, path: str, files: Mapping[str, Any] | None) -> int:
+        response = self._http.post(path, files=files)
+        parsed_response = xmltodict.parse(response.content)
+        return self._extract_id_from_upload(parsed_response)
+
     def delete(self, resource_id: int) -> bool:
         if self.resource_type == ResourceType.DATASET:
             resource_type = "data"
@@ -30,54 +38,79 @@ def delete(self, resource_id: int) -> bool:
         if resource_type not in legal_resources:
             raise ValueError(f"Can't delete a {resource_type}")
 
-        url_suffix = f"{resource_type}/{resource_id}"
+        path = f"{resource_type}/{resource_id}"
         try:
-            response = self._http.delete(url_suffix)
+            response = self._http.delete(path)
             result = xmltodict.parse(response.content)
             return f"oml:{resource_type}_delete" in result
         except OpenMLServerException as e:
-            # https://github.com/openml/OpenML/blob/21f6188d08ac24fcd2df06ab94cf421c946971b0/openml_OS/views/pages/api_new/v1/xml/pre.php
-            # Most exceptions are descriptive enough to be raised as their standard
-            # OpenMLServerException, however there are two cases where we add information:
-            #  - a generic "failed" message, we direct them to the right issue board
-            #  - when the user successfully authenticates with the server,
-            #    but user is not allowed to take the requested action,
-            #    in which case we specify a OpenMLNotAuthorizedError.
-            by_other_user = [323, 353, 393, 453, 594]
-            has_dependent_entities = [324, 326, 327, 328, 354, 454, 464, 595]
-            unknown_reason = [325, 355, 394, 455, 593]
-            if e.code in by_other_user:
-                raise OpenMLNotAuthorizedError(
-                    message=(
-                        f"The {resource_type} can not be deleted "
-                        "because it was not uploaded by you."
-                    ),
-                ) from e
-            if e.code in has_dependent_entities:
-                raise OpenMLNotAuthorizedError(
-                    message=(
-                        f"The {resource_type} can not be deleted because "
-                        f"it still has associated entities: {e.message}"
-                    ),
-                ) from e
-            if e.code in unknown_reason:
-                raise OpenMLServerError(
-                    message=(
-                        f"The {resource_type} can not be deleted for unknown reason,"
-                        " please open an issue at: https://github.com/openml/openml/issues/new"
-                    ),
-                ) from e
-            raise e
-
-    def publish(self) -> None:
-        pass
+            self._handle_delete_exception(resource_type, e)
+            raise
+
+    def _handle_delete_exception(
+        self, resource_type: str, exception: OpenMLServerException
+    ) -> None:
+        # https://github.com/openml/OpenML/blob/21f6188d08ac24fcd2df06ab94cf421c946971b0/openml_OS/views/pages/api_new/v1/xml/pre.php
+        # Most exceptions are descriptive enough to be raised as their standard
+        # OpenMLServerException, however there are two cases where we add information:
+        #  - a generic "failed" message, we direct them to the right issue board
+        #  - when the user successfully authenticates with the server,
+        #    but user is not allowed to take the requested action,
+        #    in which case we specify a OpenMLNotAuthorizedError.
+        by_other_user = [323, 353, 393, 453, 594]
+        has_dependent_entities = [324, 326, 327, 328, 354, 454, 464, 595]
+        unknown_reason = [325, 355, 394, 455, 593]
+        if exception.code in by_other_user:
+            raise OpenMLNotAuthorizedError(
+                message=(
+                    f"The {resource_type} can not be deleted because it was not uploaded by you."
+                ),
+            ) from exception
+        if exception.code in has_dependent_entities:
+            raise OpenMLNotAuthorizedError(
+                message=(
+                    f"The {resource_type} can not be deleted because "
+                    f"it still has associated entities: {exception.message}"
+                ),
+            ) from exception
+        if exception.code in unknown_reason:
+            raise OpenMLServerError(
+                message=(
+                    f"The {resource_type} can not be deleted for unknown reason,"
+                    " please open an issue at: https://github.com/openml/openml/issues/new"
+                ),
+            ) from exception
+        raise exception
+
+    def _extract_id_from_upload(self, parsed: Mapping[str, Any]) -> int:
+        # reads id from
+        # sample parsed dict: {"oml:openml": {"oml:upload_flow": {"oml:id": "42"}}}
+
+        # xmltodict always gives exactly one root key
+        ((_, root_value),) = parsed.items()
+
+        if not isinstance(root_value, Mapping):
+            raise ValueError("Unexpected XML structure")
+
+        # upload node (e.g. oml:upload_task, oml:study_upload, ...)
+        ((_, upload_value),) = root_value.items()
+
+        if not isinstance(upload_value, Mapping):
+            raise ValueError("Unexpected upload node structure")
+
+        # ID is the only leaf value
+        for v in upload_value.values():
+            if isinstance(v, (str, int)):
+                return int(v)
+
+        raise ValueError("No ID found in upload response")
 
 
 class ResourceV2(ResourceAPI):
     api_version: APIVersion = APIVersion.V2
 
-    def delete(self, resource_id: int) -> bool:
+    def publish(self, path: str, files: Mapping[str, Any] | None) -> int:
         raise NotImplementedError(self._get_not_implemented_message("publish"))
 
-    def publish(self) -> None:
-        raise NotImplementedError(self._get_not_implemented_message("publish"))
+    def delete(self, resource_id: int) -> bool:
+        raise NotImplementedError(self._get_not_implemented_message("delete"))

From 54a3151932e3c50bda983f6d6609a4740e38a0c7 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Tue, 27 Jan 2026 14:17:40 +0500
Subject: [PATCH 23/34] implement tag/untag

---
 openml/_api/clients/http.py            | 10 +++-
 openml/_api/resources/base/base.py     |  6 +++
 openml/_api/resources/base/versions.py | 63 ++++++++++++++++++++------
 openml/_api/resources/tasks.py         |  4 +-
 4 files changed, 67 insertions(+), 16 deletions(-)

diff --git a/openml/_api/clients/http.py b/openml/_api/clients/http.py
index 1622087c9..65d7b2248 100644
--- a/openml/_api/clients/http.py
+++ b/openml/_api/clients/http.py
@@ -279,6 +279,7 @@ def _request(  # noqa: PLR0913
         method: str,
         url: str,
         params: Mapping[str, Any],
+        data: Mapping[str, Any],
         headers: Mapping[str, str],
         timeout: float | int,
         files: Mapping[str, Any] | None,
@@ -292,6 +293,7 @@ def _request(  # noqa: PLR0913
                 method=method,
                 url=url,
                 params=params,
+                data=data,
                 headers=headers,
                 timeout=timeout,
                 files=files,
@@ -326,11 +328,16 @@ def request(
         url = urljoin(self.server, urljoin(self.base_url, path))
         retries = max(1, self.retries)
 
-        # prepare params
         params = request_kwargs.pop("params", {}).copy()
+        data = request_kwargs.pop("data", {}).copy()
+
         if use_api_key:
             params["api_key"] = self.api_key
 
+        if method.upper() in {"POST", "PUT", "PATCH"}:
+            data = {**params, **data}
+            params = {}
+
         # prepare headers
         headers = request_kwargs.pop("headers", {}).copy()
         headers.update(self.headers)
@@ -352,6 +359,7 @@ def request(
                 method=method,
                 url=url,
                 params=params,
+                data=data,
                 headers=headers,
                 timeout=timeout,
                 files=files,
diff --git a/openml/_api/resources/base/base.py b/openml/_api/resources/base/base.py
index f2d7d1e88..63d4c40eb 100644
--- a/openml/_api/resources/base/base.py
+++ b/openml/_api/resources/base/base.py
@@ -43,6 +43,12 @@ def delete(self, resource_id: int) -> bool: ...
     @abstractmethod
     def publish(self, path: str, files: Mapping[str, Any] | None) -> int: ...
 
+    @abstractmethod
+    def tag(self, resource_id: int, tag: str) -> list[str]: ...
+
+    @abstractmethod
+    def untag(self, resource_id: int, tag: str) -> list[str]: ...
+
     def _get_not_implemented_message(self, method_name: str | None = None) -> str:
         version = getattr(self.api_version, "name", "Unknown version")
         resource = getattr(self.resource_type, "name", "Unknown resource")
diff --git a/openml/_api/resources/base/versions.py b/openml/_api/resources/base/versions.py
index 41f883ebe..91c1a8c06 100644
--- a/openml/_api/resources/base/versions.py
+++ b/openml/_api/resources/base/versions.py
@@ -22,19 +22,9 @@ def publish(self, path: str, files: Mapping[str, Any] | None) -> int:
         return self._extract_id_from_upload(parsed_response)
 
     def delete(self, resource_id: int) -> bool:
-        if self.resource_type == ResourceType.DATASET:
-            resource_type = "data"
-        else:
-            resource_type = self.resource_type.name
-
-        legal_resources = {
-            "data",
-            "flow",
-            "task",
-            "run",
-            "study",
-            "user",
-        }
+        resource_type = self._get_endpoint_name()
+
+        legal_resources = {"data", "flow", "task", "run", "study", "user"}
         if resource_type not in legal_resources:
             raise ValueError(f"Can't delete a {resource_type}")
 
@@ -47,6 +37,47 @@ def delete(self, resource_id: int) -> bool:
             self._handle_delete_exception(resource_type, e)
             raise
 
+    def tag(self, resource_id: int, tag: str) -> list[str]:
+        resource_type = self._get_endpoint_name()
+
+        legal_resources = {"data", "task", "flow", "setup", "run"}
+        if resource_type not in legal_resources:
+            raise ValueError(f"Can't tag a {resource_type}")
+
+        path = f"{resource_type}/tag"
+        data = {f"{resource_type}_id": resource_id, "tag": tag}
+        response = self._http.post(path, data=data)
+
+        main_tag = f"oml:{resource_type}_tag"
+        parsed_response = xmltodict.parse(response.content, force_list={"oml:tag"})
+        result = parsed_response[main_tag]
+        tags: list[str] = result.get("oml:tag", [])
+
+        return tags
+
+    def untag(self, resource_id: int, tag: str) -> list[str]:
+        resource_type = self._get_endpoint_name()
+
+        legal_resources = {"data", "task", "flow", "setup", "run"}
+        if resource_type not in legal_resources:
+            raise ValueError(f"Can't tag a {resource_type}")
+
+        path = f"{resource_type}/untag"
+        data = {f"{resource_type}_id": resource_id, "tag": tag}
+        response = self._http.post(path, data=data)
+
+        main_tag = f"oml:{resource_type}_untag"
+        parsed_response = xmltodict.parse(response.content, force_list={"oml:tag"})
+        result = parsed_response[main_tag]
+        tags: list[str] = result.get("oml:tag", [])
+
+        return tags
+
+    def _get_endpoint_name(self) -> str:
+        if self.resource_type == ResourceType.DATASET:
+            return "data"
+        return self.resource_type.name
+
     def _handle_delete_exception(
         self, resource_type: str, exception: OpenMLServerException
     ) -> None:
@@ -114,3 +145,9 @@ def publish(self, path: str, files: Mapping[str, Any] | None) -> int:
 
     def delete(self, resource_id: int) -> bool:
         raise NotImplementedError(self._get_not_implemented_message("delete"))
+
+    def tag(self, resource_id: int, tag: str) -> list[str]:
+        raise NotImplementedError(self._get_not_implemented_message("untag"))
+
+    def untag(self, resource_id: int, tag: str) -> list[str]:
+        raise NotImplementedError(self._get_not_implemented_message("untag"))
diff --git a/openml/_api/resources/tasks.py b/openml/_api/resources/tasks.py
index a7ca39208..295e7a73d 100644
--- a/openml/_api/resources/tasks.py
+++ b/openml/_api/resources/tasks.py
@@ -26,7 +26,7 @@ def get(
         return_response: bool = False,
     ) -> OpenMLTask | tuple[OpenMLTask, Response]:
         path = f"task/{task_id}"
-        response = self._http.get(path)
+        response = self._http.get(path, use_cache=True)
         xml_content = response.text
         task = self._create_task_from_xml(xml_content)
 
@@ -125,4 +125,4 @@ def get(
         *,
         return_response: bool = False,
     ) -> OpenMLTask | tuple[OpenMLTask, Response]:
-        raise NotImplementedError
+        raise NotImplementedError(self._get_not_implemented_message("get"))

From 2b6fe6507b349703060f060f0184169abf5e20de Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Tue, 27 Jan 2026 18:31:39 +0500
Subject: [PATCH 24/34] implement fallback

---
 openml/_api/resources/__init__.py      |  3 +-
 openml/_api/resources/base/__init__.py |  2 +
 openml/_api/resources/base/fallback.py | 56 ++++++++++++++++++++++++++
 openml/_api/runtime/core.py            |  8 +++-
 openml/_api/runtime/fallback.py        | 12 ------
 5 files changed, 66 insertions(+), 15 deletions(-)
 create mode 100644 openml/_api/resources/base/fallback.py
 delete mode 100644 openml/_api/runtime/fallback.py

diff --git a/openml/_api/resources/__init__.py b/openml/_api/resources/__init__.py
index b1af3c1a8..6c0807e0f 100644
--- a/openml/_api/resources/__init__.py
+++ b/openml/_api/resources/__init__.py
@@ -1,4 +1,5 @@
+from openml._api.resources.base.fallback import FallbackProxy
 from openml._api.resources.datasets import DatasetsV1, DatasetsV2
 from openml._api.resources.tasks import TasksV1, TasksV2
 
-__all__ = ["DatasetsV1", "DatasetsV2", "TasksV1", "TasksV2"]
+__all__ = ["DatasetsV1", "DatasetsV2", "FallbackProxy", "TasksV1", "TasksV2"]
diff --git a/openml/_api/resources/base/__init__.py b/openml/_api/resources/base/__init__.py
index 851cfe942..bddc09b21 100644
--- a/openml/_api/resources/base/__init__.py
+++ b/openml/_api/resources/base/__init__.py
@@ -1,10 +1,12 @@
 from openml._api.resources.base.base import APIVersion, ResourceAPI, ResourceType
+from openml._api.resources.base.fallback import FallbackProxy
 from openml._api.resources.base.resources import DatasetsAPI, TasksAPI
 from openml._api.resources.base.versions import ResourceV1, ResourceV2
 
 __all__ = [
     "APIVersion",
     "DatasetsAPI",
+    "FallbackProxy",
     "ResourceAPI",
     "ResourceType",
     "ResourceV1",
diff --git a/openml/_api/resources/base/fallback.py b/openml/_api/resources/base/fallback.py
new file mode 100644
index 000000000..253ee3865
--- /dev/null
+++ b/openml/_api/resources/base/fallback.py
@@ -0,0 +1,56 @@
+from __future__ import annotations
+
+from collections.abc import Callable
+from typing import Any
+
+
+class FallbackProxy:
+    def __init__(self, *api_versions: Any):
+        if not api_versions:
+            raise ValueError("At least one API version must be provided")
+        self._apis = api_versions
+
+    def __getattr__(self, name: str) -> Any:
+        api, attr = self._find_attr(name)
+        if callable(attr):
+            return self._wrap_callable(name, api, attr)
+        return attr
+
+    def _find_attr(self, name: str) -> tuple[Any, Any]:
+        for api in self._apis:
+            attr = getattr(api, name, None)
+            if attr is not None:
+                return api, attr
+        raise AttributeError(f"{self.__class__.__name__} has no attribute {name}")
+
+    def _wrap_callable(
+        self,
+        name: str,
+        primary_api: Any,
+        primary_attr: Callable[..., Any],
+    ) -> Callable[..., Any]:
+        def wrapper(*args: Any, **kwargs: Any) -> Any:
+            try:
+                return primary_attr(*args, **kwargs)
+            except NotImplementedError:
+                return self._call_fallbacks(name, primary_api, *args, **kwargs)
+
+        return wrapper
+
+    def _call_fallbacks(
+        self,
+        name: str,
+        skip_api: Any,
+        *args: Any,
+        **kwargs: Any,
+    ) -> Any:
+        for api in self._apis:
+            if api is skip_api:
+                continue
+            attr = getattr(api, name, None)
+            if callable(attr):
+                try:
+                    return attr(*args, **kwargs)
+                except NotImplementedError:
+                    continue
+        raise NotImplementedError(f"Could not fallback to any API for method: {name}")
diff --git a/openml/_api/runtime/core.py b/openml/_api/runtime/core.py
index 25f2649ee..4914179f8 100644
--- a/openml/_api/runtime/core.py
+++ b/openml/_api/runtime/core.py
@@ -8,6 +8,7 @@
 from openml._api.resources import (
     DatasetsV1,
     DatasetsV2,
+    FallbackProxy,
     TasksV1,
     TasksV2,
 )
@@ -17,7 +18,7 @@
 
 
 class APIBackend:
-    def __init__(self, *, datasets: DatasetsAPI, tasks: TasksAPI):
+    def __init__(self, *, datasets: DatasetsAPI | FallbackProxy, tasks: TasksAPI | FallbackProxy):
         self.datasets = datasets
         self.tasks = tasks
 
@@ -62,7 +63,10 @@ def build_backend(version: str, *, strict: bool) -> APIBackend:
     if strict:
         return v2
 
-    return v1
+    return APIBackend(
+        datasets=FallbackProxy(DatasetsV2(v2_http_client), DatasetsV1(v1_http_client)),
+        tasks=FallbackProxy(TasksV2(v2_http_client), TasksV1(v1_http_client)),
+    )
 
 
 class APIContext:
diff --git a/openml/_api/runtime/fallback.py b/openml/_api/runtime/fallback.py
deleted file mode 100644
index 1bc99d270..000000000
--- a/openml/_api/runtime/fallback.py
+++ /dev/null
@@ -1,12 +0,0 @@
-from __future__ import annotations
-
-from typing import TYPE_CHECKING
-
-if TYPE_CHECKING:
-    from openml._api.resources.base import ResourceAPI
-
-
-class FallbackProxy:
-    def __init__(self, primary: ResourceAPI, fallback: ResourceAPI):
-        self._primary = primary
-        self._fallback = fallback

From 685c19a39ccccc113fdc6f1ff0a43de6f0475f34 Mon Sep 17 00:00:00 2001
From: Omswastik-11 <omswastikpanda11@gmail.com>
Date: Tue, 27 Jan 2026 20:31:11 +0530
Subject: [PATCH 25/34] added tests

Signed-off-by: Omswastik-11 <omswastikpanda11@gmail.com>
---
 openml/_api/clients/http.py             |  11 +-
 openml/_api/resources/base/resources.py |   2 +-
 openml/_api/resources/flows.py          |  56 +-----
 openml/base.py                          |  12 +-
 openml/flows/functions.py               |   4 +-
 tests/test_flows/test_flow_migration.py | 247 ++++++++----------------
 6 files changed, 103 insertions(+), 229 deletions(-)

diff --git a/openml/_api/clients/http.py b/openml/_api/clients/http.py
index dc184074d..9ef10740a 100644
--- a/openml/_api/clients/http.py
+++ b/openml/_api/clients/http.py
@@ -151,9 +151,14 @@ def _parse_exception_response(
         if "json" in content_type:
             server_exception = response.json()
             server_error = server_exception["detail"]
-            code = server_error.get("code")
-            message = server_error.get("message")
-            additional_information = server_error.get("additional_information")
+            if isinstance(server_error, dict):
+                code = server_error.get("code")
+                message = server_error.get("message")
+                additional_information = server_error.get("additional_information")
+            else:
+                code = None
+                message = str(server_error)
+                additional_information = None
         else:
             server_exception = xmltodict.parse(response.text)
             server_error = server_exception["oml:error"]
diff --git a/openml/_api/resources/base/resources.py b/openml/_api/resources/base/resources.py
index 403396926..339905d33 100644
--- a/openml/_api/resources/base/resources.py
+++ b/openml/_api/resources/base/resources.py
@@ -54,7 +54,7 @@ def list(
     ) -> pd.DataFrame: ...
 
     @abstractmethod
-    def create(self, flow: OpenMLFlow) -> OpenMLFlow | tuple[OpenMLFlow, Response]: ...
+    def publish(self, flow: OpenMLFlow) -> OpenMLFlow | tuple[OpenMLFlow, Response]: ...  # type: ignore[override]
 
     @abstractmethod
     def delete(self, flow_id: int) -> bool: ...
diff --git a/openml/_api/resources/flows.py b/openml/_api/resources/flows.py
index f70bc58be..a300bf312 100644
--- a/openml/_api/resources/flows.py
+++ b/openml/_api/resources/flows.py
@@ -3,11 +3,10 @@
 from typing import Any
 
 import pandas as pd
-import requests
 import xmltodict
 
 from openml._api.resources.base import FlowsAPI
-from openml.exceptions import OpenMLServerException
+from openml.exceptions import OpenMLServerError, OpenMLServerException
 from openml.flows.flow import OpenMLFlow
 
 
@@ -55,17 +54,7 @@ def exists(self, name: str, external_version: str) -> int | bool:
             raise ValueError("Argument 'version' should be a non-empty string")
 
         data = {"name": name, "external_version": external_version, "api_key": self._http.api_key}
-        # Avoid duplicating base_url when server already contains the API path
-        server = self._http.server
-        base = self._http.base_url
-        if base and base.strip("/") in server:
-            url = server.rstrip("/") + "/flow/exists"
-            response = requests.post(
-                url, data=data, headers=self._http.headers, timeout=self._http.timeout
-            )
-            xml_response = response.text
-        else:
-            xml_response = self._http.post("flow/exists", data=data).text
+        xml_response = self._http.post("flow/exists", data=data).text
         result_dict = xmltodict.parse(xml_response)
         # Detect error payloads and raise
         if "oml:error" in result_dict:
@@ -116,20 +105,8 @@ def list(
         if uploader is not None:
             api_call += f"/uploader/{uploader}"
 
-        server = self._http.server
-        base = self._http.base_url
-        if base and base.strip("/") in server:
-            url = server.rstrip("/") + "/" + api_call
-            response = requests.get(
-                url,
-                headers=self._http.headers,
-                params={"api_key": self._http.api_key},
-                timeout=self._http.timeout,
-            )
-            xml_string = response.text
-        else:
-            response = self._http.get(api_call, use_api_key=True)
-            xml_string = response.text
+        response = self._http.get(api_call, use_api_key=True)
+        xml_string = response.text
         flows_dict = xmltodict.parse(xml_string, force_list=("oml:flow",))
 
         if "oml:error" in flows_dict:
@@ -158,7 +135,7 @@ def list(
 
         return pd.DataFrame.from_dict(flows, orient="index")
 
-    def create(self, flow: OpenMLFlow) -> OpenMLFlow:
+    def publish(self, flow: OpenMLFlow) -> OpenMLFlow:  # type: ignore[override]
         """Create a new flow on the OpenML server.
 
         under development , not fully functional yet
@@ -187,16 +164,7 @@ def create(self, flow: OpenMLFlow) -> OpenMLFlow:
         # POST to server (multipart/files). Ensure api_key is sent in the form data.
         files = file_elements
         data = {"api_key": self._http.api_key}
-        # If server already contains base path, post directly with requests to avoid double base_url
-        server = self._http.server
-        base = self._http.base_url
-        if base and base.strip("/") in server:
-            url = server.rstrip("/") + "/flow"
-            response = requests.post(
-                url, files=files, data=data, headers=self._http.headers, timeout=self._http.timeout
-            )
-        else:
-            response = self._http.post("flow", files=files, data=data)
+        response = self._http.post("flow", files=files, data=data)
 
         parsed = xmltodict.parse(response.text)
         if "oml:error" in parsed:
@@ -222,9 +190,6 @@ def delete(self, flow_id: int) -> bool:
         self._http.delete(f"flow/{flow_id}")
         return True
 
-    def publish(self) -> None:
-        pass
-
 
 class FlowsV2(FlowsAPI):
     def get(
@@ -277,8 +242,8 @@ def exists(self, name: str, external_version: str) -> int | bool:
             result = response.json()
             flow_id: int | bool = result.get("flow_id", False)
             return flow_id
-        except (requests.exceptions.HTTPError, KeyError):
-            # v2 returns 404 when flow doesn't exist
+        except (OpenMLServerError, KeyError):
+            # v2 returns 404 when flow doesn't exist, which raises OpenMLServerError
             return False
 
     def list(
@@ -291,15 +256,12 @@ def list(
     ) -> pd.DataFrame:
         raise NotImplementedError("flows (list) not yet implemented in v2 server")
 
-    def create(self, flow: OpenMLFlow) -> OpenMLFlow:
+    def publish(self, flow: OpenMLFlow) -> OpenMLFlow:  # type: ignore[override]
         raise NotImplementedError("POST /flows (create) not yet implemented in v2 server")
 
     def delete(self, flow_id: int) -> bool:
         raise NotImplementedError("DELETE /flows/{id} not yet implemented in v2 server")
 
-    def publish(self) -> None:
-        raise NotImplementedError("publish not implemented in v2 server")
-
     @staticmethod
     def _convert_v2_to_v1_format(v2_json: dict[str, Any]) -> dict[str, dict]:
         """Convert v2 JSON response to v1 XML-dict format for OpenMLFlow._from_dict().
diff --git a/openml/base.py b/openml/base.py
index b7a4877c1..2d97e77e1 100644
--- a/openml/base.py
+++ b/openml/base.py
@@ -128,15 +128,15 @@ def publish(self) -> OpenMLBase:
         """Publish the object on the OpenML server."""
         from openml._api import api_context
 
-        # 1. Resolve the correct resource manager (e.g., Flows, Runs)
         resource_manager = api_context.backend.get_resource_for_entity(self)
 
-        # 2. Delegate creation to the backend (Handles V1/V2 switching internally)
-        # The backend returns the updated entity (with ID) or the ID itself.
-        published_entity = resource_manager.create(self)  # type: ignore
+        published_entity = resource_manager.publish(self)  # type: ignore
 
-        # 3. Update self with ID if not already done (V2 response handling)
-        if self.id is None and published_entity.id is not None:
+        if (
+            published_entity is not None
+            and hasattr(published_entity, "id")
+            and published_entity.id is not None
+        ):
             self.id = published_entity.id  # type: ignore
 
         return self
diff --git a/openml/flows/functions.py b/openml/flows/functions.py
index 28a3ffaa9..6ed1a4031 100644
--- a/openml/flows/functions.py
+++ b/openml/flows/functions.py
@@ -69,7 +69,7 @@ def _get_cached_flow(fid: int) -> OpenMLFlow:
         raise OpenMLCacheException(f"Flow file for fid {fid} not cached") from e
 
 
-@openml.utils.thread_safe_if_oslo_installed
+# @openml.utils.thread_safe_if_oslo_installed
 def get_flow(flow_id: int, reinstantiate: bool = False, strict_version: bool = True) -> OpenMLFlow:  # noqa: FBT002
     """Download the OpenML flow for a given flow ID.
 
@@ -192,7 +192,7 @@ def flow_exists(name: str, external_version: str) -> int | bool:
     """
     if not (isinstance(name, str) and len(name) > 0):
         raise ValueError("Argument 'name' should be a non-empty string")
-    if not (isinstance(name, str) and len(external_version) > 0):
+    if not (isinstance(external_version, str) and len(external_version) > 0):
         raise ValueError("Argument 'version' should be a non-empty string")
 
     from openml._api import api_context
diff --git a/tests/test_flows/test_flow_migration.py b/tests/test_flows/test_flow_migration.py
index cc1b98f1d..c15ee3832 100644
--- a/tests/test_flows/test_flow_migration.py
+++ b/tests/test_flows/test_flow_migration.py
@@ -9,204 +9,111 @@
 import requests
 
 import openml
+from openml._api import api_context
 from openml.exceptions import OpenMLCacheException
 from openml.flows import OpenMLFlow
 from openml.flows import functions as flow_functions
 
 
-@pytest.fixture()
-def dummy_flow() -> OpenMLFlow:
-    return OpenMLFlow(
-        name="TestFlow",
-        description="test",
-        model=None,
-        components=OrderedDict(),
-        parameters=OrderedDict(),
-        parameters_meta_info=OrderedDict(),
-        external_version="1",
-        tags=[],
-        language="English",
-        dependencies="",
-        class_name="x",
-    )
+@pytest.fixture(scope="function")
+def reset_api_to_v1() -> None:
+    """Fixture to ensure API is set to V1 for each test."""
+    api_context.set_version("v1", strict=False)
+    yield
+    api_context.set_version("v1", strict=False)
 
 
-def test_flow_exists_delegates_to_backend(monkeypatch):
-    from openml._api import api_context
+@pytest.fixture(scope="function")
+def api_v2() -> None:
+    """Fixture to set API to V2 for tests."""
+    api_context.set_version("v2", strict=True)
+    yield
+    api_context.set_version("v1", strict=False)
 
-    calls: dict[str, Any] = {}
 
-    def fake_exists(name: str, external_version: str) -> int:
-        calls["args"] = (name, external_version)
-        return 42
+def test_list_flow_v1(reset_api_to_v1) -> None:
+    """Test listing flows using V1 API."""
+    flows_df = flow_functions.list_flows()
+    assert isinstance(flows_df, pd.DataFrame)
+    assert not flows_df.empty
 
-    monkeypatch.setattr(api_context.backend.flows, "exists", fake_exists)
 
-    result = openml.flows.flow_exists(name="foo", external_version="v1")
+def test_flow_exists_v1(reset_api_to_v1) -> None:
+    """Test flow_exists() using V1 API."""
+    # Known existing flow
+    name = "weka.OneR"
+    external_version = "Weka_3.9.0_10153"
 
-    assert result == 42
-    assert calls["args"] == ("foo", "v1")
+    exists = flow_functions.flow_exists(name, external_version)
+    assert exists != False
 
+    # Known non-existing flow
+    name = "non.existing.Flow"
+    external_version = "0.0.1"
 
-def test_list_flows_delegates_to_backend(monkeypatch):
-    from openml._api import api_context
+    exists = flow_functions.flow_exists(name, external_version)
+    assert exists is False
 
-    calls: list[tuple[int, int, str | None, str | None]] = []
-    df = pd.DataFrame({
-        "id": [1, 2],
-        "full_name": ["a", "b"],
-        "name": ["a", "b"],
-        "version": ["1", "1"],
-        "external_version": ["v1", "v1"],
-        "uploader": ["u", "u"],
-    }).set_index("id")
 
-    def fake_list(limit: int | None, offset: int | None, tag: str | None, uploader: str | None):
-        calls.append((limit or 0, offset or 0, tag, uploader))
-        return df
+def test_get_flows_v1(reset_api_to_v1) -> None:
+    """Test get() method returns a valid OpenMLFlow object using V1 API."""
+    # Get the flow with ID 2 (weka.OneR)
+    flow_id = 2
+    flow = flow_functions.get_flow(flow_id)
 
-    monkeypatch.setattr(api_context.backend.flows, "list", fake_list)
-    result = openml.flows.list_flows(offset=0, size=5, tag="t", uploader="u")
-
-    assert result.equals(df)
-    # _list_all passes batch_size as limit; expect one call
-    assert calls == [(5, 0, "t", "u")]
-
-
-def test_get_flow_description_fetches_on_cache_miss(monkeypatch, tmp_path, dummy_flow):
-    from openml._api import api_context
-
-    # Force cache miss
-    def raise_cache(_fid: int) -> None:
-        raise OpenMLCacheException("no cache")
-
-    monkeypatch.setattr(flow_functions, "_get_cached_flow", raise_cache)
-
-    def fake_get(flow_id: int):
-        return dummy_flow
-
-    monkeypatch.setattr(api_context.backend.flows, "get", fake_get)
-
-    flow = flow_functions._get_flow_description(123)
-
-    assert flow is dummy_flow
-
-
-def test_delete_flow_delegates_to_backend(monkeypatch):
-    from openml._api import api_context
-
-    calls: dict[str, Any] = {}
-
-    def fake_delete(flow_id: int) -> None:
-        calls["flow_id"] = flow_id
-
-    monkeypatch.setattr(api_context.backend.flows, "delete", fake_delete)
-
-    result = openml.flows.delete_flow(flow_id=999)
-
-    assert result is True
-    assert calls["flow_id"] == 999
-
-
-def test_v2_flow_exists_found(monkeypatch):
-    """Test FlowsV2.exists() when flow is found."""
-    from openml._api.resources.flows import FlowsV2
-    from openml._api.http.client import HTTPClient
-    from openml._api.config import settings
-
-    http_client = HTTPClient(settings.api.v2)
-    flows_v2 = FlowsV2(http_client)
-
-    # Mock HTTP response
-    mock_response = requests.Response()
-    mock_response.status_code = 200
-    mock_response._content = b'{"flow_id": 123}'
-
-    def fake_get(path: str):
-        assert path == "flows/exists/weka.ZeroR/Weka_3.9.0/"
-        return mock_response
-
-    monkeypatch.setattr(http_client, "get", fake_get)
-
-    result = flows_v2.exists("weka.ZeroR", "Weka_3.9.0")
-
-    assert result == 123
-
-
-def test_v2_flow_exists_not_found(monkeypatch):
-    """Test FlowsV2.exists() when flow is not found (404)."""
-    from openml._api.resources.flows import FlowsV2
-    from openml._api.http.client import HTTPClient
-    from openml._api.config import settings
-
-    http_client = HTTPClient(settings.api.v2)
-    flows_v2 = FlowsV2(http_client)
-
-    def fake_get(path: str):
-        raise requests.exceptions.HTTPError("404 Not Found")
-
-    monkeypatch.setattr(http_client, "get", fake_get)
+    assert isinstance(flow, OpenMLFlow)
+    assert flow.flow_id == flow_id
+    assert isinstance(flow.name, str)
+    assert len(flow.name) > 0
+    assert isinstance(flow.external_version, str)
 
-    result = flows_v2.exists("nonexistent.Flow", "v1.0.0")
 
-    assert result is False
+def test_flow_publish_v1(reset_api_to_v1) -> None:
+    """Test publishing a flow using V1 API."""
+    from openml_sklearn.extension import SklearnExtension
+    from sklearn.tree import DecisionTreeClassifier
 
+    clf = DecisionTreeClassifier()
+    extension = SklearnExtension()
+    dt_flow = extension.model_to_flow(clf)
 
-def test_v2_flow_get(monkeypatch, dummy_flow):
-    """Test FlowsV2.get() converts v2 JSON to OpenMLFlow."""
-    from openml._api.resources.flows import FlowsV2
-    from openml._api.http.client import HTTPClient
-    from openml._api.config import settings
+    # Publish the flow
+    published_flow = dt_flow.publish()
 
-    http_client = HTTPClient(settings.api.v2)
-    flows_v2 = FlowsV2(http_client)
+    # Verify the published flow has an ID
+    assert isinstance(published_flow, OpenMLFlow)
+    assert getattr(published_flow, "id", None) is not None
 
-    # Mock v2 JSON response
-    v2_json = {
-        "id": 1,
-        "uploader": 16,
-        "name": "weka.ZeroR",
-        "class_name": "weka.classifiers.rules.ZeroR",
-        "version": 1,
-        "external_version": "Weka_3.9.0_12024",
-        "description": "Weka implementation of ZeroR",
-        "upload_date": "2017-03-24T14:26:38",
-        "language": "English",
-        "dependencies": "Weka_3.9.0",
-        "parameter": [
-            {
-                "name": "batch-size",
-                "data_type": "option",
-                "default_value": 100,
-                "description": "Batch size for processing",
-            }
-        ],
-        "subflows": [],
-        "tag": ["weka", "OpenmlWeka"],
-    }
 
-    mock_response = requests.Response()
-    mock_response.status_code = 200
-    mock_response._content = b'{}'
+def test_get_flows_v2(api_v2) -> None:
+    """Test get() method returns a valid OpenMLFlow object using V2 API."""
+    # Get the flow with ID 2 (weka.OneR)
+    flow_id = 2
 
-    def fake_json():
-        return v2_json
+    # Now get the full flow details
+    flow = flow_functions.get_flow(flow_id)
 
-    mock_response.json = fake_json
+    # Verify it's an OpenMLFlow with expected attributes
+    assert isinstance(flow, OpenMLFlow)
+    assert flow.flow_id == flow_id
+    assert isinstance(flow.name, str)
+    assert len(flow.name) > 0
+    assert isinstance(flow.external_version, str)
 
-    def fake_get(path: str):
-        assert path == "flows/1/"
-        return mock_response
 
-    monkeypatch.setattr(http_client, "get", fake_get)
+def test_flow_exists_v2(api_v2) -> None:
+    """Test flow_exists() using V2 API."""
+    # Known existing flow
+    name = "weka.OneR"
+    external_version = "Weka_3.9.0_10153"
 
-    flow = flows_v2.get(1)
+    exists = flow_functions.flow_exists(name, external_version)
+    assert exists != False
 
-    assert isinstance(flow, OpenMLFlow)
-    assert flow.flow_id == 1
-    assert flow.name == "weka.ZeroR"
-    assert flow.external_version == "Weka_3.9.0_12024"
-    assert flow.uploader == "16"
-    assert len(flow.parameters) == 1
-    assert "batch-size" in flow.parameters
+    # Known non-existing flow
+    name = "non.existing.Flow"
+    external_version = "0.0.1"
 
+    exists = flow_functions.flow_exists(name, external_version)
+    assert exists == False
+    
\ No newline at end of file

From fa53f8d3e10dabde3634c05a97d67560459bcaa6 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Wed, 28 Jan 2026 13:50:42 +0500
Subject: [PATCH 26/34] add test_http.py

---
 openml/testing.py           |  88 +++++++++++++++++++++++
 tests/test_api/test_http.py | 134 ++++++++++++++++++++++++++++++++++++
 2 files changed, 222 insertions(+)
 create mode 100644 tests/test_api/test_http.py

diff --git a/openml/testing.py b/openml/testing.py
index 8d3bbbd5b..b0aaac9be 100644
--- a/openml/testing.py
+++ b/openml/testing.py
@@ -11,10 +11,13 @@
 import unittest
 from pathlib import Path
 from typing import ClassVar
+from urllib.parse import urljoin
 
 import requests
 
 import openml
+from openml._api.clients import HTTPCache, HTTPClient
+from openml._api.config import RetryPolicy
 from openml.exceptions import OpenMLServerException
 from openml.tasks import TaskType
 
@@ -276,6 +279,91 @@ def _check_fold_timing_evaluations(  # noqa: PLR0913
                         assert evaluation <= max_val
 
 
+class TestAPIBase(unittest.TestCase):
+    server: str
+    base_url: str
+    api_key: str
+    timeout: int
+    retries: int
+    retry_policy: RetryPolicy
+    dir: str
+    ttl: int
+    cache: HTTPCache
+    http_client: HTTPClient
+
+    def setUp(self) -> None:
+        self.server = "https://test.openml.org/"
+        self.base_url = "api/v1/xml"
+        self.api_key = "normaluser"
+        self.timeout = 10
+        self.retries = 3
+        self.retry_policy = RetryPolicy.HUMAN
+        self.dir = "test_cache"
+        self.ttl = 60 * 60 * 24 * 7
+
+        self.cache = self._get_http_cache(
+            path=Path(self.dir),
+            ttl=self.ttl,
+        )
+        self.http_client = self._get_http_client(
+            server=self.server,
+            base_url=self.base_url,
+            api_key=self.api_key,
+            timeout=self.timeout,
+            retries=self.retries,
+            retry_policy=self.retry_policy,
+            cache=self.cache,
+        )
+
+        if self.cache.path.exists():
+            shutil.rmtree(self.cache.path)
+
+    def tearDown(self) -> None:
+        if self.cache.path.exists():
+            shutil.rmtree(self.cache.path)
+
+    def _get_http_cache(
+        self,
+        path: Path,
+        ttl: int,
+    ) -> HTTPCache:
+        return HTTPCache(
+            path=path,
+            ttl=ttl,
+        )
+
+    def _get_http_client(  # noqa: PLR0913
+        self,
+        server: str,
+        base_url: str,
+        api_key: str,
+        timeout: int,
+        retries: int,
+        retry_policy: RetryPolicy,
+        cache: HTTPCache | None = None,
+    ) -> HTTPClient:
+        return HTTPClient(
+            server=server,
+            base_url=base_url,
+            api_key=api_key,
+            timeout=timeout,
+            retries=retries,
+            retry_policy=retry_policy,
+            cache=cache,
+        )
+
+    def _get_url(
+        self,
+        server: str | None = None,
+        base_url: str | None = None,
+        path: str | None = None,
+    ) -> str:
+        server = server if server else self.server
+        base_url = base_url if base_url else self.base_url
+        path = path if path else ""
+        return urljoin(self.server, urljoin(self.base_url, path))
+
+
 def check_task_existence(
     task_type: TaskType,
     dataset_id: int,
diff --git a/tests/test_api/test_http.py b/tests/test_api/test_http.py
new file mode 100644
index 000000000..98b6fda5a
--- /dev/null
+++ b/tests/test_api/test_http.py
@@ -0,0 +1,134 @@
+from requests import Response, Request
+import time
+import xmltodict
+from openml.testing import TestAPIBase
+
+
+class TestHTTPClient(TestAPIBase):
+    def test_cache(self):
+        url = self._get_url(path="task/31")
+        params = {"param1": "value1", "param2": "value2"}
+
+        key = self.cache.get_key(url, params)
+
+        # validate key
+        self.assertEqual(
+            key,
+            "org/openml/test/api/v1/task/31/param1=value1&param2=value2",
+        )
+
+        # create fake response
+        req = Request("GET", url).prepare()
+        response = Response()
+        response.status_code = 200
+        response.url = url
+        response.reason = "OK"
+        response._content = b"<xml>test</xml>"
+        response.headers = {"Content-Type": "text/xml"}
+        response.encoding = "utf-8"
+        response.request = req
+        response.elapsed = type("Elapsed", (), {"total_seconds": lambda self: 0.1})()
+
+        # save to cache
+        self.cache.save(key, response)
+
+        # load from cache
+        cached_response = self.cache.load(key)
+
+        # validate loaded response
+        self.assertEqual(cached_response.status_code, 200)
+        self.assertEqual(cached_response.url, url)
+        self.assertEqual(cached_response.content, b"<xml>test</xml>")
+        self.assertEqual(
+            cached_response.headers["Content-Type"], "text/xml"
+        )
+
+    def test_get(self):
+        response = self.http_client.get("task/1")
+
+        self.assertEqual(response.status_code, 200)
+        self.assertIn(b"<oml:task", response.content)
+
+    def test_get_with_cache_creates_cache(self):
+        response = self.http_client.get("task/1", use_cache=True)
+
+        self.assertEqual(response.status_code, 200)
+        self.assertTrue(self.cache.path.exists())
+
+        # verify cache directory structure exists
+        cache_key = self.cache.get_key(
+            self._get_url(path="task/1"),
+            {},
+        )
+        cache_path = self.cache._key_to_path(cache_key)
+
+        self.assertTrue((cache_path / "meta.json").exists())
+        self.assertTrue((cache_path / "headers.json").exists())
+        self.assertTrue((cache_path / "body.bin").exists())
+
+    def test_get_uses_cached_response(self):
+        # first request populates cache
+        response1 = self.http_client.get("task/1", use_cache=True)
+
+        # second request should load from cache
+        response2 = self.http_client.get("task/1", use_cache=True)
+
+        self.assertEqual(response1.content, response2.content)
+        self.assertEqual(response1.status_code, response2.status_code)
+
+    def test_get_cache_expires(self):
+        # force short TTL
+        self.cache.ttl = 1
+        path = "task/1"
+
+        url = self._get_url(path=path)
+        key = self.cache.get_key(url, {})
+        cache_path = self.cache._key_to_path(key) / "meta.json"
+
+        response1 = self.http_client.get(path, use_cache=True)
+        response1_cache_time_stamp = cache_path.stat().st_ctime
+
+        time.sleep(2)
+
+        response2 = self.http_client.get(path, use_cache=True)
+        response2_cache_time_stamp = cache_path.stat().st_ctime
+
+        # cache expired -> new request
+        self.assertNotEqual(response1_cache_time_stamp, response2_cache_time_stamp)
+        self.assertEqual(response2.status_code, 200)
+        self.assertEqual(response1.content, response2.content)
+
+    def test_post_and_delete(self):
+        task_xml = """
+        <oml:task_inputs xmlns:oml="http://openml.org/openml">
+            <oml:task_type_id>5</oml:task_type_id>
+            <oml:input name="source_data">193</oml:input>
+            <oml:input name="estimation_procedure">17</oml:input>
+        </oml:task_inputs>
+        """
+
+        task_id = None
+        try:
+            # POST the task
+            post_response = self.http_client.post(
+                "task",
+                files={"description": task_xml},
+            )
+            self.assertEqual(post_response.status_code, 200)
+            xml_resp = xmltodict.parse(post_response.content)
+            task_id = int(xml_resp["oml:upload_task"]["oml:id"])
+
+            # GET the task to verify it exists
+            get_response = self.http_client.get(f"task/{task_id}")
+            self.assertEqual(get_response.status_code, 200)
+
+        finally:
+            # DELETE the task if it was created
+            if task_id is not None:
+                try:
+                    del_response = self.http_client.delete(f"task/{task_id}")
+                    # optional: verify delete
+                    if del_response.status_code != 200:
+                        print(f"Warning: delete failed for task {task_id}")
+                except Exception as e:
+                    print(f"Warning: failed to delete task {task_id}: {e}")

From 2b2db962fc252a2b2b23f21bd1d055905ed74588 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Wed, 28 Jan 2026 13:52:43 +0500
Subject: [PATCH 27/34] add uses_test_server marker

---
 tests/test_api/test_http.py | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/tests/test_api/test_http.py b/tests/test_api/test_http.py
index 98b6fda5a..94ce5ee93 100644
--- a/tests/test_api/test_http.py
+++ b/tests/test_api/test_http.py
@@ -1,6 +1,7 @@
 from requests import Response, Request
 import time
 import xmltodict
+import pytest
 from openml.testing import TestAPIBase
 
 
@@ -43,12 +44,14 @@ def test_cache(self):
             cached_response.headers["Content-Type"], "text/xml"
         )
 
+    @pytest.mark.uses_test_server()
     def test_get(self):
         response = self.http_client.get("task/1")
 
         self.assertEqual(response.status_code, 200)
         self.assertIn(b"<oml:task", response.content)
 
+    @pytest.mark.uses_test_server()
     def test_get_with_cache_creates_cache(self):
         response = self.http_client.get("task/1", use_cache=True)
 
@@ -66,6 +69,7 @@ def test_get_with_cache_creates_cache(self):
         self.assertTrue((cache_path / "headers.json").exists())
         self.assertTrue((cache_path / "body.bin").exists())
 
+    @pytest.mark.uses_test_server()
     def test_get_uses_cached_response(self):
         # first request populates cache
         response1 = self.http_client.get("task/1", use_cache=True)
@@ -76,6 +80,7 @@ def test_get_uses_cached_response(self):
         self.assertEqual(response1.content, response2.content)
         self.assertEqual(response1.status_code, response2.status_code)
 
+    @pytest.mark.uses_test_server()
     def test_get_cache_expires(self):
         # force short TTL
         self.cache.ttl = 1
@@ -98,6 +103,7 @@ def test_get_cache_expires(self):
         self.assertEqual(response2.status_code, 200)
         self.assertEqual(response1.content, response2.content)
 
+    @pytest.mark.uses_test_server()
     def test_post_and_delete(self):
         task_xml = """
         <oml:task_inputs xmlns:oml="http://openml.org/openml">

From c9617f932fce853dbe6db9a445ef98cc6cfec7f4 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Thu, 29 Jan 2026 14:40:09 +0500
Subject: [PATCH 28/34] implement reset_cache

---
 openml/_api/clients/http.py |  6 +++++-
 tests/test_api/test_http.py | 18 ++++++++++++++++++
 2 files changed, 23 insertions(+), 1 deletion(-)

diff --git a/openml/_api/clients/http.py b/openml/_api/clients/http.py
index 65d7b2248..dfcdf5a8a 100644
--- a/openml/_api/clients/http.py
+++ b/openml/_api/clients/http.py
@@ -322,6 +322,7 @@ def request(
         path: str,
         *,
         use_cache: bool = False,
+        reset_cache: bool = False,
         use_api_key: bool = False,
         **request_kwargs: Any,
     ) -> Response:
@@ -345,7 +346,7 @@ def request(
         timeout = request_kwargs.pop("timeout", self.timeout)
         files = request_kwargs.pop("files", None)
 
-        if use_cache and self.cache is not None:
+        if use_cache and not reset_cache and self.cache is not None:
             cache_key = self.cache.get_key(url, params)
             try:
                 return self.cache.load(cache_key)
@@ -379,6 +380,7 @@ def request(
         assert response is not None
 
         if use_cache and self.cache is not None:
+            cache_key = self.cache.get_key(url, params)
             self.cache.save(cache_key, response)
 
         return response
@@ -388,6 +390,7 @@ def get(
         path: str,
         *,
         use_cache: bool = False,
+        reset_cache: bool = False,
         use_api_key: bool = False,
         **request_kwargs: Any,
     ) -> Response:
@@ -395,6 +398,7 @@ def get(
             method="GET",
             path=path,
             use_cache=use_cache,
+            reset_cache=reset_cache,
             use_api_key=use_api_key,
             **request_kwargs,
         )
diff --git a/tests/test_api/test_http.py b/tests/test_api/test_http.py
index 94ce5ee93..808321862 100644
--- a/tests/test_api/test_http.py
+++ b/tests/test_api/test_http.py
@@ -103,6 +103,24 @@ def test_get_cache_expires(self):
         self.assertEqual(response2.status_code, 200)
         self.assertEqual(response1.content, response2.content)
 
+    @pytest.mark.uses_test_server()
+    def test_get_reset_cache(self):
+        path = "task/1"
+
+        url = self._get_url(path=path)
+        key = self.cache.get_key(url, {})
+        cache_path = self.cache._key_to_path(key) / "meta.json"
+
+        response1 = self.http_client.get(path, use_cache=True)
+        response1_cache_time_stamp = cache_path.stat().st_ctime
+
+        response2 = self.http_client.get(path, use_cache=True, reset_cache=True)
+        response2_cache_time_stamp = cache_path.stat().st_ctime
+
+        self.assertNotEqual(response1_cache_time_stamp, response2_cache_time_stamp)
+        self.assertEqual(response2.status_code, 200)
+        self.assertEqual(response1.content, response2.content)
+
     @pytest.mark.uses_test_server()
     def test_post_and_delete(self):
         task_xml = """

From 443ade99bc35112ce6e110eecd5249026b77c1e7 Mon Sep 17 00:00:00 2001
From: Omswastik-11 <omswastikpanda11@gmail.com>
Date: Thu, 29 Jan 2026 18:28:03 +0530
Subject: [PATCH 29/34] tests:added tests for migration

Signed-off-by: Omswastik-11 <omswastikpanda11@gmail.com>
---
 tests/test_flows/test_flow_migration.py  | 119 ---------
 tests/test_flows/test_flows_migration.py | 306 +++++++++++++++++++++++
 2 files changed, 306 insertions(+), 119 deletions(-)
 delete mode 100644 tests/test_flows/test_flow_migration.py
 create mode 100644 tests/test_flows/test_flows_migration.py

diff --git a/tests/test_flows/test_flow_migration.py b/tests/test_flows/test_flow_migration.py
deleted file mode 100644
index c15ee3832..000000000
--- a/tests/test_flows/test_flow_migration.py
+++ /dev/null
@@ -1,119 +0,0 @@
-# License: BSD 3-Clause
-from __future__ import annotations
-
-from collections import OrderedDict
-from typing import Any
-
-import pandas as pd
-import pytest
-import requests
-
-import openml
-from openml._api import api_context
-from openml.exceptions import OpenMLCacheException
-from openml.flows import OpenMLFlow
-from openml.flows import functions as flow_functions
-
-
-@pytest.fixture(scope="function")
-def reset_api_to_v1() -> None:
-    """Fixture to ensure API is set to V1 for each test."""
-    api_context.set_version("v1", strict=False)
-    yield
-    api_context.set_version("v1", strict=False)
-
-
-@pytest.fixture(scope="function")
-def api_v2() -> None:
-    """Fixture to set API to V2 for tests."""
-    api_context.set_version("v2", strict=True)
-    yield
-    api_context.set_version("v1", strict=False)
-
-
-def test_list_flow_v1(reset_api_to_v1) -> None:
-    """Test listing flows using V1 API."""
-    flows_df = flow_functions.list_flows()
-    assert isinstance(flows_df, pd.DataFrame)
-    assert not flows_df.empty
-
-
-def test_flow_exists_v1(reset_api_to_v1) -> None:
-    """Test flow_exists() using V1 API."""
-    # Known existing flow
-    name = "weka.OneR"
-    external_version = "Weka_3.9.0_10153"
-
-    exists = flow_functions.flow_exists(name, external_version)
-    assert exists != False
-
-    # Known non-existing flow
-    name = "non.existing.Flow"
-    external_version = "0.0.1"
-
-    exists = flow_functions.flow_exists(name, external_version)
-    assert exists is False
-
-
-def test_get_flows_v1(reset_api_to_v1) -> None:
-    """Test get() method returns a valid OpenMLFlow object using V1 API."""
-    # Get the flow with ID 2 (weka.OneR)
-    flow_id = 2
-    flow = flow_functions.get_flow(flow_id)
-
-    assert isinstance(flow, OpenMLFlow)
-    assert flow.flow_id == flow_id
-    assert isinstance(flow.name, str)
-    assert len(flow.name) > 0
-    assert isinstance(flow.external_version, str)
-
-
-def test_flow_publish_v1(reset_api_to_v1) -> None:
-    """Test publishing a flow using V1 API."""
-    from openml_sklearn.extension import SklearnExtension
-    from sklearn.tree import DecisionTreeClassifier
-
-    clf = DecisionTreeClassifier()
-    extension = SklearnExtension()
-    dt_flow = extension.model_to_flow(clf)
-
-    # Publish the flow
-    published_flow = dt_flow.publish()
-
-    # Verify the published flow has an ID
-    assert isinstance(published_flow, OpenMLFlow)
-    assert getattr(published_flow, "id", None) is not None
-
-
-def test_get_flows_v2(api_v2) -> None:
-    """Test get() method returns a valid OpenMLFlow object using V2 API."""
-    # Get the flow with ID 2 (weka.OneR)
-    flow_id = 2
-
-    # Now get the full flow details
-    flow = flow_functions.get_flow(flow_id)
-
-    # Verify it's an OpenMLFlow with expected attributes
-    assert isinstance(flow, OpenMLFlow)
-    assert flow.flow_id == flow_id
-    assert isinstance(flow.name, str)
-    assert len(flow.name) > 0
-    assert isinstance(flow.external_version, str)
-
-
-def test_flow_exists_v2(api_v2) -> None:
-    """Test flow_exists() using V2 API."""
-    # Known existing flow
-    name = "weka.OneR"
-    external_version = "Weka_3.9.0_10153"
-
-    exists = flow_functions.flow_exists(name, external_version)
-    assert exists != False
-
-    # Known non-existing flow
-    name = "non.existing.Flow"
-    external_version = "0.0.1"
-
-    exists = flow_functions.flow_exists(name, external_version)
-    assert exists == False
-    
\ No newline at end of file
diff --git a/tests/test_flows/test_flows_migration.py b/tests/test_flows/test_flows_migration.py
new file mode 100644
index 000000000..823cc3d2a
--- /dev/null
+++ b/tests/test_flows/test_flows_migration.py
@@ -0,0 +1,306 @@
+# License: BSD 3-Clause
+"""Tests for Flow V1 → V2 API Migration."""
+from __future__ import annotations
+
+import pytest
+
+from openml._api.resources import FallbackProxy, FlowsV1, FlowsV2
+from openml.flows.flow import OpenMLFlow
+from openml.testing import TestAPIBase
+
+
+class TestFlowsV1(TestAPIBase):
+    """Test FlowsV1 resource implementation."""
+
+    def setUp(self):
+        super().setUp()
+        self.resource = FlowsV1(self.http_client)
+
+    @pytest.mark.uses_test_server()
+    def test_get(self):
+        """Test getting a flow from the V1 API."""
+        flow = self.resource.get(flow_id=1)
+        
+        assert isinstance(flow, OpenMLFlow)
+        assert flow.flow_id == 1
+        assert isinstance(flow.name, str)
+        assert len(flow.name) > 0
+
+    @pytest.mark.uses_test_server()
+    def test_exists(self):
+        """Test checking if a flow exists using V1 API."""
+        flow = self.resource.get(flow_id=1)
+        
+        result = self.resource.exists(
+            name=flow.name,
+            external_version=flow.external_version
+        )
+        
+        assert isinstance(result, int)
+        assert result > 0
+        assert result == flow.flow_id
+
+    @pytest.mark.uses_test_server()
+    def test_exists_nonexistent(self):
+        """Test checking if a non-existent flow exists using V1 API."""
+        result = self.resource.exists(
+            name="NonExistentFlowName123456789",
+            external_version="0.0.0.nonexistent"
+        )
+        
+        assert result is False
+
+    @pytest.mark.uses_test_server()
+    def test_list(self):
+        """Test listing flows from the V1 API."""
+        flows_df = self.resource.list(limit=10)
+        
+        assert len(flows_df) > 0
+        assert len(flows_df) <= 10
+        assert "id" in flows_df.columns
+        assert "name" in flows_df.columns
+        assert "version" in flows_df.columns
+        assert "external_version" in flows_df.columns
+        assert "full_name" in flows_df.columns
+        assert "uploader" in flows_df.columns
+
+    @pytest.mark.uses_test_server()
+    def test_list_with_offset(self):
+        """Test listing flows with offset from the V1 API."""
+        flows_df = self.resource.list(limit=5, offset=10)
+        
+        assert len(flows_df) > 0
+        assert len(flows_df) <= 5
+
+    @pytest.mark.uses_test_server()
+    def test_list_with_tag_limit_offset(self):
+        """Test listing flows with filters from the V1 API."""
+        flows_df = self.resource.list(tag="weka", limit=5 , offset=0 , uploader=16)
+        
+        assert hasattr(flows_df, 'columns')
+        if len(flows_df) > 0:
+            assert "id" in flows_df.columns
+    
+    @pytest.mark.uses_test_server()
+    def test_publish(self):
+        """Test publishing a sklearn flow using V1 API."""
+        from openml_sklearn.extension import SklearnExtension
+        from sklearn.tree import ExtraTreeRegressor
+        clf = ExtraTreeRegressor()
+        extension = SklearnExtension()
+        dt_flow = extension.model_to_flow(clf)
+        published_flow = self.resource.publish(dt_flow)
+        assert isinstance(published_flow, OpenMLFlow)
+        assert getattr(published_flow, "id", None) is not None
+    
+    @pytest.mark.uses_test_server()
+    def test_delete(self):
+        """Test deleting a flow using V1 API."""
+        from openml_sklearn.extension import SklearnExtension
+        from sklearn.tree import ExtraTreeRegressor
+        clf = ExtraTreeRegressor()
+        extension = SklearnExtension()
+        dt_flow = extension.model_to_flow(clf)
+        flow_id = self.resource.exists(
+            name=dt_flow.name,
+            external_version=dt_flow.external_version
+        )
+        result = self.resource.delete(flow_id)
+        assert result is True
+        exists = self.resource.exists(
+            name=dt_flow.name,
+            external_version=dt_flow.external_version
+        )
+        assert exists is False
+
+
+
+class TestFlowsV2(TestAPIBase):
+    """Test FlowsV2 resource implementation."""
+
+    def setUp(self):
+        super().setUp()
+        self.v2_http_client = self._get_http_client(
+            server="http://127.0.0.1:8001/",
+            base_url="", 
+            api_key=self.api_key,
+            timeout=self.timeout,
+            retries=self.retries,
+            retry_policy=self.retry_policy,
+            cache=self.cache,
+        )
+        self.resource = FlowsV2(self.v2_http_client)
+
+    # @pytest.mark.skip(reason="V2 API not yet deployed on test server")
+    @pytest.mark.uses_test_server()
+    def test_get(self):
+        """Test getting a flow from the V2 API."""
+        flow = self.resource.get(flow_id=1)
+        
+        assert isinstance(flow, OpenMLFlow)
+        assert flow.flow_id == 1
+        assert isinstance(flow.name, str)
+        assert len(flow.name) > 0
+
+    # @pytest.mark.skip(reason="V2 API not yet deployed on test server")
+    @pytest.mark.uses_test_server()
+    def test_exists(self):
+        """Test checking if a flow exists using V2 API."""
+        flow = self.resource.get(flow_id=1)
+        
+        result = self.resource.exists(
+            name=flow.name,
+            external_version=flow.external_version
+        )
+        
+        # V2 may return int or bool
+        assert result is not False
+        if isinstance(result, int):
+            assert result > 0
+
+    # @pytest.mark.skip(reason="V2 API not yet deployed on test server")
+    @pytest.mark.uses_test_server()
+    def test_exists_nonexistent(self):
+        """Test checking if a non-existent flow exists using V2 API."""
+        result = self.resource.exists(
+            name="NonExistentFlowName123456789",
+            external_version="0.0.0.nonexistent"
+        )
+        
+        assert result is False
+
+    def test_list_not_implemented(self):
+        """Test that list raises NotImplementedError for V2."""
+        with pytest.raises(NotImplementedError):
+            self.resource.list(limit=10)
+
+    def test_publish_not_implemented(self):
+        """Test that publish raises NotImplementedError for V2."""
+        from collections import OrderedDict
+        
+        with pytest.raises(NotImplementedError):
+            flow = OpenMLFlow(
+                name="test",
+                description="test",
+                model=None,
+                components=OrderedDict(),
+                parameters=OrderedDict(),
+                parameters_meta_info=OrderedDict(),
+                external_version="1.0",
+                tags=[],
+                language="English",
+                dependencies=None,
+            )
+            self.resource.publish(flow)
+
+    def test_delete_not_implemented(self):
+        """Test that delete raises NotImplementedError for V2."""
+        with pytest.raises(NotImplementedError):
+            self.resource.delete(flow_id=1)
+
+
+class TestFlowsCombined(TestAPIBase):
+    """Test combined functionality and fallback between V1 and V2."""
+
+    def setUp(self):
+        super().setUp()
+        # Set up V1 client
+        self.v1_http_client = self._get_http_client(
+            server=self.server,
+            base_url="api/v1/xml",
+            api_key=self.api_key,
+            timeout=self.timeout,
+            retries=self.retries,
+            retry_policy=self.retry_policy,
+            cache=self.cache,
+        )
+        # Set up V2 client
+        self.v2_http_client = self._get_http_client(
+            server="http://127.0.0.1:8001/",
+            base_url="",
+            api_key=self.api_key,
+            timeout=self.timeout,
+            retries=self.retries,
+            retry_policy=self.retry_policy,
+            cache=self.cache,
+        )
+        
+        self.resource_v1 = FlowsV1(self.v1_http_client)
+        self.resource_v2 = FlowsV2(self.v2_http_client)
+        self.resource_fallback = FallbackProxy(self.resource_v2, self.resource_v1)
+
+    # @pytest.mark.skip(reason="V2 API not yet deployed on test server")
+    @pytest.mark.uses_test_server()
+    def test_get_matches(self):
+        """Test that V1 and V2 get methods return matching flow data."""
+        flow_id = 1
+        
+        flow_v1 = self.resource_v1.get(flow_id=flow_id)
+        flow_v2 = self.resource_v2.get(flow_id=flow_id)
+        
+        # Check that the core attributes match
+        assert flow_v1.flow_id == flow_v2.flow_id
+        assert flow_v1.name == flow_v2.name
+        assert flow_v1.version == flow_v2.version
+        assert flow_v1.external_version == flow_v2.external_version
+        assert flow_v1.description == flow_v2.description
+
+    # @pytest.mark.skip(reason="V2 API not yet deployed on test server")
+    @pytest.mark.uses_test_server()
+    def test_exists_matches(self):
+        """Test that V1 and V2 exists methods return consistent results."""
+        # Get a known flow
+        flow_v1 = self.resource_v1.get(flow_id=1)
+        
+        result_v1 = self.resource_v1.exists(
+            name=flow_v1.name,
+            external_version=flow_v1.external_version
+        )
+        result_v2 = self.resource_v2.exists(
+            name=flow_v1.name,
+            external_version=flow_v1.external_version
+        )
+        
+        assert result_v1 is not False
+        assert result_v2 is not False
+        
+        if isinstance(result_v1, int) and isinstance(result_v2, int):
+            assert result_v1 == result_v2
+
+    # @pytest.mark.skip(reason="V2 API not yet deployed on test server - fallback would work but tries V2 first")
+    @pytest.mark.uses_test_server()
+    def test_fallback_get(self):
+        """Test that fallback proxy can get flows."""
+        flow = self.resource_fallback.get(flow_id=1)
+        
+        assert isinstance(flow, OpenMLFlow)
+        assert flow.flow_id == 1
+
+    # @pytest.mark.skip(reason="V2 API not yet deployed on test server - fallback would work but tries V2 first")
+    @pytest.mark.uses_test_server()
+    def test_fallback_exists(self):
+        """Test that fallback proxy can check flow existence."""
+        flow = self.resource_fallback.get(flow_id=1)
+        
+        result = self.resource_fallback.exists(
+            name=flow.name,
+            external_version=flow.external_version
+        )
+        
+        assert result is not False
+
+    @pytest.mark.uses_test_server()
+    def test_fallback_list_falls_back_to_v1(self):
+        """Test that fallback proxy falls back to V1 for list method."""
+
+        flows_df = self.resource_fallback.list(limit=10)
+        
+        assert len(flows_df) > 0
+        assert len(flows_df) <= 10
+        assert "id" in flows_df.columns
+
+    def test_fallback_raises_when_all_not_implemented(self):
+        """Test that fallback proxy raises NotImplementedError when all APIs raise it."""
+        # Both V2 and a hypothetical V1 that doesn't support something should raise
+        # For now, we can't easily test this without mocking, but document the behavior
+        pass

From 468087d4cfaaea6e24e2a2d822872d4134d0cfc9 Mon Sep 17 00:00:00 2001
From: Omswastik-11 <omswastikpanda11@gmail.com>
Date: Thu, 29 Jan 2026 18:32:18 +0530
Subject: [PATCH 30/34] tests:added tests for migration

Signed-off-by: Omswastik-11 <omswastikpanda11@gmail.com>
---
 tests/test_flows/test_flows_migration.py | 33 ------------------------
 1 file changed, 33 deletions(-)

diff --git a/tests/test_flows/test_flows_migration.py b/tests/test_flows/test_flows_migration.py
index 823cc3d2a..1636e6180 100644
--- a/tests/test_flows/test_flows_migration.py
+++ b/tests/test_flows/test_flows_migration.py
@@ -169,34 +169,6 @@ def test_exists_nonexistent(self):
         
         assert result is False
 
-    def test_list_not_implemented(self):
-        """Test that list raises NotImplementedError for V2."""
-        with pytest.raises(NotImplementedError):
-            self.resource.list(limit=10)
-
-    def test_publish_not_implemented(self):
-        """Test that publish raises NotImplementedError for V2."""
-        from collections import OrderedDict
-        
-        with pytest.raises(NotImplementedError):
-            flow = OpenMLFlow(
-                name="test",
-                description="test",
-                model=None,
-                components=OrderedDict(),
-                parameters=OrderedDict(),
-                parameters_meta_info=OrderedDict(),
-                external_version="1.0",
-                tags=[],
-                language="English",
-                dependencies=None,
-            )
-            self.resource.publish(flow)
-
-    def test_delete_not_implemented(self):
-        """Test that delete raises NotImplementedError for V2."""
-        with pytest.raises(NotImplementedError):
-            self.resource.delete(flow_id=1)
 
 
 class TestFlowsCombined(TestAPIBase):
@@ -299,8 +271,3 @@ def test_fallback_list_falls_back_to_v1(self):
         assert len(flows_df) <= 10
         assert "id" in flows_df.columns
 
-    def test_fallback_raises_when_all_not_implemented(self):
-        """Test that fallback proxy raises NotImplementedError when all APIs raise it."""
-        # Both V2 and a hypothetical V1 that doesn't support something should raise
-        # For now, we can't easily test this without mocking, but document the behavior
-        pass

From 5bc37b80abc86e89644e431f48ca2d4d4ad7814c Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Thu, 29 Jan 2026 22:02:38 +0500
Subject: [PATCH 31/34] fixes with publish/delete

---
 openml/_api/resources/base/versions.py | 22 ++++++-------
 tests/test_api/test_http.py            |  9 ++----
 tests/test_api/test_versions.py        | 44 ++++++++++++++++++++++++++
 3 files changed, 57 insertions(+), 18 deletions(-)
 create mode 100644 tests/test_api/test_versions.py

diff --git a/openml/_api/resources/base/versions.py b/openml/_api/resources/base/versions.py
index 91c1a8c06..6ca2dd345 100644
--- a/openml/_api/resources/base/versions.py
+++ b/openml/_api/resources/base/versions.py
@@ -1,7 +1,7 @@
 from __future__ import annotations
 
 from collections.abc import Mapping
-from typing import Any
+from typing import Any, cast
 
 import xmltodict
 
@@ -76,7 +76,7 @@ def untag(self, resource_id: int, tag: str) -> list[str]:
     def _get_endpoint_name(self) -> str:
         if self.resource_type == ResourceType.DATASET:
             return "data"
-        return self.resource_type.name
+        return cast("str", self.resource_type.value)
 
     def _handle_delete_exception(
         self, resource_type: str, exception: OpenMLServerException
@@ -114,8 +114,8 @@ def _handle_delete_exception(
         raise exception
 
     def _extract_id_from_upload(self, parsed: Mapping[str, Any]) -> int:
-        # reads id from
-        # sample parsed dict: {"oml:openml": {"oml:upload_flow": {"oml:id": "42"}}}
+        # reads id from upload response
+        # actual parsed dict: {"oml:upload_flow": {"@xmlns:oml": "...", "oml:id": "42"}}
 
         # xmltodict always gives exactly one root key
         ((_, root_value),) = parsed.items()
@@ -123,14 +123,14 @@ def _extract_id_from_upload(self, parsed: Mapping[str, Any]) -> int:
         if not isinstance(root_value, Mapping):
             raise ValueError("Unexpected XML structure")
 
-        # upload node (e.g. oml:upload_task, oml:study_upload, ...)
-        ((_, upload_value),) = root_value.items()
+        # Look for oml:id directly in the root value
+        if "oml:id" in root_value:
+            id_value = root_value["oml:id"]
+            if isinstance(id_value, (str, int)):
+                return int(id_value)
 
-        if not isinstance(upload_value, Mapping):
-            raise ValueError("Unexpected upload node structure")
-
-        # ID is the only leaf value
-        for v in upload_value.values():
+        # Fallback: check all values for numeric/string IDs
+        for v in root_value.values():
             if isinstance(v, (str, int)):
                 return int(v)
 
diff --git a/tests/test_api/test_http.py b/tests/test_api/test_http.py
index 808321862..c16759558 100644
--- a/tests/test_api/test_http.py
+++ b/tests/test_api/test_http.py
@@ -149,10 +149,5 @@ def test_post_and_delete(self):
         finally:
             # DELETE the task if it was created
             if task_id is not None:
-                try:
-                    del_response = self.http_client.delete(f"task/{task_id}")
-                    # optional: verify delete
-                    if del_response.status_code != 200:
-                        print(f"Warning: delete failed for task {task_id}")
-                except Exception as e:
-                    print(f"Warning: failed to delete task {task_id}: {e}")
+                del_response = self.http_client.delete(f"task/{task_id}")
+                self.assertEqual(del_response.status_code, 200)
diff --git a/tests/test_api/test_versions.py b/tests/test_api/test_versions.py
new file mode 100644
index 000000000..d3b1cd45d
--- /dev/null
+++ b/tests/test_api/test_versions.py
@@ -0,0 +1,44 @@
+import pytest
+from openml.testing import TestAPIBase
+from openml._api.resources.base.versions import ResourceV1
+from openml._api.resources.base.resources import ResourceType
+
+
+class TestResourceV1(TestAPIBase):
+    def setUp(self):
+        super().setUp()
+        self.resource = ResourceV1(self.http_client)
+        self.resource.resource_type = ResourceType.TASK
+
+    @pytest.mark.uses_test_server()
+    def test_publish_and_delete(self):
+        task_xml = """
+        <oml:task_inputs xmlns:oml="http://openml.org/openml">
+            <oml:task_type_id>5</oml:task_type_id>
+            <oml:input name="source_data">193</oml:input>
+            <oml:input name="estimation_procedure">17</oml:input>
+        </oml:task_inputs>
+        """
+
+        task_id = None
+        try:
+            # Publish the task
+            task_id = self.resource.publish(
+                "task",
+                files={"description": task_xml},
+            )
+
+            # Get the task to verify it exists
+            get_response = self.http_client.get(f"task/{task_id}")
+            self.assertEqual(get_response.status_code, 200)
+
+        finally:
+            # delete the task if it was created
+            if task_id is not None:
+                success = self.resource.delete(task_id)
+                self.assertTrue(success)
+
+
+    @pytest.mark.uses_test_server()
+    def test_tag_and_untag(self):
+        pass

From 08d991686843fc2ff5d8182e96a162bc2e706f52 Mon Sep 17 00:00:00 2001
From: geetu040 <raoarmaghanshakir040@gmail.com>
Date: Thu, 29 Jan 2026 22:05:24 +0500
Subject: [PATCH 32/34] fix cache_key in tests

---
 tests/test_api/test_http.py | 16 ++++++++++++----
 1 file changed, 12 insertions(+), 4 deletions(-)

diff --git a/tests/test_api/test_http.py b/tests/test_api/test_http.py
index c16759558..efaeaeeef 100644
--- a/tests/test_api/test_http.py
+++ b/tests/test_api/test_http.py
@@ -3,6 +3,7 @@
 import xmltodict
 import pytest
 from openml.testing import TestAPIBase
+import os
 
 
 class TestHTTPClient(TestAPIBase):
@@ -11,12 +12,19 @@ def test_cache(self):
         params = {"param1": "value1", "param2": "value2"}
 
         key = self.cache.get_key(url, params)
+        expected_key = os.path.join(
+            "org",
+            "openml",
+            "test",
+            "api",
+            "v1",
+            "task",
+            "31",
+            "param1=value1&param2=value2",
+        )
 
         # validate key
-        self.assertEqual(
-            key,
-            "org/openml/test/api/v1/task/31/param1=value1&param2=value2",
-        )
+        self.assertEqual(key, expected_key)
 
         # create fake response
         req = Request("GET", url).prepare()

From 9660e78ff19b2553b453e09f0ea9c8e7b1bec586 Mon Sep 17 00:00:00 2001
From: Omswastik-11 <omswastikpanda11@gmail.com>
Date: Fri, 30 Jan 2026 10:31:18 +0530
Subject: [PATCH 33/34] tests:added tests for migration

Signed-off-by: Omswastik-11 <omswastikpanda11@gmail.com>
---
 openml/_api/resources/base/resources.py  |  6 ---
 openml/_api/resources/flows.py           | 48 ++++---------------
 openml/_api/runtime/core.py              | 22 +--------
 openml/base.py                           | 23 ++++-----
 openml/flows/flow.py                     | 11 +++--
 tests/test_flows/test_flows_migration.py | 60 ++++++++++++++++++------
 6 files changed, 77 insertions(+), 93 deletions(-)

diff --git a/openml/_api/resources/base/resources.py b/openml/_api/resources/base/resources.py
index e1e2c6377..e83173f9d 100644
--- a/openml/_api/resources/base/resources.py
+++ b/openml/_api/resources/base/resources.py
@@ -54,9 +54,3 @@ def list(
         tag: str | None = None,
         uploader: str | None = None,
     ) -> pd.DataFrame: ...
-
-    @abstractmethod
-    def publish(self, flow: OpenMLFlow) -> OpenMLFlow | tuple[OpenMLFlow, Response]: ...  # type: ignore[override]
-
-    @abstractmethod
-    def delete(self, flow_id: int) -> bool: ...
diff --git a/openml/_api/resources/flows.py b/openml/_api/resources/flows.py
index 54ce26591..4ea7ffcfd 100644
--- a/openml/_api/resources/flows.py
+++ b/openml/_api/resources/flows.py
@@ -1,5 +1,6 @@
 from __future__ import annotations
 
+from collections.abc import Mapping
 from typing import Any
 
 import pandas as pd
@@ -135,49 +136,21 @@ def list(
 
         return pd.DataFrame.from_dict(flows, orient="index")
 
-    def publish(self, flow: OpenMLFlow) -> OpenMLFlow:  # type: ignore[override]
-        """Create a new flow on the OpenML server.
-
-        under development , not fully functional yet
+    def publish(self, path: str | None = None, files: Mapping[str, Any] | None = None) -> int:
+        """Publish a flow on the OpenML server.
 
         Parameters
         ----------
-        flow : OpenMLFlow
-            The flow object to upload to the server.
+        files : Mapping[str, Any] | None
+            Files to upload (including description).
 
         Returns
         -------
-        OpenMLFlow
-            The updated flow object with the server-assigned flow_id.
+        int
+            The server-assigned flow id.
         """
-        from openml.extensions import Extension
-
-        # Check if flow is an OpenMLFlow or a compatible extension object
-        if not isinstance(flow, OpenMLFlow) and not isinstance(flow, Extension):
-            raise TypeError(f"Flow must be an OpenMLFlow or Extension instance, got {type(flow)}")
-
-        # Get file elements for upload (includes XML description if not provided)
-        file_elements = flow._get_file_elements()
-        if "description" not in file_elements:
-            file_elements["description"] = flow._to_xml()
-
-        # POST to server (multipart/files). Ensure api_key is sent in the form data.
-        files = file_elements
-        data = {"api_key": self._http.api_key}
-        response = self._http.post("flow", files=files, data=data)
-
-        parsed = xmltodict.parse(response.text)
-        if "oml:error" in parsed:
-            err = parsed["oml:error"]
-            code = int(err.get("oml:code", 0)) if "oml:code" in err else None
-            message = err.get("oml:message", "Server returned an error")
-            raise OpenMLServerException(message=message, code=code)
-
-        # Parse response and update flow with server-assigned ID
-        xml_response = xmltodict.parse(response.text)
-        flow._parse_publish_response(xml_response)
-
-        return flow
+        path = "flow"
+        return super().publish(path, files)
 
     def delete(self, flow_id: int) -> bool:
         """Delete a flow from the OpenML server.
@@ -187,8 +160,7 @@ def delete(self, flow_id: int) -> bool:
         flow_id : int
             The ID of the flow to delete.
         """
-        self._http.delete(f"flow/{flow_id}")
-        return True
+        return super().delete(flow_id)
 
 
 class FlowsV2(ResourceV2, FlowsAPI):
diff --git a/openml/_api/runtime/core.py b/openml/_api/runtime/core.py
index f1087371a..43fd63b70 100644
--- a/openml/_api/runtime/core.py
+++ b/openml/_api/runtime/core.py
@@ -16,8 +16,7 @@
 )
 
 if TYPE_CHECKING:
-    from openml._api.resources.base import DatasetsAPI, FlowsAPI, ResourceAPI, TasksAPI
-    from openml.base import OpenMLBase
+    from openml._api.resources.base import DatasetsAPI, FlowsAPI, TasksAPI
 
 
 class APIBackend:
@@ -32,25 +31,6 @@ def __init__(
         self.tasks = tasks
         self.flows = flows
 
-    def get_resource_for_entity(self, entity: OpenMLBase) -> ResourceAPI:
-        from openml.datasets.dataset import OpenMLDataset
-        from openml.flows.flow import OpenMLFlow
-        from openml.runs.run import OpenMLRun
-        from openml.study.study import OpenMLStudy
-        from openml.tasks.task import OpenMLTask
-
-        if isinstance(entity, OpenMLFlow):
-            return self.flows  # type: ignore
-        if isinstance(entity, OpenMLRun):
-            return self.runs  # type: ignore
-        if isinstance(entity, OpenMLDataset):
-            return self.datasets  # type: ignore
-        if isinstance(entity, OpenMLTask):
-            return self.tasks  # type: ignore
-        if isinstance(entity, OpenMLStudy):
-            return self.studies  # type: ignore
-        raise ValueError(f"No resource manager available for entity type {type(entity)}")
-
 
 def build_backend(version: str, *, strict: bool) -> APIBackend:
     http_cache = HTTPCache(
diff --git a/openml/base.py b/openml/base.py
index 2d97e77e1..a282be8eb 100644
--- a/openml/base.py
+++ b/openml/base.py
@@ -11,7 +11,7 @@
 import openml._api_calls
 import openml.config
 
-from .utils import _tag_openml_base
+from .utils import _get_rest_api_type_alias, _tag_openml_base
 
 
 class OpenMLBase(ABC):
@@ -126,19 +126,20 @@ def _parse_publish_response(self, xml_response: dict[str, str]) -> None:
 
     def publish(self) -> OpenMLBase:
         """Publish the object on the OpenML server."""
-        from openml._api import api_context
+        file_elements = self._get_file_elements()
 
-        resource_manager = api_context.backend.get_resource_for_entity(self)
+        if "description" not in file_elements:
+            file_elements["description"] = self._to_xml()
 
-        published_entity = resource_manager.publish(self)  # type: ignore
-
-        if (
-            published_entity is not None
-            and hasattr(published_entity, "id")
-            and published_entity.id is not None
-        ):
-            self.id = published_entity.id  # type: ignore
+        call = f"{_get_rest_api_type_alias(self)}/"
+        response_text = openml._api_calls._perform_api_call(
+            call,
+            "post",
+            file_elements=file_elements,
+        )
+        xml_response = xmltodict.parse(response_text)
 
+        self._parse_publish_response(xml_response)
         return self
 
     def open_in_browser(self) -> None:
diff --git a/openml/flows/flow.py b/openml/flows/flow.py
index 7dd84fdee..5d507907c 100644
--- a/openml/flows/flow.py
+++ b/openml/flows/flow.py
@@ -431,6 +431,7 @@ def publish(self, raise_error_if_exists: bool = False) -> OpenMLFlow:  # noqa: F
         # get_flow(), while functions.py tries to import flow.py in order to
         # instantiate an OpenMLFlow.
         import openml.flows.functions
+        from openml._api import api_context
 
         flow_id = openml.flows.functions.flow_exists(self.name, self.external_version)
         if not flow_id:
@@ -438,9 +439,13 @@ def publish(self, raise_error_if_exists: bool = False) -> OpenMLFlow:  # noqa: F
                 raise openml.exceptions.PyOpenMLError(
                     "Flow does not exist on the server, but 'flow.flow_id' is not None.",
                 )
-            super().publish()
-            assert self.flow_id is not None  # for mypy
-            flow_id = self.flow_id
+
+            file_elements = self._get_file_elements()
+            if "description" not in file_elements:
+                file_elements["description"] = self._to_xml()
+
+            flow_id = api_context.backend.flows.publish(path="flow", files=file_elements)
+            self.flow_id = flow_id
         elif raise_error_if_exists:
             error_message = f"This OpenMLFlow already exists with id: {flow_id}."
             raise openml.exceptions.PyOpenMLError(error_message)
diff --git a/tests/test_flows/test_flows_migration.py b/tests/test_flows/test_flows_migration.py
index 1636e6180..efd1f4b4b 100644
--- a/tests/test_flows/test_flows_migration.py
+++ b/tests/test_flows/test_flows_migration.py
@@ -2,6 +2,8 @@
 """Tests for Flow V1 → V2 API Migration."""
 from __future__ import annotations
 
+import uuid
+
 import pytest
 
 from openml._api.resources import FallbackProxy, FlowsV1, FlowsV2
@@ -81,37 +83,67 @@ def test_list_with_tag_limit_offset(self):
         if len(flows_df) > 0:
             assert "id" in flows_df.columns
     
-    @pytest.mark.uses_test_server()
-    def test_publish(self):
-        """Test publishing a sklearn flow using V1 API."""
-        from openml_sklearn.extension import SklearnExtension
-        from sklearn.tree import ExtraTreeRegressor
-        clf = ExtraTreeRegressor()
-        extension = SklearnExtension()
-        dt_flow = extension.model_to_flow(clf)
-        published_flow = self.resource.publish(dt_flow)
-        assert isinstance(published_flow, OpenMLFlow)
-        assert getattr(published_flow, "id", None) is not None
-    
     @pytest.mark.uses_test_server()
     def test_delete(self):
         """Test deleting a flow using V1 API."""
         from openml_sklearn.extension import SklearnExtension
         from sklearn.tree import ExtraTreeRegressor
+
         clf = ExtraTreeRegressor()
         extension = SklearnExtension()
         dt_flow = extension.model_to_flow(clf)
+
+        # Check if flow exists, if not publish it
         flow_id = self.resource.exists(
             name=dt_flow.name,
-            external_version=dt_flow.external_version
+            external_version=dt_flow.external_version,
         )
+        
+        if not flow_id:
+            # Publish the flow first
+            file_elements = dt_flow._get_file_elements()
+            if "description" not in file_elements:
+                file_elements["description"] = dt_flow._to_xml()
+            
+            flow_id = self.resource.publish(file_elements)
+        
+        # Now delete it
         result = self.resource.delete(flow_id)
         assert result is True
+
+        # Verify it no longer exists
         exists = self.resource.exists(
             name=dt_flow.name,
-            external_version=dt_flow.external_version
+            external_version=dt_flow.external_version,
         )
         assert exists is False
+    
+    @pytest.mark.uses_test_server()
+    def test_publish(self):
+        """Test publishing a sklearn flow using V1 API."""
+        from openml_sklearn.extension import SklearnExtension
+        from sklearn.tree import ExtraTreeRegressor
+
+        clf = ExtraTreeRegressor()
+        extension = SklearnExtension()
+        dt_flow = extension.model_to_flow(clf)
+
+        # Check if flow already exists
+        flow_id = self.resource.exists(
+            name=dt_flow.name,
+            external_version=dt_flow.external_version,
+        )
+        
+        if not flow_id:
+            file_elements = dt_flow._get_file_elements()
+            if "description" not in file_elements:
+                print("Adding description to flow XML")
+                file_elements["description"] = dt_flow._to_xml()
+                
+            flow_id = self.resource.publish(file_elements)
+
+        assert isinstance(flow_id, int)
+        assert flow_id > 0
 
 
 

From f25c95be3632899435782c72862787246f3c3d7c Mon Sep 17 00:00:00 2001
From: Omswastik-11 <omswastikpanda11@gmail.com>
Date: Fri, 30 Jan 2026 10:48:00 +0530
Subject: [PATCH 34/34] tests:added tests for migration

Signed-off-by: Omswastik-11 <omswastikpanda11@gmail.com>
---
 tests/test_flows/test_flows_migration.py | 19 ++++++++++---------
 1 file changed, 10 insertions(+), 9 deletions(-)

diff --git a/tests/test_flows/test_flows_migration.py b/tests/test_flows/test_flows_migration.py
index efd1f4b4b..b29d75bc3 100644
--- a/tests/test_flows/test_flows_migration.py
+++ b/tests/test_flows/test_flows_migration.py
@@ -105,7 +105,7 @@ def test_delete(self):
             if "description" not in file_elements:
                 file_elements["description"] = dt_flow._to_xml()
             
-            flow_id = self.resource.publish(file_elements)
+            flow_id = self.resource.publish(files=file_elements)
         
         # Now delete it
         result = self.resource.delete(flow_id)
@@ -134,14 +134,15 @@ def test_publish(self):
             external_version=dt_flow.external_version,
         )
         
-        if not flow_id:
-            file_elements = dt_flow._get_file_elements()
-            if "description" not in file_elements:
-                print("Adding description to flow XML")
-                file_elements["description"] = dt_flow._to_xml()
-                
-            flow_id = self.resource.publish(file_elements)
-
+        if flow_id:
+            _ = self.resource.delete(flow_id)
+            
+        file_elements = dt_flow._get_file_elements()
+        if "description" not in file_elements:
+            print("Adding description to flow XML")
+            file_elements["description"] = dt_flow._to_xml()
+            
+        flow_id = self.resource.publish(files=file_elements)
         assert isinstance(flow_id, int)
         assert flow_id > 0