Move utility functions to a separate dispatcher file

Omswastik-11 · Omswastik-11 · commit b10eb12e593e · 2026-01-13T19:59:19.000+05:30
diff --git a/openml/__init__.py b/openml/__init__.py
@@ -18,12 +18,11 @@
 # License: BSD 3-Clause
 from __future__ import annotations
 
-from typing import Any, Callable, Dict
-
 from . import (
     _api_calls,
     config,
     datasets,
+    dispatchers,
     evaluations,
     exceptions,
     extensions,
@@ -36,6 +35,7 @@
 )
 from .__version__ import __version__
 from .datasets import OpenMLDataFeature, OpenMLDataset
+from .dispatchers import get, list_all
 from .evaluations import OpenMLEvaluation
 from .flows import OpenMLFlow
 from .runs import OpenMLRun
@@ -51,102 +51,6 @@
     OpenMLTask,
 )
 
-ListDispatcher = Dict[str, Callable[..., Any]]
-GetDispatcher = Dict[str, Callable[..., Any]]
-
-_LIST_DISPATCH: ListDispatcher = {
-    "dataset": datasets.functions.list_datasets,
-    "task": tasks.functions.list_tasks,
-    "flow": flows.functions.list_flows,
-    "run": runs.functions.list_runs,
-}
-
-_GET_DISPATCH: GetDispatcher = {
-    "dataset": datasets.functions.get_dataset,
-    "task": tasks.functions.get_task,
-    "flow": flows.functions.get_flow,
-    "run": runs.functions.get_run,
-}
-
-
-def list_all(object_type: str, /, **kwargs: Any) -> Any:
-    """List OpenML objects by type (e.g., datasets, tasks, flows, runs).
-
-    This is a convenience dispatcher that forwards to the existing type-specific
-    ``list_*`` functions. Existing imports remain available for backward compatibility.
-
-    Parameters
-    ----------
-    object_type : str
-        The type of object to list. Must be one of 'dataset', 'task', 'flow', 'run'.
-    **kwargs : Any
-        Additional arguments passed to the underlying list function.
-
-    Returns
-    -------
-    Any
-        The result from the type-specific list function (typically a DataFrame).
-
-    Raises
-    ------
-    ValueError
-        If object_type is not one of the supported types.
-    """
-    if not isinstance(object_type, str):
-        raise TypeError(f"object_type must be a string, got {type(object_type).__name__}")
-
-    func = _LIST_DISPATCH.get(object_type.lower())
-    if func is None:
-        valid_types = ", ".join(repr(k) for k in _LIST_DISPATCH)
-        raise ValueError(
-            f"Unsupported object_type {object_type!r}; expected one of {valid_types}.",
-        )
-
-    return func(**kwargs)
-
-
-def get(identifier: int | str, *, object_type: str = "dataset", **kwargs: Any) -> Any:
-    """Get an OpenML object by identifier.
-
-    Parameters
-    ----------
-    identifier : int | str
-        The ID or name of the object to retrieve.
-    object_type : str, default="dataset"
-        The type of object to get. Must be one of 'dataset', 'task', 'flow', 'run'.
-    **kwargs : Any
-        Additional arguments passed to the underlying get function.
-
-    Returns
-    -------
-    Any
-        The requested OpenML object.
-
-    Raises
-    ------
-    ValueError
-        If object_type is not one of the supported types.
-
-    Examples
-    --------
-    >>> openml.get(61)  # Get dataset 61 (default object_type="dataset")
-    >>> openml.get("Fashion-MNIST")  # Get dataset by name
-    >>> openml.get(31, object_type="task")  # Get task 31
-    >>> openml.get(10, object_type="flow")  # Get flow 10
-    >>> openml.get(20, object_type="run")  # Get run 20
-    """
-    if not isinstance(object_type, str):
-        raise TypeError(f"object_type must be a string, got {type(object_type).__name__}")
-
-    func = _GET_DISPATCH.get(object_type.lower())
-    if func is None:
-        valid_types = ", ".join(repr(k) for k in _GET_DISPATCH)
-        raise ValueError(
-            f"Unsupported object_type {object_type!r}; expected one of {valid_types}.",
-        )
-
-    return func(identifier, **kwargs)
-
 
 def populate_cache(
     task_ids: list[int] | None = None,
@@ -206,6 +110,7 @@ def populate_cache(
     "OpenMLStudy",
     "OpenMLBenchmarkSuite",
     "datasets",
+    "dispatchers",
     "evaluations",
     "exceptions",
     "extensions",
diff --git a/openml/dispatchers.py b/openml/dispatchers.py
@@ -0,0 +1,107 @@
+"""OpenML API dispatchers for unified get/list operations."""
+
+# License: BSD 3-Clause
+from __future__ import annotations
+
+from typing import Any, Callable, Dict
+
+from .datasets import get_dataset, list_datasets
+from .flows import get_flow, list_flows
+from .runs import get_run, list_runs
+from .tasks import get_task, list_tasks
+
+ListDispatcher = Dict[str, Callable[..., Any]]
+GetDispatcher = Dict[str, Callable[..., Any]]
+
+_LIST_DISPATCH: ListDispatcher = {
+    "dataset": list_datasets,
+    "task": list_tasks,
+    "flow": list_flows,
+    "run": list_runs,
+}
+
+_GET_DISPATCH: GetDispatcher = {
+    "dataset": get_dataset,
+    "task": get_task,
+    "flow": get_flow,
+    "run": get_run,
+}
+
+
+def list_all(object_type: str, /, **kwargs: Any) -> Any:
+    """List OpenML objects by type (e.g., datasets, tasks, flows, runs).
+
+    This is a convenience dispatcher that forwards to the existing type-specific
+    ``list_*`` functions. Existing imports remain available for backward compatibility.
+
+    Parameters
+    ----------
+    object_type : str
+        The type of object to list. Must be one of 'dataset', 'task', 'flow', 'run'.
+    **kwargs : Any
+        Additional arguments passed to the underlying list function.
+
+    Returns
+    -------
+    Any
+        The result from the type-specific list function (typically a DataFrame).
+
+    Raises
+    ------
+    TypeError or ValueError
+        If object_type is not a string, or is not one of the supported types.
+    """
+    if not isinstance(object_type, str):
+        raise TypeError(f"object_type must be a string, got {type(object_type).__name__}")
+
+    func = _LIST_DISPATCH.get(object_type.lower())
+    if func is None:
+        valid_types = ", ".join(repr(k) for k in _LIST_DISPATCH)
+        raise ValueError(
+            f"Unsupported object_type {object_type!r}; expected one of {valid_types}.",
+        )
+
+    return func(**kwargs)
+
+
+def get(identifier: int | str, *, object_type: str = "dataset", **kwargs: Any) -> Any:
+    """Get an OpenML object by identifier.
+
+    Parameters
+    ----------
+    identifier : int | str
+        The ID or name of the object to retrieve.
+    object_type : str, default="dataset"
+        The type of object to get. Must be one of 'dataset', 'task', 'flow', 'run'.
+    **kwargs : Any
+        Additional arguments passed to the underlying get function.
+
+    Returns
+    -------
+    Any
+        The requested OpenML object.
+
+    Raises
+    ------
+    TypeError or ValueError
+        If object_type is not a string, or is not one of the supported types.
+
+    Examples
+    --------
+    >>> openml.get(61)  # Get dataset 61 (default object_type="dataset")
+    >>> openml.get("Fashion-MNIST")  # Get dataset by name
+    >>> openml.get(31, object_type="task")  # Get task 31
+    >>> openml.get(10, object_type="flow")  # Get flow 10
+    >>> openml.get(20, object_type="run")  # Get run 20
+    """
+    if not isinstance(object_type, str):
+        raise TypeError(f"object_type must be a string, got {type(object_type).__name__}")
+
+    func = _GET_DISPATCH.get(object_type.lower())
+    if func is None:
+        valid_types = ", ".join(repr(k) for k in _GET_DISPATCH)
+        raise ValueError(
+            f"Unsupported object_type {object_type!r}; expected one of {valid_types}.",
+        )
+
+    return func(identifier, **kwargs)
diff --git a/tests/test_openml/test_openml.py b/tests/test_openml/test_openml.py
@@ -47,7 +47,7 @@ def test_populate_cache(
     def test_list_dispatch(self, list_datasets_mock, list_tasks_mock):
         # Need to patch after import, so update dispatch dict
         with mock.patch.dict(
-            "openml._LIST_DISPATCH",
+            "openml.dispatchers._LIST_DISPATCH",
             {
                 "dataset": list_datasets_mock,
                 "task": list_tasks_mock,
@@ -64,20 +64,20 @@ def test_list_dispatch(self, list_datasets_mock, list_tasks_mock):
     def test_get_dispatch(self, get_dataset_mock, get_task_mock):
         # Need to patch after import, so update dispatch dict
         with mock.patch.dict(
-            "openml._GET_DISPATCH",
+            "openml.dispatchers._GET_DISPATCH",
             {
                 "dataset": get_dataset_mock,
                 "task": get_task_mock,
             },
         ):
-            openml.get(61) 
+            openml.get(61)
             get_dataset_mock.assert_called_with(61)
 
-            openml.get("Fashion-MNIST", version=2) 
+            openml.get("Fashion-MNIST", version=2)
             get_dataset_mock.assert_called_with("Fashion-MNIST", version=2)
 
             openml.get("Fashion-MNIST")
             get_dataset_mock.assert_called_with("Fashion-MNIST")
 
-            openml.get(31, object_type="task") 
+            openml.get(31, object_type="task")
             get_task_mock.assert_called_with(31)