Skip to content

Commit 7a6f845

Browse files
committed
refactor: Remove "array" format
1 parent 26ae499 commit 7a6f845

File tree

19 files changed

+368
-1079
lines changed

19 files changed

+368
-1079
lines changed

examples/20_basic/simple_datasets_tutorial.py

+3-3
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,7 @@
1919
# List datasets
2020
# =============
2121

22-
datasets_df = openml.datasets.list_datasets(output_format="dataframe")
22+
datasets_df = openml.datasets.list_datasets()
2323
print(datasets_df.head(n=10))
2424

2525
############################################################################
@@ -48,7 +48,7 @@
4848
# attribute_names - the names of the features for the examples (X) and
4949
# target feature (y)
5050
X, y, categorical_indicator, attribute_names = dataset.get_data(
51-
dataset_format="dataframe", target=dataset.default_target_attribute
51+
target=dataset.default_target_attribute
5252
)
5353

5454
############################################################################
@@ -63,9 +63,9 @@
6363
# Visualize the dataset
6464
# =====================
6565

66+
import matplotlib.pyplot as plt
6667
import pandas as pd
6768
import seaborn as sns
68-
import matplotlib.pyplot as plt
6969

7070
sns.set_style("darkgrid")
7171

examples/30_extended/task_manual_iteration_tutorial.py

+4-4
Original file line numberDiff line numberDiff line change
@@ -68,7 +68,7 @@
6868
####################################################################################################
6969
# And then split the data based on this:
7070

71-
X, y = task.get_X_and_y(dataset_format="dataframe")
71+
X, y = task.get_X_and_y()
7272
X_train = X.iloc[train_indices]
7373
y_train = y.iloc[train_indices]
7474
X_test = X.iloc[test_indices]
@@ -88,7 +88,7 @@
8888

8989
task_id = 3
9090
task = openml.tasks.get_task(task_id)
91-
X, y = task.get_X_and_y(dataset_format="dataframe")
91+
X, y = task.get_X_and_y()
9292
n_repeats, n_folds, n_samples = task.get_split_dimensions()
9393
print(
9494
"Task {}: number of repeats: {}, number of folds: {}, number of samples {}.".format(
@@ -132,7 +132,7 @@
132132

133133
task_id = 1767
134134
task = openml.tasks.get_task(task_id)
135-
X, y = task.get_X_and_y(dataset_format="dataframe")
135+
X, y = task.get_X_and_y()
136136
n_repeats, n_folds, n_samples = task.get_split_dimensions()
137137
print(
138138
"Task {}: number of repeats: {}, number of folds: {}, number of samples {}.".format(
@@ -176,7 +176,7 @@
176176

177177
task_id = 1702
178178
task = openml.tasks.get_task(task_id)
179-
X, y = task.get_X_and_y(dataset_format="dataframe")
179+
X, y = task.get_X_and_y()
180180
n_repeats, n_folds, n_samples = task.get_split_dimensions()
181181
print(
182182
"Task {}: number of repeats: {}, number of folds: {}, number of samples {}.".format(

openml/datasets/functions.py

+22-130
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@
77
from collections import OrderedDict
88
from pathlib import Path
99
from pyexpat import ExpatError
10-
from typing import TYPE_CHECKING, Any, overload
10+
from typing import TYPE_CHECKING, Any
1111
from typing_extensions import Literal
1212

1313
import arff
@@ -75,54 +75,16 @@ def list_qualities() -> list[str]:
7575
return qualities["oml:data_qualities_list"]["oml:quality"]
7676

7777

78-
@overload
79-
def list_datasets(
80-
data_id: list[int] | None = ...,
81-
offset: int | None = ...,
82-
size: int | None = ...,
83-
status: str | None = ...,
84-
tag: str | None = ...,
85-
*,
86-
output_format: Literal["dataframe"],
87-
**kwargs: Any,
88-
) -> pd.DataFrame: ...
89-
90-
91-
@overload
92-
def list_datasets(
93-
data_id: list[int] | None,
94-
offset: int | None,
95-
size: int | None,
96-
status: str | None,
97-
tag: str | None,
98-
output_format: Literal["dataframe"],
99-
**kwargs: Any,
100-
) -> pd.DataFrame: ...
101-
102-
103-
@overload
104-
def list_datasets(
105-
data_id: list[int] | None = ...,
106-
offset: int | None = ...,
107-
size: int | None = ...,
108-
status: str | None = ...,
109-
tag: str | None = ...,
110-
output_format: Literal["dict"] = "dict",
111-
**kwargs: Any,
112-
) -> pd.DataFrame: ...
113-
114-
11578
def list_datasets(
11679
data_id: list[int] | None = None,
11780
offset: int | None = None,
11881
size: int | None = None,
11982
status: str | None = None,
12083
tag: str | None = None,
121-
output_format: Literal["dataframe", "dict"] = "dict",
12284
**kwargs: Any,
123-
) -> dict | pd.DataFrame:
124-
"""
125-
Return a list of all dataset which are on OpenML.
85+
) -> pd.DataFrame:
86+
"""Return a dataframe of all dataset which are on OpenML.
87+
12688
Supports large amount of results.
12789
12890
Parameters
@@ -139,87 +101,36 @@ def list_datasets(
139101
default active datasets are returned, but also datasets
140102
from another status can be requested.
141103
tag : str, optional
142-
output_format: str, optional (default='dict')
143-
The parameter decides the format of the output.
144-
- If 'dict' the output is a dict of dict
145-
- If 'dataframe' the output is a pandas DataFrame
146104
kwargs : dict, optional
147105
Legal filter operators (keys in the dict):
148106
data_name, data_version, number_instances,
149107
number_features, number_classes, number_missing_values.
150108
151109
Returns
152110
-------
153-
datasets : dict of dicts, or dataframe
154-
- If output_format='dict'
155-
A mapping from dataset ID to dict.
156-
157-
Every dataset is represented by a dictionary containing
158-
the following information:
159-
- dataset id
160-
- name
161-
- format
162-
- status
163-
If qualities are calculated for the dataset, some of
164-
these are also returned.
165-
166-
- If output_format='dataframe'
167-
Each row maps to a dataset
168-
Each column contains the following information:
169-
- dataset id
170-
- name
171-
- format
172-
- status
173-
If qualities are calculated for the dataset, some of
174-
these are also included as columns.
111+
datasets: dataframe
112+
Each row maps to a dataset
113+
Each column contains the following information:
114+
- dataset id
115+
- name
116+
- format
117+
- status
118+
If qualities are calculated for the dataset, some of
119+
these are also included as columns.
175120
"""
176-
if output_format not in ["dataframe", "dict"]:
177-
raise ValueError(
178-
"Invalid output format selected. " "Only 'dict' or 'dataframe' applicable.",
179-
)
180-
181-
# TODO: [0.15]
182-
if output_format == "dict":
183-
msg = (
184-
"Support for `output_format` of 'dict' will be removed in 0.15 "
185-
"and pandas dataframes will be returned instead. To ensure your code "
186-
"will continue to work, use `output_format`='dataframe'."
187-
)
188-
warnings.warn(msg, category=FutureWarning, stacklevel=2)
189-
190-
return openml.utils._list_all( # type: ignore
191-
data_id=data_id,
192-
list_output_format=output_format, # type: ignore
121+
batches = openml.utils._list_all(
193122
listing_call=_list_datasets,
123+
data_id=data_id,
194124
offset=offset,
195125
size=size,
196126
status=status,
197127
tag=tag,
198128
**kwargs,
199129
)
130+
return pd.concat(batches, ignore_index=True)
200131

201132

202-
@overload
203-
def _list_datasets(
204-
data_id: list | None = ...,
205-
output_format: Literal["dict"] = "dict",
206-
**kwargs: Any,
207-
) -> dict: ...
208-
209-
210-
@overload
211-
def _list_datasets(
212-
data_id: list | None = ...,
213-
output_format: Literal["dataframe"] = "dataframe",
214-
**kwargs: Any,
215-
) -> pd.DataFrame: ...
216-
217-
218-
def _list_datasets(
219-
data_id: list | None = None,
220-
output_format: Literal["dict", "dataframe"] = "dict",
221-
**kwargs: Any,
222-
) -> dict | pd.DataFrame:
133+
def _list_datasets(data_id: list[int] | None = None, **kwargs: Any) -> pd.DataFrame:
223134
"""
224135
Perform an API call to return a list of all datasets.
225136
@@ -232,18 +143,14 @@ def _list_datasets(
232143
233144
data_id : list, optional
234145
235-
output_format: str, optional (default='dict')
236-
The parameter decides the format of the output.
237-
- If 'dict' the output is a dict of dict
238-
- If 'dataframe' the output is a pandas DataFrame
239146
kwargs : dict, optional
240147
Legal filter operators (keys in the dict):
241148
tag, status, limit, offset, data_name, data_version, number_instances,
242149
number_features, number_classes, number_missing_values.
243150
244151
Returns
245152
-------
246-
datasets : dict of dicts, or dataframe
153+
datasets : dataframe
247154
"""
248155
api_call = "data/list"
249156

@@ -252,21 +159,10 @@ def _list_datasets(
252159
api_call += f"/{operator}/{value}"
253160
if data_id is not None:
254161
api_call += "/data_id/{}".format(",".join([str(int(i)) for i in data_id]))
255-
return __list_datasets(api_call=api_call, output_format=output_format)
256-
257-
258-
@overload
259-
def __list_datasets(api_call: str, output_format: Literal["dict"] = "dict") -> dict: ...
260-
162+
return __list_datasets(api_call=api_call)
261163

262-
@overload
263-
def __list_datasets(api_call: str, output_format: Literal["dataframe"]) -> pd.DataFrame: ...
264164

265-
266-
def __list_datasets(
267-
api_call: str,
268-
output_format: Literal["dict", "dataframe"] = "dict",
269-
) -> dict | pd.DataFrame:
165+
def __list_datasets(api_call: str) -> pd.DataFrame:
270166
xml_string = openml._api_calls._perform_api_call(api_call, "get")
271167
datasets_dict = xmltodict.parse(xml_string, force_list=("oml:dataset",))
272168

@@ -295,10 +191,7 @@ def __list_datasets(
295191
dataset[quality["@name"]] = float(quality["#text"])
296192
datasets[dataset["did"]] = dataset
297193

298-
if output_format == "dataframe":
299-
datasets = pd.DataFrame.from_dict(datasets, orient="index")
300-
301-
return datasets
194+
return pd.DataFrame.from_dict(datasets, orient="index")
302195

303196

304197
def _expand_parameter(parameter: str | list[str] | None) -> list[str]:
@@ -1493,8 +1386,7 @@ def _get_online_dataset_arff(dataset_id: int) -> str | None:
14931386

14941387

14951388
def _get_online_dataset_format(dataset_id: int) -> str:
1496-
"""Get the dataset format for a given dataset id
1497-
from the OpenML website.
1389+
"""Get the dataset format for a given dataset id from the OpenML website.
14981390
14991391
Parameters
15001392
----------

openml/evaluations/evaluation.py

+20
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,8 @@
88
import openml.tasks
99

1010

11+
# TODO(eddiebergman): A lot of this class is automatically
12+
# handled by a dataclass
1113
class OpenMLEvaluation:
1214
"""
1315
Contains all meta-information about a run / evaluation combination,
@@ -78,6 +80,24 @@ def __init__( # noqa: PLR0913
7880
self.values = values
7981
self.array_data = array_data
8082

83+
def _to_dict(self) -> dict:
84+
return {
85+
"run_id": self.run_id,
86+
"task_id": self.task_id,
87+
"setup_id": self.setup_id,
88+
"flow_id": self.flow_id,
89+
"flow_name": self.flow_name,
90+
"data_id": self.data_id,
91+
"data_name": self.data_name,
92+
"function": self.function,
93+
"upload_time": self.upload_time,
94+
"uploader": self.uploader,
95+
"uploader_name": self.uploader_name,
96+
"value": self.value,
97+
"values": self.values,
98+
"array_data": self.array_data,
99+
}
100+
81101
def __repr__(self) -> str:
82102
header = "OpenML Evaluation"
83103
header = "{}\n{}\n".format(header, "=" * len(header))

0 commit comments

Comments
 (0)