{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import openml\n",
    "\n",
    "def generate_latex_table(dataset_ids):\n",
    "    \"\"\"Generates a LaTeX table with an overview of OpenML datasets.\"\"\"\n",
    "    table_header = r\"\"\"\\begin{table}[h]\n",
    "\\centering\n",
    "\\begin{tabular}{|c|c|c|c|c|}\n",
    "\\hline\n",
    "ID & Name & Features & Classes & Data Points \\\\\n",
    "\\hline\"\"\"\n",
    "    table_rows = []\n",
    "    \n",
    "    for dataset_id in dataset_ids:\n",
    "        try:\n",
    "            dataset = openml.datasets.get_dataset(dataset_id)\n",
    "            name = dataset.name\n",
    "            features = len(dataset.features)\n",
    "            classes = len(dataset.retrieve_class_labels()) if dataset.retrieve_class_labels() else \"N/A\"\n",
    "            datapoints = dataset.qualities.get(\"NumberOfInstances\", \"N/A\")\n",
    "            \n",
    "            row = f\"{dataset_id} & {name} & {features} & {classes} & {datapoints} \\\\\\hline\"\n",
    "            table_rows.append(row)\n",
    "        except Exception as e:\n",
    "            print(f\"Failed to fetch dataset {dataset_id}: {e}\")\n",
    "    \n",
    "    table_footer = \"\"\"\\end{tabular}\n",
    "\\caption{Overview of OpenML datasets}\n",
    "\\label{tab:openml_datasets}\n",
    "\\end{table}\"\"\"\n",
    "    \n",
    "    latex_table = \"\\n\".join([table_header] + table_rows + [table_footer])\n",
    "    return latex_table\n",
    "\n",
    "# Example usage\n",
    "dataset_ids = [35,41,54,61, 187, 15, 31, 4534]  # Replace with desired OpenML dataset IDs\n",
    "latex_code = generate_latex_table(dataset_ids)\n",
    "print(latex_code)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import openml\n",
    "\n",
    "def generate_latex_table(dataset_ids):\n",
    "    \"\"\"Generates a LaTeX table with an overview of OpenML datasets suitable for a single column in a two-column document.\"\"\"\n",
    "    table_header = r\"\"\"\\begin{table}[h]\n",
    "\\centering\n",
    "\\resizebox{\\columnwidth}{!}{%\n",
    "\\begin{tabular}{|c|c|c|c|c|}\n",
    "\\hline\n",
    "ID & Name & Feat. & Classes & Inst. \\\\\n",
    "\\hline\"\"\"\n",
    "    table_rows = []\n",
    "    \n",
    "    dataset_info = []\n",
    "    \n",
    "    for dataset_id in dataset_ids:\n",
    "        try:\n",
    "            dataset = openml.datasets.get_dataset(dataset_id)\n",
    "            name = dataset.name\n",
    "            features = len(dataset.features)\n",
    "            qualities = dataset.qualities\n",
    "            classes = qualities.get(\"NumberOfClasses\", \"N/A\")\n",
    "            datapoints = qualities.get(\"NumberOfInstances\", \"N/A\")\n",
    "            classes = int(classes)\n",
    "            datapoints = int(datapoints)\n",
    "            \n",
    "            dataset_info.append((dataset_id, name, features, classes, datapoints))\n",
    "        except Exception as e:\n",
    "            print(f\"Failed to fetch dataset {dataset_id}: {e}\")\n",
    "    \n",
    "    dataset_info.sort(key=lambda x: (x[3] if isinstance(x[3], (int, float)) else float('inf')))\n",
    "    \n",
    "    for dataset_id, name, features, classes, datapoints in dataset_info:\n",
    "        row = f\"{dataset_id} & {name} & {features} & {classes} & {datapoints} \\\\\\hline\"\n",
    "        table_rows.append(row)\n",
    "    \n",
    "    table_footer = r\"\"\"\\end{tabular}}\n",
    "\\caption{Overview of OpenML datasets sorted by number of classes}\n",
    "\\label{tab:openml_datasets}\n",
    "\\end{table}\"\"\"\n",
    "    \n",
    "    latex_table = \"\\n\".join([table_header] + table_rows + [table_footer])\n",
    "    return latex_table\n",
    "\n",
    "# Example usage\n",
    "dataset_ids = [35,41,54,61, 187, 15, 31, 4534]  # Replace with desired OpenML dataset IDs\n",
    "latex_code = generate_latex_table(dataset_ids)\n",
    "print(latex_code)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "plnet",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.10"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
