{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "16c6e1d3",
   "metadata": {},
   "source": [
    "# Table: Dataset Statistics"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "2615def3",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "from tqdm.auto import tqdm\n",
    "from gluonts.dataset.stat import calculate_dataset_statistics\n",
    "from tsbench.config import DATASET_REGISTRY\n",
    "\n",
    "%reload_ext autoreload\n",
    "%autoreload 2"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "bdb94749",
   "metadata": {},
   "source": [
    "## Dataset Summary"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "5d0e545e",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "19920b16a01a4323b9742096737caa21",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "  0%|          | 0/45 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n",
      "100%|██████████| 8/8 [00:00<00:00, 1101.52it/s]\n",
      "\n",
      "100%|██████████| 321/321 [00:01<00:00, 314.29it/s]\n",
      "\n",
      "100%|██████████| 137/137 [00:00<00:00, 1221.05it/s]\n",
      "\n",
      "100%|██████████| 9535/9535 [00:02<00:00, 4484.49it/s]\n",
      "\n",
      "100%|██████████| 1214/1214 [00:00<00:00, 3607.86it/s]\n",
      "\n",
      "100%|██████████| 1428/1428 [00:00<00:00, 10854.71it/s]\n",
      "\n",
      "100%|██████████| 756/756 [00:00<00:00, 12120.32it/s]\n",
      "\n",
      "100%|██████████| 645/645 [00:00<00:00, 12748.64it/s]\n",
      "\n",
      "100%|██████████| 174/174 [00:00<00:00, 11533.19it/s]\n",
      "\n",
      "100%|██████████| 414/414 [00:00<00:00, 5714.93it/s]\n",
      "\n",
      "100%|██████████| 4227/4227 [00:01<00:00, 2872.53it/s]\n",
      "\n",
      "100%|██████████| 359/359 [00:00<00:00, 4978.43it/s]\n",
      "\n",
      "100%|██████████| 48000/48000 [00:04<00:00, 9967.94it/s]\n",
      "\n",
      "100%|██████████| 24000/24000 [00:02<00:00, 11933.80it/s]\n",
      "\n",
      "100%|██████████| 22974/22974 [00:01<00:00, 13242.38it/s]\n",
      "\n",
      "  0%|          | 0/30490 [00:00<?, ?it/s]\u001b[A\n",
      " 37%|███▋      | 11232/30490 [00:10<00:17, 1123.13it/s]\u001b[A\n",
      "100%|██████████| 30490/30490 [00:27<00:00, 1123.43it/s]\u001b[A\n",
      "\n",
      "100%|██████████| 366/366 [00:00<00:00, 8847.62it/s]\n",
      "\n",
      "100%|██████████| 427/427 [00:00<00:00, 11380.33it/s]\n",
      "\n",
      "100%|██████████| 518/518 [00:00<00:00, 13284.23it/s]\n",
      "\n",
      "  0%|          | 0/145026 [00:00<?, ?it/s]\u001b[A\n",
      " 36%|███▋      | 52705/145026 [00:10<00:17, 5270.39it/s]\u001b[A\n",
      "100%|██████████| 145026/145026 [00:27<00:00, 5229.72it/s]\u001b[A\n",
      "\n",
      "100%|██████████| 111/111 [00:00<00:00, 5869.27it/s]\n",
      "\n",
      "  0%|          | 0/5559 [00:00<?, ?it/s]\u001b[A\n",
      "100%|██████████| 5559/5559 [00:16<00:00, 328.50it/s]\u001b[A\n",
      "\n",
      "  0%|          | 0/313 [00:00<?, ?it/s]\u001b[A\n",
      "100%|██████████| 313/313 [00:17<00:00, 18.05it/s]\u001b[A\n",
      "\n",
      "100%|██████████| 2504/2504 [00:00<00:00, 12856.75it/s]\n",
      "\n",
      "100%|██████████| 115163/115163 [00:09<00:00, 11842.79it/s]\n",
      "\n",
      "100%|██████████| 107/107 [00:00<00:00, 6172.34it/s]\n",
      "\n",
      "100%|██████████| 862/862 [00:01<00:00, 538.94it/s]\n",
      "\n",
      "100%|██████████| 66/66 [00:00<00:00, 141.22it/s]\n",
      "\n",
      "100%|██████████| 767/767 [00:00<00:00, 11753.69it/s]\n",
      "\n",
      "100%|██████████| 227/227 [00:00<00:00, 9770.41it/s]\n",
      "\n",
      "100%|██████████| 270/270 [00:00<00:00, 860.72it/s]\n",
      "\n",
      "100%|██████████| 72/72 [00:00<00:00, 10828.67it/s]\n",
      "\n",
      "100%|██████████| 5/5 [00:00<00:00, 29.55it/s]\n",
      "\n",
      "100%|██████████| 17/17 [00:00<00:00, 1496.11it/s]\n",
      "\n",
      "100%|██████████| 2304/2304 [00:00<00:00, 8337.55it/s]\n",
      "\n",
      "100%|██████████| 314/314 [00:00<00:00, 9914.72it/s]\n",
      "\n",
      "100%|██████████| 3010/3010 [00:04<00:00, 671.98it/s]\n",
      "\n",
      "100%|██████████| 32053/32053 [00:04<00:00, 6957.12it/s]\n",
      "\n",
      "100%|██████████| 181/181 [00:00<00:00, 12683.89it/s]\n",
      "\n",
      "100%|██████████| 203/203 [00:00<00:00, 11931.67it/s]\n",
      "\n",
      "100%|██████████| 617/617 [00:00<00:00, 12142.34it/s]\n",
      "\n",
      "100%|██████████| 1115/1115 [00:00<00:00, 4536.40it/s]\n",
      "\n",
      "  0%|          | 0/171091 [00:00<?, ?it/s]\u001b[A\n",
      " 25%|██▍       | 42389/171091 [00:10<00:30, 4238.81it/s]\u001b[A\n",
      " 51%|█████▏    | 88064/171091 [00:20<00:18, 4432.14it/s]\u001b[A\n",
      "100%|██████████| 171091/171091 [00:32<00:00, 5240.78it/s]\u001b[A\n",
      "\n",
      "100%|██████████| 2934/2934 [00:00<00:00, 11397.30it/s]\n",
      "\n",
      "100%|██████████| 823/823 [00:00<00:00, 7851.98it/s]\n"
     ]
    }
   ],
   "source": [
    "# Build one summary row per dataset registered in DATASET_REGISTRY.\n",
    "results = []\n",
    "for dataset, config in tqdm(DATASET_REGISTRY.items()):\n",
    "    meta = config.meta\n",
    "    # Summary statistics come from the training split (loaded with val=False), while\n",
    "    # the date range below is taken from the test split. The validation split is not\n",
    "    # needed for either, so it is not loaded.\n",
    "    data = config.data.train(val=False).gluonts()\n",
    "    test_data = config.data.test().gluonts()\n",
    "    stats = calculate_dataset_statistics(data)\n",
    "\n",
    "    # Start from None instead of sentinel timestamps so the reported range never\n",
    "    # depends on hard-coded bounds; an empty split yields missing values.\n",
    "    min_date = None\n",
    "    max_date = None\n",
    "    for item in test_data:\n",
    "        start = item[\"start\"]\n",
    "        # `end` advances `start` by one frequency step per target value, i.e. it is\n",
    "        # one step past the last observation (assuming evenly spaced values).\n",
    "        end = start + len(item[\"target\"]) * start.freq\n",
    "        min_date = start if min_date is None else min(min_date, start)\n",
    "        max_date = end if max_date is None else max(max_date, end)\n",
    "\n",
    "    results.append({\n",
    "        \"dataset\": dataset,\n",
    "        \"frequency\": meta.freq,\n",
    "        \"prediction_length\": meta.prediction_length,\n",
    "        \"integer_dataset\": stats.integer_dataset,\n",
    "        \"num_time_series\": stats.num_time_series,\n",
    "        \"mean_length\": stats.mean_target_length,\n",
    "        \"max_length\": stats.max_target_length,\n",
    "        \"num_values\": stats.num_time_observations,\n",
    "        \"min_date\": min_date,\n",
    "        \"max_date\": max_date,\n",
    "    })\n",
    "\n",
    "# Assemble the rows into a table indexed by dataset name.\n",
    "statistics = pd.DataFrame(results).set_index(\"dataset\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "cdd89b3b",
   "metadata": {
    "scrolled": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>frequency</th>\n",
       "      <th>prediction_length</th>\n",
       "      <th>integer_dataset</th>\n",
       "      <th>num_time_series</th>\n",
       "      <th>mean_length</th>\n",
       "      <th>max_length</th>\n",
       "      <th>num_values</th>\n",
       "      <th>min_date</th>\n",
       "      <th>max_date</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>dataset</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>australian_electricity_demand</th>\n",
       "      <td>0.5H</td>\n",
       "      <td>48</td>\n",
       "      <td>False</td>\n",
       "      <td>5</td>\n",
       "      <td>231004.800000</td>\n",
       "      <td>232224</td>\n",
       "      <td>1155024</td>\n",
       "      <td>2002-01-01 00:00:00</td>\n",
       "      <td>2015-04-02 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>bitcoin</th>\n",
       "      <td>D</td>\n",
       "      <td>30</td>\n",
       "      <td>False</td>\n",
       "      <td>17</td>\n",
       "      <td>4134.058824</td>\n",
       "      <td>4551</td>\n",
       "      <td>70279</td>\n",
       "      <td>2009-01-03 00:00:00</td>\n",
       "      <td>2021-07-20 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>car_parts</th>\n",
       "      <td>M</td>\n",
       "      <td>12</td>\n",
       "      <td>True</td>\n",
       "      <td>2504</td>\n",
       "      <td>39.000000</td>\n",
       "      <td>39</td>\n",
       "      <td>97656</td>\n",
       "      <td>1998-01-31 00:00:00</td>\n",
       "      <td>2002-04-30 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>cif_2016</th>\n",
       "      <td>M</td>\n",
       "      <td>12</td>\n",
       "      <td>False</td>\n",
       "      <td>72</td>\n",
       "      <td>86.722222</td>\n",
       "      <td>108</td>\n",
       "      <td>6244</td>\n",
       "      <td>1970-01-31 00:00:00</td>\n",
       "      <td>1980-01-31 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>corporacion_favorita</th>\n",
       "      <td>D</td>\n",
       "      <td>16</td>\n",
       "      <td>False</td>\n",
       "      <td>171091</td>\n",
       "      <td>1088.955690</td>\n",
       "      <td>1672</td>\n",
       "      <td>186310518</td>\n",
       "      <td>2013-01-01 00:00:00</td>\n",
       "      <td>2017-08-16 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>covid_deaths</th>\n",
       "      <td>D</td>\n",
       "      <td>30</td>\n",
       "      <td>True</td>\n",
       "      <td>227</td>\n",
       "      <td>182.000000</td>\n",
       "      <td>182</td>\n",
       "      <td>41314</td>\n",
       "      <td>2020-01-22 00:00:00</td>\n",
       "      <td>2020-08-21 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>dominick</th>\n",
       "      <td>W</td>\n",
       "      <td>8</td>\n",
       "      <td>False</td>\n",
       "      <td>115163</td>\n",
       "      <td>157.490192</td>\n",
       "      <td>385</td>\n",
       "      <td>18137043</td>\n",
       "      <td>1970-01-04 00:00:00</td>\n",
       "      <td>1977-07-17 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>electricity</th>\n",
       "      <td>1H</td>\n",
       "      <td>24</td>\n",
       "      <td>True</td>\n",
       "      <td>321</td>\n",
       "      <td>21044.000000</td>\n",
       "      <td>21044</td>\n",
       "      <td>6755124</td>\n",
       "      <td>2012-01-01 00:00:00</td>\n",
       "      <td>2014-06-02 20:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>exchange_rate</th>\n",
       "      <td>B</td>\n",
       "      <td>30</td>\n",
       "      <td>False</td>\n",
       "      <td>8</td>\n",
       "      <td>6071.000000</td>\n",
       "      <td>6071</td>\n",
       "      <td>48568</td>\n",
       "      <td>1990-01-01 00:00:00</td>\n",
       "      <td>2013-11-05 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>fred_md</th>\n",
       "      <td>M</td>\n",
       "      <td>12</td>\n",
       "      <td>False</td>\n",
       "      <td>107</td>\n",
       "      <td>716.000000</td>\n",
       "      <td>716</td>\n",
       "      <td>76612</td>\n",
       "      <td>1959-01-31 00:00:00</td>\n",
       "      <td>2019-09-30 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>hospital</th>\n",
       "      <td>M</td>\n",
       "      <td>12</td>\n",
       "      <td>True</td>\n",
       "      <td>767</td>\n",
       "      <td>72.000000</td>\n",
       "      <td>72</td>\n",
       "      <td>55224</td>\n",
       "      <td>2000-01-31 00:00:00</td>\n",
       "      <td>2007-01-31 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>kdd_2018</th>\n",
       "      <td>H</td>\n",
       "      <td>48</td>\n",
       "      <td>False</td>\n",
       "      <td>270</td>\n",
       "      <td>10849.644444</td>\n",
       "      <td>10872</td>\n",
       "      <td>2929404</td>\n",
       "      <td>2017-01-01 00:00:00</td>\n",
       "      <td>2018-04-01 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>london_smart_meters</th>\n",
       "      <td>0.5H</td>\n",
       "      <td>48</td>\n",
       "      <td>False</td>\n",
       "      <td>5559</td>\n",
       "      <td>29903.084727</td>\n",
       "      <td>39600</td>\n",
       "      <td>166231248</td>\n",
       "      <td>2011-11-24 00:00:00</td>\n",
       "      <td>2014-02-28 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>m1_monthly</th>\n",
       "      <td>M</td>\n",
       "      <td>18</td>\n",
       "      <td>False</td>\n",
       "      <td>617</td>\n",
       "      <td>72.758509</td>\n",
       "      <td>132</td>\n",
       "      <td>44892</td>\n",
       "      <td>1900-01-31 00:00:00</td>\n",
       "      <td>1991-02-28 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>m1_quarterly</th>\n",
       "      <td>Q</td>\n",
       "      <td>8</td>\n",
       "      <td>False</td>\n",
       "      <td>203</td>\n",
       "      <td>40.985222</td>\n",
       "      <td>106</td>\n",
       "      <td>8320</td>\n",
       "      <td>1900-03-31 00:00:00</td>\n",
       "      <td>2006-03-31 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>m1_yearly</th>\n",
       "      <td>Y</td>\n",
       "      <td>6</td>\n",
       "      <td>False</td>\n",
       "      <td>181</td>\n",
       "      <td>18.944751</td>\n",
       "      <td>52</td>\n",
       "      <td>3429</td>\n",
       "      <td>1865-12-31 00:00:00</td>\n",
       "      <td>2034-12-31 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>m3_monthly</th>\n",
       "      <td>M</td>\n",
       "      <td>18</td>\n",
       "      <td>False</td>\n",
       "      <td>1428</td>\n",
       "      <td>99.340336</td>\n",
       "      <td>126</td>\n",
       "      <td>141858</td>\n",
       "      <td>1750-01-31 00:00:00</td>\n",
       "      <td>2005-03-31 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>m3_other</th>\n",
       "      <td>Q</td>\n",
       "      <td>8</td>\n",
       "      <td>False</td>\n",
       "      <td>174</td>\n",
       "      <td>68.580460</td>\n",
       "      <td>96</td>\n",
       "      <td>11933</td>\n",
       "      <td>1750-03-31 00:00:00</td>\n",
       "      <td>1776-03-31 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>m3_quarterly</th>\n",
       "      <td>Q</td>\n",
       "      <td>8</td>\n",
       "      <td>False</td>\n",
       "      <td>756</td>\n",
       "      <td>40.947090</td>\n",
       "      <td>64</td>\n",
       "      <td>30956</td>\n",
       "      <td>1946-03-31 00:00:00</td>\n",
       "      <td>1996-12-31 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>m3_yearly</th>\n",
       "      <td>Y</td>\n",
       "      <td>6</td>\n",
       "      <td>False</td>\n",
       "      <td>645</td>\n",
       "      <td>22.401550</td>\n",
       "      <td>41</td>\n",
       "      <td>14449</td>\n",
       "      <td>1811-12-31 00:00:00</td>\n",
       "      <td>2002-12-31 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>m4_daily</th>\n",
       "      <td>D</td>\n",
       "      <td>14</td>\n",
       "      <td>False</td>\n",
       "      <td>4227</td>\n",
       "      <td>2357.383014</td>\n",
       "      <td>9919</td>\n",
       "      <td>9964658</td>\n",
       "      <td>1750-01-01 00:00:00</td>\n",
       "      <td>1777-03-13 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>m4_hourly</th>\n",
       "      <td>H</td>\n",
       "      <td>48</td>\n",
       "      <td>False</td>\n",
       "      <td>414</td>\n",
       "      <td>853.864734</td>\n",
       "      <td>960</td>\n",
       "      <td>353500</td>\n",
       "      <td>1750-01-01 00:00:00</td>\n",
       "      <td>1750-02-12 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>m4_monthly</th>\n",
       "      <td>M</td>\n",
       "      <td>18</td>\n",
       "      <td>False</td>\n",
       "      <td>48000</td>\n",
       "      <td>216.300229</td>\n",
       "      <td>2794</td>\n",
       "      <td>10382411</td>\n",
       "      <td>1750-01-31 00:00:00</td>\n",
       "      <td>1984-05-31 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>m4_quarterly</th>\n",
       "      <td>Q</td>\n",
       "      <td>8</td>\n",
       "      <td>False</td>\n",
       "      <td>24000</td>\n",
       "      <td>92.254500</td>\n",
       "      <td>866</td>\n",
       "      <td>2214108</td>\n",
       "      <td>1750-03-31 00:00:00</td>\n",
       "      <td>1968-09-30 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>m4_weekly</th>\n",
       "      <td>W</td>\n",
       "      <td>13</td>\n",
       "      <td>False</td>\n",
       "      <td>359</td>\n",
       "      <td>1022.038997</td>\n",
       "      <td>2597</td>\n",
       "      <td>366912</td>\n",
       "      <td>1750-01-04 00:00:00</td>\n",
       "      <td>1800-01-12 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>m4_yearly</th>\n",
       "      <td>Y</td>\n",
       "      <td>6</td>\n",
       "      <td>False</td>\n",
       "      <td>22974</td>\n",
       "      <td>30.785453</td>\n",
       "      <td>278</td>\n",
       "      <td>707265</td>\n",
       "      <td>1750-12-31 00:00:00</td>\n",
       "      <td>2034-12-31 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>m5</th>\n",
       "      <td>D</td>\n",
       "      <td>28</td>\n",
       "      <td>True</td>\n",
       "      <td>30490</td>\n",
       "      <td>1885.000000</td>\n",
       "      <td>1885</td>\n",
       "      <td>57473650</td>\n",
       "      <td>2011-01-29 00:00:00</td>\n",
       "      <td>2016-04-25 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>nn5</th>\n",
       "      <td>D</td>\n",
       "      <td>56</td>\n",
       "      <td>False</td>\n",
       "      <td>111</td>\n",
       "      <td>735.000000</td>\n",
       "      <td>735</td>\n",
       "      <td>81585</td>\n",
       "      <td>1996-03-18 00:00:00</td>\n",
       "      <td>1998-05-18 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>pedestrian_count</th>\n",
       "      <td>H</td>\n",
       "      <td>48</td>\n",
       "      <td>True</td>\n",
       "      <td>66</td>\n",
       "      <td>47411.787879</td>\n",
       "      <td>96376</td>\n",
       "      <td>3129178</td>\n",
       "      <td>2009-05-01 00:00:00</td>\n",
       "      <td>2020-05-01 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>restaurant</th>\n",
       "      <td>D</td>\n",
       "      <td>39</td>\n",
       "      <td>True</td>\n",
       "      <td>823</td>\n",
       "      <td>320.555286</td>\n",
       "      <td>439</td>\n",
       "      <td>263817</td>\n",
       "      <td>2016-01-01 00:00:00</td>\n",
       "      <td>2017-04-23 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>rideshare</th>\n",
       "      <td>H</td>\n",
       "      <td>48</td>\n",
       "      <td>False</td>\n",
       "      <td>2304</td>\n",
       "      <td>493.000000</td>\n",
       "      <td>493</td>\n",
       "      <td>1135872</td>\n",
       "      <td>2018-11-26 06:00:00</td>\n",
       "      <td>2018-12-18 19:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>rossmann</th>\n",
       "      <td>D</td>\n",
       "      <td>48</td>\n",
       "      <td>True</td>\n",
       "      <td>1115</td>\n",
       "      <td>864.295067</td>\n",
       "      <td>894</td>\n",
       "      <td>963689</td>\n",
       "      <td>2013-01-01 00:00:00</td>\n",
       "      <td>2015-08-01 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>san_francisco_traffic</th>\n",
       "      <td>H</td>\n",
       "      <td>48</td>\n",
       "      <td>False</td>\n",
       "      <td>862</td>\n",
       "      <td>17496.000000</td>\n",
       "      <td>17496</td>\n",
       "      <td>15081552</td>\n",
       "      <td>2015-01-01 00:00:00</td>\n",
       "      <td>2017-01-01 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>solar</th>\n",
       "      <td>H</td>\n",
       "      <td>24</td>\n",
       "      <td>False</td>\n",
       "      <td>137</td>\n",
       "      <td>7009.000000</td>\n",
       "      <td>7009</td>\n",
       "      <td>960233</td>\n",
       "      <td>2006-01-01 00:00:00</td>\n",
       "      <td>2006-10-27 01:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>taxi</th>\n",
       "      <td>30min</td>\n",
       "      <td>24</td>\n",
       "      <td>True</td>\n",
       "      <td>1214</td>\n",
       "      <td>1488.000000</td>\n",
       "      <td>1488</td>\n",
       "      <td>1806432</td>\n",
       "      <td>2016-01-01 00:00:00</td>\n",
       "      <td>2016-01-31 14:30:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>temperature_rain</th>\n",
       "      <td>D</td>\n",
       "      <td>30</td>\n",
       "      <td>False</td>\n",
       "      <td>32053</td>\n",
       "      <td>695.000000</td>\n",
       "      <td>695</td>\n",
       "      <td>22276835</td>\n",
       "      <td>2015-05-02 00:00:00</td>\n",
       "      <td>2017-04-26 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>tourism_monthly</th>\n",
       "      <td>M</td>\n",
       "      <td>24</td>\n",
       "      <td>False</td>\n",
       "      <td>366</td>\n",
       "      <td>274.579235</td>\n",
       "      <td>309</td>\n",
       "      <td>100496</td>\n",
       "      <td>1979-01-31 00:00:00</td>\n",
       "      <td>2007-10-31 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>tourism_quarterly</th>\n",
       "      <td>Q</td>\n",
       "      <td>8</td>\n",
       "      <td>False</td>\n",
       "      <td>427</td>\n",
       "      <td>91.634660</td>\n",
       "      <td>122</td>\n",
       "      <td>39128</td>\n",
       "      <td>1975-03-31 00:00:00</td>\n",
       "      <td>2007-12-31 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>tourism_yearly</th>\n",
       "      <td>Y</td>\n",
       "      <td>4</td>\n",
       "      <td>False</td>\n",
       "      <td>518</td>\n",
       "      <td>20.627413</td>\n",
       "      <td>43</td>\n",
       "      <td>10685</td>\n",
       "      <td>1960-12-31 00:00:00</td>\n",
       "      <td>2008-12-31 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>vehicle_trips</th>\n",
       "      <td>D</td>\n",
       "      <td>30</td>\n",
       "      <td>True</td>\n",
       "      <td>314</td>\n",
       "      <td>99.875796</td>\n",
       "      <td>213</td>\n",
       "      <td>31361</td>\n",
       "      <td>2015-01-01 00:00:00</td>\n",
       "      <td>2015-09-01 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>walmart</th>\n",
       "      <td>W</td>\n",
       "      <td>39</td>\n",
       "      <td>False</td>\n",
       "      <td>2934</td>\n",
       "      <td>101.741309</td>\n",
       "      <td>104</td>\n",
       "      <td>298509</td>\n",
       "      <td>2010-02-07 00:00:00</td>\n",
       "      <td>2012-11-04 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>weather</th>\n",
       "      <td>D</td>\n",
       "      <td>30</td>\n",
       "      <td>False</td>\n",
       "      <td>3010</td>\n",
       "      <td>14266.345515</td>\n",
       "      <td>65951</td>\n",
       "      <td>42941700</td>\n",
       "      <td>1970-01-01 00:00:00</td>\n",
       "      <td>2150-08-26 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>web_traffic</th>\n",
       "      <td>D</td>\n",
       "      <td>59</td>\n",
       "      <td>True</td>\n",
       "      <td>145026</td>\n",
       "      <td>744.000000</td>\n",
       "      <td>744</td>\n",
       "      <td>107899344</td>\n",
       "      <td>2015-07-01 00:00:00</td>\n",
       "      <td>2017-09-11 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>wiki</th>\n",
       "      <td>D</td>\n",
       "      <td>30</td>\n",
       "      <td>True</td>\n",
       "      <td>9535</td>\n",
       "      <td>762.000000</td>\n",
       "      <td>762</td>\n",
       "      <td>7265670</td>\n",
       "      <td>2012-01-01 00:00:00</td>\n",
       "      <td>2014-07-01 00:00:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>wind_farms</th>\n",
       "      <td>min</td>\n",
       "      <td>60</td>\n",
       "      <td>False</td>\n",
       "      <td>313</td>\n",
       "      <td>513441.948882</td>\n",
       "      <td>526980</td>\n",
       "      <td>160707330</td>\n",
       "      <td>2019-08-01 00:00:00</td>\n",
       "      <td>2020-08-01 00:00:00</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                              frequency  prediction_length  integer_dataset  \\\n",
       "dataset                                                                       \n",
       "australian_electricity_demand      0.5H                 48            False   \n",
       "bitcoin                               D                 30            False   \n",
       "car_parts                             M                 12             True   \n",
       "cif_2016                              M                 12            False   \n",
       "corporacion_favorita                  D                 16            False   \n",
       "covid_deaths                          D                 30             True   \n",
       "dominick                              W                  8            False   \n",
       "electricity                          1H                 24             True   \n",
       "exchange_rate                         B                 30            False   \n",
       "fred_md                               M                 12            False   \n",
       "hospital                              M                 12             True   \n",
       "kdd_2018                              H                 48            False   \n",
       "london_smart_meters                0.5H                 48            False   \n",
       "m1_monthly                            M                 18            False   \n",
       "m1_quarterly                          Q                  8            False   \n",
       "m1_yearly                             Y                  6            False   \n",
       "m3_monthly                            M                 18            False   \n",
       "m3_other                              Q                  8            False   \n",
       "m3_quarterly                          Q                  8            False   \n",
       "m3_yearly                             Y                  6            False   \n",
       "m4_daily                              D                 14            False   \n",
       "m4_hourly                             H                 48            False   \n",
       "m4_monthly                            M                 18            False   \n",
       "m4_quarterly                          Q                  8            False   \n",
       "m4_weekly                             W                 13            False   \n",
       "m4_yearly                             Y                  6            False   \n",
       "m5                                    D                 28             True   \n",
       "nn5                                   D                 56            False   \n",
       "pedestrian_count                      H                 48             True   \n",
       "restaurant                            D                 39             True   \n",
       "rideshare                             H                 48            False   \n",
       "rossmann                              D                 48             True   \n",
       "san_francisco_traffic                 H                 48            False   \n",
       "solar                                 H                 24            False   \n",
       "taxi                              30min                 24             True   \n",
       "temperature_rain                      D                 30            False   \n",
       "tourism_monthly                       M                 24            False   \n",
       "tourism_quarterly                     Q                  8            False   \n",
       "tourism_yearly                        Y                  4            False   \n",
       "vehicle_trips                         D                 30             True   \n",
       "walmart                               W                 39            False   \n",
       "weather                               D                 30            False   \n",
       "web_traffic                           D                 59             True   \n",
       "wiki                                  D                 30             True   \n",
       "wind_farms                          min                 60            False   \n",
       "\n",
       "                               num_time_series    mean_length  max_length  \\\n",
       "dataset                                                                     \n",
       "australian_electricity_demand                5  231004.800000      232224   \n",
       "bitcoin                                     17    4134.058824        4551   \n",
       "car_parts                                 2504      39.000000          39   \n",
       "cif_2016                                    72      86.722222         108   \n",
       "corporacion_favorita                    171091    1088.955690        1672   \n",
       "covid_deaths                               227     182.000000         182   \n",
       "dominick                                115163     157.490192         385   \n",
       "electricity                                321   21044.000000       21044   \n",
       "exchange_rate                                8    6071.000000        6071   \n",
       "fred_md                                    107     716.000000         716   \n",
       "hospital                                   767      72.000000          72   \n",
       "kdd_2018                                   270   10849.644444       10872   \n",
       "london_smart_meters                       5559   29903.084727       39600   \n",
       "m1_monthly                                 617      72.758509         132   \n",
       "m1_quarterly                               203      40.985222         106   \n",
       "m1_yearly                                  181      18.944751          52   \n",
       "m3_monthly                                1428      99.340336         126   \n",
       "m3_other                                   174      68.580460          96   \n",
       "m3_quarterly                               756      40.947090          64   \n",
       "m3_yearly                                  645      22.401550          41   \n",
       "m4_daily                                  4227    2357.383014        9919   \n",
       "m4_hourly                                  414     853.864734         960   \n",
       "m4_monthly                               48000     216.300229        2794   \n",
       "m4_quarterly                             24000      92.254500         866   \n",
       "m4_weekly                                  359    1022.038997        2597   \n",
       "m4_yearly                                22974      30.785453         278   \n",
       "m5                                       30490    1885.000000        1885   \n",
       "nn5                                        111     735.000000         735   \n",
       "pedestrian_count                            66   47411.787879       96376   \n",
       "restaurant                                 823     320.555286         439   \n",
       "rideshare                                 2304     493.000000         493   \n",
       "rossmann                                  1115     864.295067         894   \n",
       "san_francisco_traffic                      862   17496.000000       17496   \n",
       "solar                                      137    7009.000000        7009   \n",
       "taxi                                      1214    1488.000000        1488   \n",
       "temperature_rain                         32053     695.000000         695   \n",
       "tourism_monthly                            366     274.579235         309   \n",
       "tourism_quarterly                          427      91.634660         122   \n",
       "tourism_yearly                             518      20.627413          43   \n",
       "vehicle_trips                              314      99.875796         213   \n",
       "walmart                                   2934     101.741309         104   \n",
       "weather                                   3010   14266.345515       65951   \n",
       "web_traffic                             145026     744.000000         744   \n",
       "wiki                                      9535     762.000000         762   \n",
       "wind_farms                                 313  513441.948882      526980   \n",
       "\n",
       "                               num_values            min_date  \\\n",
       "dataset                                                         \n",
       "australian_electricity_demand     1155024 2002-01-01 00:00:00   \n",
       "bitcoin                             70279 2009-01-03 00:00:00   \n",
       "car_parts                           97656 1998-01-31 00:00:00   \n",
       "cif_2016                             6244 1970-01-31 00:00:00   \n",
       "corporacion_favorita            186310518 2013-01-01 00:00:00   \n",
       "covid_deaths                        41314 2020-01-22 00:00:00   \n",
       "dominick                         18137043 1970-01-04 00:00:00   \n",
       "electricity                       6755124 2012-01-01 00:00:00   \n",
       "exchange_rate                       48568 1990-01-01 00:00:00   \n",
       "fred_md                             76612 1959-01-31 00:00:00   \n",
       "hospital                            55224 2000-01-31 00:00:00   \n",
       "kdd_2018                          2929404 2017-01-01 00:00:00   \n",
       "london_smart_meters             166231248 2011-11-24 00:00:00   \n",
       "m1_monthly                          44892 1900-01-31 00:00:00   \n",
       "m1_quarterly                         8320 1900-03-31 00:00:00   \n",
       "m1_yearly                            3429 1865-12-31 00:00:00   \n",
       "m3_monthly                         141858 1750-01-31 00:00:00   \n",
       "m3_other                            11933 1750-03-31 00:00:00   \n",
       "m3_quarterly                        30956 1946-03-31 00:00:00   \n",
       "m3_yearly                           14449 1811-12-31 00:00:00   \n",
       "m4_daily                          9964658 1750-01-01 00:00:00   \n",
       "m4_hourly                          353500 1750-01-01 00:00:00   \n",
       "m4_monthly                       10382411 1750-01-31 00:00:00   \n",
       "m4_quarterly                      2214108 1750-03-31 00:00:00   \n",
       "m4_weekly                          366912 1750-01-04 00:00:00   \n",
       "m4_yearly                          707265 1750-12-31 00:00:00   \n",
       "m5                               57473650 2011-01-29 00:00:00   \n",
       "nn5                                 81585 1996-03-18 00:00:00   \n",
       "pedestrian_count                  3129178 2009-05-01 00:00:00   \n",
       "restaurant                         263817 2016-01-01 00:00:00   \n",
       "rideshare                         1135872 2018-11-26 06:00:00   \n",
       "rossmann                           963689 2013-01-01 00:00:00   \n",
       "san_francisco_traffic            15081552 2015-01-01 00:00:00   \n",
       "solar                              960233 2006-01-01 00:00:00   \n",
       "taxi                              1806432 2016-01-01 00:00:00   \n",
       "temperature_rain                 22276835 2015-05-02 00:00:00   \n",
       "tourism_monthly                    100496 1979-01-31 00:00:00   \n",
       "tourism_quarterly                   39128 1975-03-31 00:00:00   \n",
       "tourism_yearly                      10685 1960-12-31 00:00:00   \n",
       "vehicle_trips                       31361 2015-01-01 00:00:00   \n",
       "walmart                            298509 2010-02-07 00:00:00   \n",
       "weather                          42941700 1970-01-01 00:00:00   \n",
       "web_traffic                     107899344 2015-07-01 00:00:00   \n",
       "wiki                              7265670 2012-01-01 00:00:00   \n",
       "wind_farms                      160707330 2019-08-01 00:00:00   \n",
       "\n",
       "                                         max_date  \n",
       "dataset                                            \n",
       "australian_electricity_demand 2015-04-02 00:00:00  \n",
       "bitcoin                       2021-07-20 00:00:00  \n",
       "car_parts                     2002-04-30 00:00:00  \n",
       "cif_2016                      1980-01-31 00:00:00  \n",
       "corporacion_favorita          2017-08-16 00:00:00  \n",
       "covid_deaths                  2020-08-21 00:00:00  \n",
       "dominick                      1977-07-17 00:00:00  \n",
       "electricity                   2014-06-02 20:00:00  \n",
       "exchange_rate                 2013-11-05 00:00:00  \n",
       "fred_md                       2019-09-30 00:00:00  \n",
       "hospital                      2007-01-31 00:00:00  \n",
       "kdd_2018                      2018-04-01 00:00:00  \n",
       "london_smart_meters           2014-02-28 00:00:00  \n",
       "m1_monthly                    1991-02-28 00:00:00  \n",
       "m1_quarterly                  2006-03-31 00:00:00  \n",
       "m1_yearly                     2034-12-31 00:00:00  \n",
       "m3_monthly                    2005-03-31 00:00:00  \n",
       "m3_other                      1776-03-31 00:00:00  \n",
       "m3_quarterly                  1996-12-31 00:00:00  \n",
       "m3_yearly                     2002-12-31 00:00:00  \n",
       "m4_daily                      1777-03-13 00:00:00  \n",
       "m4_hourly                     1750-02-12 00:00:00  \n",
       "m4_monthly                    1984-05-31 00:00:00  \n",
       "m4_quarterly                  1968-09-30 00:00:00  \n",
       "m4_weekly                     1800-01-12 00:00:00  \n",
       "m4_yearly                     2034-12-31 00:00:00  \n",
       "m5                            2016-04-25 00:00:00  \n",
       "nn5                           1998-05-18 00:00:00  \n",
       "pedestrian_count              2020-05-01 00:00:00  \n",
       "restaurant                    2017-04-23 00:00:00  \n",
       "rideshare                     2018-12-18 19:00:00  \n",
       "rossmann                      2015-08-01 00:00:00  \n",
       "san_francisco_traffic         2017-01-01 00:00:00  \n",
       "solar                         2006-10-27 01:00:00  \n",
       "taxi                          2016-01-31 14:30:00  \n",
       "temperature_rain              2017-04-26 00:00:00  \n",
       "tourism_monthly               2007-10-31 00:00:00  \n",
       "tourism_quarterly             2007-12-31 00:00:00  \n",
       "tourism_yearly                2008-12-31 00:00:00  \n",
       "vehicle_trips                 2015-09-01 00:00:00  \n",
       "walmart                       2012-11-04 00:00:00  \n",
       "weather                       2150-08-26 00:00:00  \n",
       "web_traffic                   2017-09-11 00:00:00  \n",
       "wiki                          2014-07-01 00:00:00  \n",
       "wind_farms                    2020-08-01 00:00:00  "
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "statistics.sort_index()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "c1f79147",
   "metadata": {},
   "source": [
    "## Latex"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "0f59e610",
   "metadata": {},
   "outputs": [],
   "source": [
    "def frequency_formatter(value: str) -> str:\n",
    "    if value == \"min\":\n",
    "        return \"MIN\"\n",
    "    if value == \"30min\" or value == \"0.5H\":\n",
    "        return \"30 MIN\"\n",
    "    if value == \"H\" or value == \"1H\":\n",
    "        return \"H\"\n",
    "    if value == \"D\":\n",
    "        return \"D\"\n",
    "    if value == \"B\":\n",
    "        return \"B\"\n",
    "    if value == \"W\":\n",
    "        return \"W\"\n",
    "    if value == \"M\":\n",
    "        return \"M\"\n",
    "    if value == \"Q\":\n",
    "        return \"Q\"\n",
    "    if value == \"Y\":\n",
    "        return \"Y\"\n",
    "    raise NotImplementedError"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "9226211c",
   "metadata": {},
   "outputs": [],
   "source": [
    "def integer_formatter(value: int) -> str:\n",
    "    return f\"{value:,}\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "724bb829",
   "metadata": {},
   "outputs": [],
   "source": [
    "def float_formatter(value: float) -> str:\n",
    "    return f\"{value:,.0f}\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "4f64b6c9",
   "metadata": {},
   "outputs": [],
   "source": [
    "def process_index(index: pd.Index) -> pd.Index:\n",
    "    result = [\n",
    "        r\"\\textbf{\" +\n",
    "        item.replace(\"_\", \" \").title()\n",
    "            .replace(\"Nn\", \"NN\")\n",
    "            .replace(\"Kdd\", \"KDD\")\n",
    "            .replace(\"Cif\", \"CIF\")\n",
    "            .replace(\"Covid\", \"COVID\")\n",
    "            .replace(\"Corporacion\", \"Corporación\")\n",
    "            .replace(\" Md\", \"-MD\") + r\"}\"\n",
    "        for item in index\n",
    "    ]\n",
    "    return pd.Index(result, name=index.name)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "ab439942",
   "metadata": {},
   "outputs": [],
   "source": [
    "data = statistics.copy()\n",
    "data.index = process_index(data.index)\n",
    "data = data.sort_index()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "4646b88b",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\begin{tabular}{lcc|rrr}\n",
      "\\toprule\n",
      "{} & \\textbf{Freq.} & \\textbf{Horizon} & \\textbf{\\# Series} & \\textbf{Avg. Length} & \\textbf{\\# Observations} \\\\\n",
      "\\midrule\n",
      "\\textbf{Australian Electricity Demand} &         30 MIN &               48 &                  5 &              231,005 &                1,155,024 \\\\\n",
      "\\textbf{Bitcoin}                       &              D &               30 &                 17 &                4,134 &                   70,279 \\\\\n",
      "\\textbf{CIF 2016}                      &              M &               12 &                 72 &                   87 &                    6,244 \\\\\n",
      "\\textbf{COVID Deaths}                  &              D &               30 &                227 &                  182 &                   41,314 \\\\\n",
      "\\textbf{Car Parts}                     &              M &               12 &              2,504 &                   39 &                   97,656 \\\\\n",
      "\\textbf{Corporación Favorita}          &              D &               16 &            171,091 &                1,089 &              186,310,518 \\\\\n",
      "\\textbf{Dominick}                      &              W &                8 &            115,163 &                  157 &               18,137,043 \\\\\n",
      "\\textbf{Electricity}                   &              H &               24 &                321 &               21,044 &                6,755,124 \\\\\n",
      "\\textbf{Exchange Rate}                 &              B &               30 &                  8 &                6,071 &                   48,568 \\\\\n",
      "\\textbf{Fred-MD}                       &              M &               12 &                107 &                  716 &                   76,612 \\\\\n",
      "\\textbf{Hospital}                      &              M &               12 &                767 &                   72 &                   55,224 \\\\\n",
      "\\textbf{KDD 2018}                      &              H &               48 &                270 &               10,850 &                2,929,404 \\\\\n",
      "\\textbf{London Smart Meters}           &         30 MIN &               48 &              5,559 &               29,903 &              166,231,248 \\\\\n",
      "\\textbf{M1 Monthly}                    &              M &               18 &                617 &                   73 &                   44,892 \\\\\n",
      "\\textbf{M1 Quarterly}                  &              Q &                8 &                203 &                   41 &                    8,320 \\\\\n",
      "\\textbf{M1 Yearly}                     &              Y &                6 &                181 &                   19 &                    3,429 \\\\\n",
      "\\textbf{M3 Monthly}                    &              M &               18 &              1,428 &                   99 &                  141,858 \\\\\n",
      "\\textbf{M3 Other}                      &              Q &                8 &                174 &                   69 &                   11,933 \\\\\n",
      "\\textbf{M3 Quarterly}                  &              Q &                8 &                756 &                   41 &                   30,956 \\\\\n",
      "\\textbf{M3 Yearly}                     &              Y &                6 &                645 &                   22 &                   14,449 \\\\\n",
      "\\textbf{M4 Daily}                      &              D &               14 &              4,227 &                2,357 &                9,964,658 \\\\\n",
      "\\textbf{M4 Hourly}                     &              H &               48 &                414 &                  854 &                  353,500 \\\\\n",
      "\\textbf{M4 Monthly}                    &              M &               18 &             48,000 &                  216 &               10,382,411 \\\\\n",
      "\\textbf{M4 Quarterly}                  &              Q &                8 &             24,000 &                   92 &                2,214,108 \\\\\n",
      "\\textbf{M4 Weekly}                     &              W &               13 &                359 &                1,022 &                  366,912 \\\\\n",
      "\\textbf{M4 Yearly}                     &              Y &                6 &             22,974 &                   31 &                  707,265 \\\\\n",
      "\\textbf{M5}                            &              D &               28 &             30,490 &                1,885 &               57,473,650 \\\\\n",
      "\\textbf{NN5}                           &              D &               56 &                111 &                  735 &                   81,585 \\\\\n",
      "\\textbf{Pedestrian Count}              &              H &               48 &                 66 &               47,412 &                3,129,178 \\\\\n",
      "\\textbf{Restaurant}                    &              D &               39 &                823 &                  321 &                  263,817 \\\\\n",
      "\\textbf{Rideshare}                     &              H &               48 &              2,304 &                  493 &                1,135,872 \\\\\n",
      "\\textbf{Rossmann}                      &              D &               48 &              1,115 &                  864 &                  963,689 \\\\\n",
      "\\textbf{San Francisco Traffic}         &              H &               48 &                862 &               17,496 &               15,081,552 \\\\\n",
      "\\textbf{Solar}                         &              H &               24 &                137 &                7,009 &                  960,233 \\\\\n",
      "\\textbf{Taxi}                          &         30 MIN &               24 &              1,214 &                1,488 &                1,806,432 \\\\\n",
      "\\textbf{Temperature Rain}              &              D &               30 &             32,053 &                  695 &               22,276,835 \\\\\n",
      "\\textbf{Tourism Monthly}               &              M &               24 &                366 &                  275 &                  100,496 \\\\\n",
      "\\textbf{Tourism Quarterly}             &              Q &                8 &                427 &                   92 &                   39,128 \\\\\n",
      "\\textbf{Tourism Yearly}                &              Y &                4 &                518 &                   21 &                   10,685 \\\\\n",
      "\\textbf{Vehicle Trips}                 &              D &               30 &                314 &                  100 &                   31,361 \\\\\n",
      "\\textbf{Walmart}                       &              W &               39 &              2,934 &                  102 &                  298,509 \\\\\n",
      "\\textbf{Weather}                       &              D &               30 &              3,010 &               14,266 &               42,941,700 \\\\\n",
      "\\textbf{Web Traffic}                   &              D &               59 &            145,026 &                  744 &              107,899,344 \\\\\n",
      "\\textbf{Wiki}                          &              D &               30 &              9,535 &                  762 &                7,265,670 \\\\\n",
      "\\textbf{Wind Farms}                    &            MIN &               60 &                313 &              513,442 &              160,707,330 \\\\\n",
      "\\bottomrule\n",
      "\\end{tabular}\n",
      "\n"
     ]
    }
   ],
   "source": [
    "with pd.option_context(\"max_colwidth\", 1000):\n",
    "    print(data.to_latex(\n",
    "        columns=[\"frequency\", \"prediction_length\", \"num_time_series\", \"mean_length\", \"num_values\"],\n",
    "        header=[\n",
    "            r\"\\textbf{Freq.}\",\n",
    "            r\"\\textbf{Horizon}\",\n",
    "            r\"\\textbf{\\# Series}\",\n",
    "            r\"\\textbf{Avg. Length}\",\n",
    "            r\"\\textbf{\\# Observations}\",\n",
    "        ],\n",
    "        formatters={\n",
    "            \"frequency\": frequency_formatter,\n",
    "            \"num_time_series\": integer_formatter,\n",
    "            \"num_values\": integer_formatter,\n",
    "            \"mean_length\": float_formatter,\n",
    "        },\n",
    "        index_names=False,\n",
    "    #     bold_rows=True,\n",
    "        escape=False,\n",
    "        column_format=\"lcc|rrr\"\n",
    "    ))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "521edc04",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.9"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
