{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "7e4662b1",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "import tensorflow as tf\n",
    "import matplotlib.pyplot as plt\n",
    "import time\n",
    "import math\n",
    "from sklearn.preprocessing import MinMaxScaler\n",
    "from sklearn.model_selection import train_test_split\n",
    "from sklearn.metrics import mean_squared_error, mean_absolute_error\n",
    "import seaborn as sns\n",
    "import random\n",
    "import os"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "8b50d97d",
   "metadata": {},
   "outputs": [],
   "source": [
    "df = pd.read_csv('5G_millisecond.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "016d9dc7",
   "metadata": {},
   "outputs": [],
   "source": [
    "from autogluon.timeseries import TimeSeriesDataFrame, TimeSeriesPredictor"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "13df3dc3",
   "metadata": {},
   "outputs": [],
   "source": [
    "df = df.rename(columns={\n",
    "    'ue_ident': 'item_id',\n",
    "    'DATE': 'timestamp',\n",
    "    'mac_dl_brate': 'target'\n",
    "})\n",
    "\n",
    "target_df = df[['item_id', 'timestamp', 'target']]\n",
    "uni_data = TimeSeriesDataFrame(target_df)\n",
    "uni_data.head()\n",
    "\n",
    "prediction_length = 96\n",
    "\n",
    "train_size = int(len(df) * 0.8)\n",
    "train_data = uni_data.iloc[:train_size]\n",
    "test_data = uni_data.iloc[train_size:]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "7eca4241",
   "metadata": {},
   "outputs": [],
   "source": [
    "def rolling_chronos_forecast_all(predictor, test_data, prediction_length=96, stride=1, measure_time=False):\n",
    "    results = []\n",
    "    times = []\n",
    "\n",
    "    test_data = test_data.copy()\n",
    "    if not isinstance(test_data.index, pd.MultiIndex):\n",
    "        raise ValueError(\"Expected test_data with MultiIndex (item_id, timestamp).\")\n",
    "\n",
    "    for item_id, series in test_data.groupby(level=\"item_id\"):\n",
    "        series = series.reset_index()  \n",
    "\n",
    "        for start in range(0, len(series) - prediction_length, stride):\n",
    "            context = series.iloc[: start + prediction_length]\n",
    "\n",
    "            t0 = time.time()\n",
    "            forecast = predictor.predict(context.set_index([\"item_id\", \"timestamp\"]))\n",
    "            t1 = time.time()\n",
    "\n",
    "            if measure_time:\n",
    "                times.append(t1 - t0)\n",
    "\n",
    "            forecast_mean = forecast.loc[item_id][\"mean\"].to_numpy().flatten()\n",
    "            origin_ts = series[\"timestamp\"].iloc[start]  \n",
    "            forecast_ts = pd.date_range(start=origin_ts + pd.Timedelta(milliseconds=100),\n",
    "                                        periods=prediction_length,\n",
    "                                        freq=\"100ms\")\n",
    "\n",
    "            df_forecast = pd.DataFrame({\n",
    "                \"item_id\": item_id,\n",
    "                \"timestamp\": forecast_ts,\n",
    "                \"mean\": forecast_mean\n",
    "            })\n",
    "            results.append(df_forecast)\n",
    "\n",
    "    forecasts_df = pd.concat(results, ignore_index=True)\n",
    "    return (forecasts_df, times) if measure_time else forecasts_df\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "21db0559",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Multiple seeds\n",
    "seeds = [123, 99, 42]\n",
    "rmse_list = []\n",
    "mae_list = []\n",
    "\n",
    "for seed in seeds:\n",
    "    print(f\"\\nRunning with seed={seed}\")\n",
    "    predictor = TimeSeriesPredictor(prediction_length=prediction_length, freq='100L')\n",
    "    \n",
    "    predictor.fit(\n",
    "        train_data,\n",
    "        presets=\"bolt_small\",\n",
    "        random_seed=seed\n",
    "    )\n",
    "\n",
    "    preds, times = rolling_chronos_forecast_all(\n",
    "        predictor, test_data, prediction_length=prediction_length, stride=1, measure_time=True\n",
    "    )\n",
    "\n",
    "    actual = test_data.reset_index()[[\"item_id\", \"timestamp\", \"target\"]]\n",
    "\n",
    "    aligned = preds.merge(actual, on=[\"item_id\", \"timestamp\"], how=\"inner\")\n",
    "\n",
    "    scaler = MinMaxScaler()\n",
    "    scaler.fit(train_data.reset_index()[[\"target\"]])  \n",
    "\n",
    "    aligned[\"mean_scaled\"] = scaler.transform(aligned[[\"mean\"]].values)\n",
    "    aligned[\"target_scaled\"] = scaler.transform(aligned[[\"target\"]].values)\n",
    "\n",
    "    rmse_scaled = np.sqrt(mean_squared_error(aligned[\"target_scaled\"], aligned[\"mean_scaled\"]))\n",
    "    mae_scaled = mean_absolute_error(aligned[\"target_scaled\"], aligned[\"mean_scaled\"])\n",
    "\n",
    "    print(f\"Seed={seed}: RMSE={rmse_scaled:.4f}, MAE={mae_scaled:.4f}\")\n",
    "    \n",
    "    rmse_list.append(rmse_scaled)\n",
    "    mae_list.append(mae_scaled)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "3b556976",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "Summary\n",
      "RMSE: mean=0.0313, std=0.0000\n",
      "MAE : mean=0.0185, std=0.0000\n"
     ]
    }
   ],
   "source": [
    "'''\n",
    "Seed=42: RMSE=0.0313, MAE=0.0185\n",
    "Seed=99: RMSE=0.0313, MAE=0.0185\n",
    "Seed=123: RMSE=0.0313, MAE=0.0185\n",
    "'''\n",
    "\n",
    "rmse_list = [0.0313, 0.0313, 0.0313]\n",
    "mae_list = [0.0185, 0.0185, 0.0185]\n",
    "\n",
    "# Summary\n",
    "rmse_mean, rmse_std = np.mean(rmse_list), np.std(rmse_list)\n",
    "mae_mean, mae_std = np.mean(mae_list), np.std(mae_list)\n",
    "\n",
    "print(\"\\nSummary\")\n",
    "print(f\"RMSE: mean={rmse_mean:.4f}, std={rmse_std:.4f}\")\n",
    "print(f\"MAE : mean={mae_mean:.4f}, std={mae_std:.4f}\")"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "tf-env",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.18"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
