{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "faa61949-fbf3-4b6c-a9f6-699af84466ec",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "import torch\n",
    "from transformers import AutoModelForCausalLM\n",
    "from sklearn.preprocessing import StandardScaler\n",
    "from sklearn.metrics import mean_squared_error, mean_absolute_error\n",
    "\n",
    "\n",
    "# ---------------------------------------------------\n",
    "# 1. Load + normalize dataset\n",
    "# ---------------------------------------------------\n",
    "def load_and_norm(path):\n",
    "    df = pd.read_csv(path, index_col='date')\n",
    "    value_col = df.columns[0]\n",
    "\n",
    "    scaler = StandardScaler()\n",
    "    df[value_col] = scaler.fit_transform(df[[value_col]])\n",
    "\n",
    "    return df\n",
    "\n",
    "\n",
    "# ---------------------------------------------------\n",
    "# 2. TimeMoE Model Wrapper (with sliding context window)\n",
    "# ---------------------------------------------------\n",
    "model_path = ''\n",
    "class TimeMoEModel:\n",
    "    def __init__(self, name=model_path, context_window=512):\n",
    "        self.model = AutoModelForCausalLM.from_pretrained(\n",
    "            name,\n",
    "            device_map=\"cpu\",      # use GPU\n",
    "            trust_remote_code=True\n",
    "        )\n",
    "        self.context_window = context_window\n",
    "\n",
    "    def predict(self, context, horizon):\n",
    "        \"\"\"\n",
    "        context: torch tensor shape [T]\n",
    "        horizon: int\n",
    "        \"\"\"\n",
    "\n",
    "        # Always trim to sliding window to avoid OOM\n",
    "        if context.shape[0] > self.context_window:\n",
    "            context = context[-self.context_window:]\n",
    "\n",
    "        # Model expects [batch, seq]\n",
    "        if context.ndim == 1:\n",
    "            context = context.unsqueeze(0)\n",
    "\n",
    "        context = context.to(self.model.device)\n",
    "\n",
    "        # Generate H new tokens\n",
    "        out = self.model.generate(\n",
    "            context,\n",
    "            max_new_tokens=horizon,\n",
    "            use_cache=False\n",
    "        )\n",
    "\n",
    "        preds = out[:, -horizon:].detach().cpu().numpy().flatten()\n",
    "        return preds\n",
    "\n",
    "\n",
    "# ---------------------------------------------------\n",
    "# 3. Evaluation loop (same as Chronos)\n",
    "# ---------------------------------------------------\n",
    "def evaluate_model(df, model, horizons):\n",
    "    value_col = df.columns[0]\n",
    "    values = df[value_col].values\n",
    "    n = len(values)\n",
    "\n",
    "    results = []\n",
    "\n",
    "    for H in horizons:\n",
    "        if H >= n:\n",
    "            results.append({\n",
    "                \"horizon\": H,\n",
    "                \"MSE\": np.nan,\n",
    "                \"MAE\": np.nan,\n",
    "            })\n",
    "            continue\n",
    "\n",
    "        print(f\"Running for horizon = [{H}]\")\n",
    "\n",
    "        train = values[:-H]\n",
    "        test = values[-H:]\n",
    "\n",
    "        context = torch.tensor(train, dtype=torch.float32)\n",
    "\n",
    "        preds = model.predict(context, H)\n",
    "\n",
    "        mse = mean_squared_error(test, preds)\n",
    "        mae = mean_absolute_error(test, preds)\n",
    "\n",
    "        results.append({\n",
    "            \"horizon\": H,\n",
    "            \"MSE\": round(mse, 4),\n",
    "            \"MAE\": round(mae, 4),\n",
    "        })\n",
    "\n",
    "    return results\n",
    "\n",
    "\n",
    "# ---------------------------------------------------\n",
    "# 4. Benchmark loop\n",
    "# ---------------------------------------------------\n",
    "def run_benchmark(datasets, model, horizons):\n",
    "    table = []\n",
    "\n",
    "    for name, df in datasets.items():\n",
    "        print(f\"\\nRunning [{name}] dataset\")\n",
    "\n",
    "        results = evaluate_model(df, model, horizons)\n",
    "\n",
    "        for r in results:\n",
    "            table.append({\n",
    "                \"Dataset\": name,\n",
    "                \"Horizon\": r[\"horizon\"],\n",
    "                \"MSE\": r[\"MSE\"],\n",
    "                \"MAE\": r[\"MAE\"],\n",
    "            })\n",
    "\n",
    "    return pd.DataFrame(table)\n",
    "\n",
    "\n",
    "# ---------------------------------------------------\n",
    "# 5. Datasets\n",
    "# ---------------------------------------------------\n",
    "datasets = {\n",
    "    \"AUS_Elec_Demand\": load_and_norm(\"../energy_processed/australian_electricity_demand_dataset_processed.csv\"),\n",
    "    \"Electricity_Weekly\": load_and_norm(\"../energy_processed/electricity_weekly_dataset_processed.csv\"),\n",
    "\n",
    "    \"ETTh1\": load_and_norm(\"../energy_processed/ETTh1_processed.csv\"),\n",
    "    \"ETTh2\": load_and_norm(\"../energy_processed/ETTh2_processed.csv\"),\n",
    "    \"ETTm1\": load_and_norm(\"../energy_processed/ETTm1_processed.csv\"),\n",
    "    \"ETTm2\": load_and_norm(\"../energy_processed/ETTm2_processed.csv\"),\n",
    "\n",
    "    \"London_SmartMeters\": load_and_norm(\"../energy_processed/london_smart_meters_dataset_subset_processed.csv\"),\n",
    "\n",
    "    \"Solar_10min\": load_and_norm(\"../energy_processed/solar_10_minutes_dataset_processed.csv\"),\n",
    "}\n",
    "\n",
    "\n",
    "# ---------------------------------------------------\n",
    "# 6. Run TimeMoE Benchmark\n",
    "# ---------------------------------------------------\n",
    "model = TimeMoEModel(context_window=1024)\n",
    "\n",
    "table_timemoe = run_benchmark(\n",
    "    datasets,\n",
    "    model,\n",
    "    horizons=[24, 48, 96]\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d71ea6c2-6689-4851-b523-a7ba303772a7",
   "metadata": {},
   "outputs": [],
   "source": [
    "table_timemoe.to_csv('../energy_results/TimesMOE_Energy.csv', index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b6646951-2bcd-4568-a309-5613a382a726",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.19"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
