{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import matplotlib.pyplot as plt\n",
    "import numpy as np\n",
    "\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "from TSB_AD.model_wrapper import run_Unsupervise_AD,run_Semisupervise_AD\n",
    "from TSB_AD.evaluation.metrics import get_metrics\n",
    "Unsupervise_AD_Pool = ['FFT', 'SR', 'NORMA', 'Series2Graph', 'Sub_IForest', 'IForest', 'LOF', 'Sub_LOF', 'POLY', 'MatrixProfile', 'Sub_PCA', 'PCA', 'HBOS',\n",
    "                        'Sub_HBOS', 'KNN', 'Sub_KNN','KMeansAD', 'KMeansAD_U', 'KShapeAD', 'COPOD', 'CBLOF', 'COF', 'EIF', 'RobustPCA', 'Lag_Llama', 'TimesFM', 'Chronos', 'MOMENT_ZS']\n",
    "Semisupervise_AD_Pool = ['Left_STAMPi', 'SAND', 'MCD', 'Sub_MCD', 'OCSVM', 'Sub_OCSVM', 'AutoEncoder', 'CNN', 'LSTMAD', 'TranAD', 'USAD', 'OmniAnomaly',\n",
    "                        'AnomalyTransformer', 'TimesNet', 'FITS', 'Donut', 'OFA', 'MOMENT_FT']\n",
    "import os\n",
    "\n",
    "U_data_list = os.listdir('../dataset/TSB-AD-U/TSB-AD-U/')\n",
    "M_data_list = os.listdir('../dataset/TSB-AD-M/TSB-AD-M/')\n",
    "U_data_list.sort()\n",
    "\n",
    "M_data_list.sort()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import warnings\n",
    "from sklearn.exceptions import UndefinedMetricWarning\n",
    "\n",
    "warnings.filterwarnings(\"ignore\", category=UndefinedMetricWarning)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "df_U_VUS_PR = pd.read_csv('./results/uni_mergedTable_VUS-PR.csv')\n",
    "df_M_VUS_PR = pd.read_csv('./results/multi_mergedTable_VUS-PR.csv')\n",
    "U_data_list = df_U_VUS_PR['file'].tolist()\n",
    "M_data_list = df_M_VUS_PR['file'].tolist()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Complexity and anomaly score calculation\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "score_list = []\n",
    "eval_res = []\n",
    "n_run = 1\n",
    "\n",
    "\n",
    "\n",
    "start_idx = 0\n",
    "end_idx = 0\n",
    "loop_idx = 0\n",
    "for U_data_dir in U_data_list[:1]:\n",
    "    \n",
    "    AD_Name = 'MOMENT_FT'   # It can be replaced with any anomaly detector availale in TSB-AD\n",
    "\n",
    "    data_direc = '../dataset/TSB-AD-U/TSB-AD-U/'+U_data_dir\n",
    "\n",
    "    # Loading Data\n",
    "    df = pd.read_csv(data_direc).dropna()\n",
    "    data = df.iloc[:, 0:-1].values.astype(float)\n",
    "\n",
    "    train_index = data_direc.split('_')[-3]\n",
    "    data_train = data[:int(train_index), :]\n",
    "    data_test = data\n",
    "\n",
    "    if U_data_dir in df_U_VUS_PR['file'].to_list():\n",
    "        loop_idx =+1\n",
    "        print(loop_idx/len(U_data_list))\n",
    "        # Specify Anomaly Detector to use and data directory\n",
    "        label = df['Label'].astype(int).to_numpy()\n",
    "        from MOMENT_custom import MOMENT_custom,ReconstructDataset_Moment\n",
    "        import torch\n",
    "\n",
    "        from sklearn.preprocessing import StandardScaler\n",
    "        clf = MOMENT_custom(win_size=256)\n",
    "        clf.model.embedding_vector = torch.tensor(0)\n",
    "        # Finetune\n",
    "        clf.fit(data_train)\n",
    "        raw_score = clf.decision_function(data_test,masking=False)\n",
    "        score = StandardScaler().fit_transform(raw_score.reshape(-1,1)).ravel()\n",
    "        \n",
    "\n",
    "        # Evaluation\n",
    "        evaluation_result = get_metrics(score, label)\n",
    "        eval_res.append(evaluation_result)\n",
    "        score_list.append(score)\n",
    "        torch.cuda.empty_cache() \n",
    "        torch.cuda.ipc_collect()  \n",
    "\n",
    "np.save('raw_MOMENT'+'_output_test.npy',np.concatenate(score_list,axis=0))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from TSB_AD.model_wrapper import run_Unsupervise_AD,run_Semisupervise_AD\n",
    "from TSB_AD.evaluation.metrics import get_metrics\n",
    "import numpy as np\n",
    "import os\n",
    "import pandas as pd\n",
    "Comparaed_Solution_Pool = ['Sub_IForest','SR','Sub_HBOS','Sub_PCA','POLY']\n",
    "\n",
    "U_data_list.sort()\n",
    "\n",
    "n_run = 1\n",
    "loop_idx = 0\n",
    "for AD_Name in Comparaed_Solution_Pool:\n",
    "    score_list = []\n",
    "    eval_res = []\n",
    "    for U_data_dir in U_data_list[:1]:\n",
    "        loop_idx +=1\n",
    "        print(loop_idx/len(U_data_list))\n",
    "        # Specify Anomaly Detector to use and data directory\n",
    "\n",
    "        data_direc = '../dataset/TSB-AD-U/TSB-AD-U/'+U_data_dir\n",
    "\n",
    "        # Loading Data\n",
    "        df = pd.read_csv(data_direc).dropna()\n",
    "        data = df.iloc[:, 0:-1].values.astype(float)\n",
    "\n",
    "        train_index = data_direc.split('_')[-3]\n",
    "        data_train = data[:int(train_index), :]\n",
    "        data_test = data\n",
    "\n",
    "        label = df['Label'].astype(int).to_numpy()\n",
    "        label_test = df['Label'].astype(int).to_numpy()\n",
    "\n",
    "        # Applying Anomaly Detector\n",
    "        raw_score = run_Unsupervise_AD(AD_Name, data)\n",
    "        score = StandardScaler().fit_transform(raw_score.reshape(-1,1)).ravel()\n",
    "        # Evaluation\n",
    "        evaluation_result = get_metrics(score, label_test)\n",
    "\n",
    "        # Evaluation\n",
    "        eval_res.append(evaluation_result)\n",
    "        score_list.append(score)\n",
    "\n",
    "    eval_df = pd.DataFrame(eval_res)\n",
    "    eval_df.to_csv(AD_Name+\"_eval_df.csv\")\n",
    "    np.save(AD_Name+'_output.npy',np.concatenate(score_list,axis=0))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "score_list = []\n",
    "eval_res = []\n",
    "import importlib\n",
    "import MOMENT_custom\n",
    "importlib.reload(MOMENT_custom)\n",
    "import torch\n",
    "start_idx = 0\n",
    "end_idx = 0\n",
    "loop_idx = 0\n",
    "reconstruction_loss_list = []\n",
    "prediction_loss_list = []\n",
    "for U_data_dir in U_data_list[:3]:\n",
    "    \n",
    "    AD_Name = 'MOMENT_FT'   # It can be replaced with any anomaly detector availale in TSB-AD\n",
    "\n",
    "    data_direc = '../dataset/TSB-AD-U/TSB-AD-U/'+U_data_dir\n",
    "\n",
    "    # Loading Data\n",
    "    df = pd.read_csv(data_direc).dropna()\n",
    "    data = df.iloc[:, 0:-1].values.astype(float)\n",
    "\n",
    "    train_index = data_direc.split('_')[-3]\n",
    "    data_train = data[:int(train_index), :]\n",
    "    data_test = data\n",
    "    label = df['Label'].astype(int).to_numpy()\n",
    "    end_idx += len(label)\n",
    "        \n",
    "    start_idx = end_idx\n",
    "    if U_data_dir in df_U_VUS_PR['file'].to_list():\n",
    "        loop_idx =+1\n",
    "        print(loop_idx/len(U_data_list))\n",
    "        # Specify Anomaly Detector to use and data directory\n",
    "        \n",
    "        \n",
    "        \n",
    "\n",
    "        from sklearn.preprocessing import MinMaxScaler\n",
    "        clf = MOMENT_custom.MOMENT_custom(win_size=256)\n",
    "        clf.fit(data_train)\n",
    "        # Finetune\n",
    "        reconstruction_loss = clf.decision_function(data,masking=False)\n",
    "        prediction_loss = clf.decision_function(data,masking = True,n_split=3)\n",
    "        \n",
    "        reconstruction_loss_list.append(reconstruction_loss)\n",
    "        prediction_loss_list.append(prediction_loss)\n",
    "        torch.cuda.empty_cache()  \n",
    "        torch.cuda.ipc_collect()  \n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Complexity aware selection (CAE)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#raw_alpha_list = np.array([np.mean((prediction_loss_list[loop_idx])/(reconstruction_loss_list[loop_idx])) for loop_idx in range(len(prediction_loss_list))])\n",
    "raw_alpha_list = np.load('raw_alpha_list.npy')\n",
    "from sklearn.preprocessing import StandardScaler\n",
    "from sklearn.preprocessing import QuantileTransformer, MinMaxScaler\n",
    "sscaler = QuantileTransformer()\n",
    "sscaler.fit(X=raw_alpha_list.reshape(-1,1))\n",
    "proposed_alpha = sscaler.transform(X=raw_alpha_list.reshape(-1,1))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from MOMENT_custom import MOMENT_custom,ReconstructDataset_Moment\n",
    "import torch\n",
    "import numpy as np\n",
    "from sklearn.preprocessing import MinMaxScaler,StandardScaler\n",
    "import pandas as pd\n",
    "import importlib\n",
    "import TSB_AD.evaluation.metrics\n",
    "\n",
    "importlib.reload(TSB_AD.evaluation.metrics)\n",
    "from TSB_AD.evaluation.metrics import get_metrics\n",
    "\n",
    "\n",
    "\n",
    "eval_df = pd.read_csv(\"eval_df_mean_std.csv\") \n",
    "import pandas as pd\n",
    "\n",
    "MOMENT_mean_std = np.load('raw_MOMENT_output_test.npy')\n",
    "POLY_mean_std = np.load('POLY_output.npy')\n",
    "PCA_mean_std = np.load('Sub_PCA_output.npy')\n",
    "eval_res = []\n",
    "\n",
    "start_idx = 0\n",
    "end_idx = 0\n",
    "loop_idx = 0\n",
    "for U_data_dir in U_data_list[:1]:\n",
    "    data_direc = '../dataset/TSB-AD-U/TSB-AD-U/'+U_data_dir\n",
    "\n",
    "    # Loading Data\n",
    "    df = pd.read_csv(data_direc).dropna()\n",
    "\n",
    "    label = df['Label'].astype(int).to_numpy()\n",
    "    end_idx += len(label)\n",
    "\n",
    "    loop_idx +=1\n",
    "    print(loop_idx/len(U_data_list))\n",
    "    # Specify Anomaly Detector to use and data directory\n",
    "    \n",
    "    \n",
    "    \n",
    "    for alpha in ['proposed']:\n",
    "        if alpha =='proposed':\n",
    "            alpha = proposed_alpha[loop_idx-1]\n",
    "            \n",
    "        pca_score = PCA_mean_std[start_idx:end_idx]\n",
    "        pca_score = StandardScaler().fit_transform(pca_score.reshape(-1,1)).ravel()\n",
    "        moment_score = MOMENT_mean_std[start_idx:end_idx]\n",
    "        score = ((1-alpha)*moment_score + alpha * pca_score)\n",
    "                \n",
    "        from sklearn.preprocessing import StandardScaler\n",
    "        \n",
    "        score = StandardScaler().fit_transform(score.reshape(-1,1)).ravel()\n",
    "\n",
    "        evaluation_result = get_metrics(score, label,version='opt')\n",
    "        evaluation_result['alpha'] = alpha\n",
    "        evaluation_result['file'] = U_data_dir\n",
    "        eval_res.append(evaluation_result)  \n",
    "    start_idx = end_idx"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Other complexity"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import antropy as ant\n",
    "import pandas as pd\n",
    "\n",
    "def compute_complexity_measures(data_array, sf=1.0):\n",
    "    \"\"\"\n",
    "    data_array: shape = (N, 756)\n",
    "    sf: Sampling Hz, Required for Spectral Entropy (default: 1.0)\n",
    "    \n",
    "    return: dict{\n",
    "                \"app_entropy\": [..N..],\n",
    "                \"sample_entropy\": [..N..],\n",
    "                \"spectral_entropy\": [..N..],\n",
    "            }\n",
    "    \"\"\"\n",
    "\n",
    "    results = {\n",
    "        \"app_entropy\": [],\n",
    "        \"sample_entropy\": [],\n",
    "        \"spectral_entropy\": []\n",
    "    }\n",
    "    \n",
    "    for i in range(len(data_array)):\n",
    "        ts = data_array[i]  \n",
    "        \n",
    "        # 1) Approximate Entropy\n",
    "        app_ent = ant.app_entropy(ts, order=2)\n",
    "\n",
    "        # 2) Sample Entropy\n",
    "        samp_ent = ant.sample_entropy(ts, order=2)\n",
    "\n",
    "        # 3) Spectral Entropy\n",
    "        spec_ent = ant.spectral_entropy(ts, sf=sf, method='fft')\n",
    "\n",
    "\n",
    "        \n",
    "        results[\"app_entropy\"].append(app_ent)\n",
    "        results[\"sample_entropy\"].append(samp_ent)\n",
    "        results[\"spectral_entropy\"].append(spec_ent)\n",
    "    \n",
    "    return results"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "data_complexity_list = []\n",
    "for U_data_dir in U_data_list:\n",
    "    # Specify Anomaly Detector to use and data directory\n",
    "    \n",
    "\n",
    "    data_direc = './TSB-AD-U/'+U_data_dir\n",
    "\n",
    "    # Loading Data\n",
    "    df = pd.read_csv(data_direc).dropna()\n",
    "    data = df.iloc[:, 0:-1].values.astype(float)\n",
    "    if data.shape[1] == 1: \n",
    "        data = data.squeeze()\n",
    "        length, = data.shape\n",
    "        sample_num = max(0, (length - 256) // 1 + 1)\n",
    "\n",
    "        X = np.zeros((sample_num, 256))\n",
    "\n",
    "        for i in range(sample_num):\n",
    "            X[i, :] = data[i * 1: i * 1+ 256]\n",
    "\n",
    "        data_array = X[:, :, np.newaxis]\n",
    "    else:\n",
    "        sample_num = data.shape[0]\n",
    "\n",
    "        X = np.zeros((data.shape[0], data.shape[1]))\n",
    "        for i in range(sample_num):\n",
    "            X[i, :] = data[i, :]\n",
    "\n",
    "        data_array = X\n",
    "\n",
    "\n",
    "    result_dict = compute_complexity_measures(data_array.squeeze(2), sf=1.0)\n",
    "\n",
    "    df_results = pd.DataFrame(result_dict).mean().to_list()\n",
    "    data_complexity_list.append(['U',U_data_dir]+df_results)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Time complexity"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "TSB-AD",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.11"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
