{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import numpy as np\n",
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_mse_mae1(PATH, settings_list, cw,patch_size, model_dim, load_epoch, ft_epoch):\n",
    "    \"\"\"Read the first-row 'mse' and 'mae' of every matching result CSV of one run.\n",
    "\n",
    "    The run directory is the first name in settings_list containing all of\n",
    "    'z3', 'patch{patch_size}', 'cw{cw}' and '_D{model_dim}'. Inside it, files\n",
    "    whose name contains 'acc', 'load_ep{load_epoch}' and 'ft_ep{ft_epoch}' are\n",
    "    read in ascending order of the integer that follows 'tw' in the first\n",
    "    '_'-separated token of the file name.\n",
    "\n",
    "    Every name test is a plain substring test, so 'patch12' also matches a\n",
    "    name that contains 'patch128'.\n",
    "\n",
    "    Args:\n",
    "        PATH: directory that holds the run directories.\n",
    "        settings_list: candidate run directory names (relative to PATH).\n",
    "        cw, patch_size, model_dim: values looked up in the directory name.\n",
    "        load_epoch, ft_epoch: values looked up in the file names.\n",
    "\n",
    "    Returns:\n",
    "        (mse_result, mae_result), two lists with one value per matching file.\n",
    "        A file that cannot be read or lacks either column contributes 999 to\n",
    "        both lists. If no directory matches, or the directory is empty, both\n",
    "        lists are [999, 999, 999, 999]. If the directory has files but none\n",
    "        matches, both lists are empty.\n",
    "\n",
    "    Raises:\n",
    "        IndexError, ValueError: a matching file name has no integer after 'tw'.\n",
    "        OSError: the run directory cannot be listed.\n",
    "    \"\"\"\n",
    "    missing = [999,999,999,999]\n",
    "\n",
    "    setting_tags = ('z3', f'patch{patch_size}', f'cw{cw}', f'_D{model_dim}')\n",
    "    matches = [s for s in settings_list if all(tag in s for tag in setting_tags)]\n",
    "    if not matches:\n",
    "        return list(missing), list(missing)\n",
    "    arch = os.path.join(PATH, matches[0])\n",
    "\n",
    "    files = os.listdir(arch)\n",
    "    if len(files)==0:\n",
    "        return list(missing), list(missing)\n",
    "    file_tags = ('acc', f'load_ep{load_epoch}', f'ft_ep{ft_epoch}')\n",
    "    files = [f for f in files if all(tag in f for tag in file_tags)]\n",
    "    # Numeric order, so that tw96 comes before tw192.\n",
    "    files.sort(key=lambda name: int(name.split('_')[0].split('tw')[1]))\n",
    "\n",
    "    mse_result = []\n",
    "    mae_result = []\n",
    "    for name in files:\n",
    "        try:\n",
    "            df = pd.read_csv(os.path.join(arch, name))\n",
    "            # Fetch both values before appending so the two lists stay aligned\n",
    "            # when only one of the columns is present.\n",
    "            mse, mae = df['mse'][0], df['mae'][0]\n",
    "        except Exception:\n",
    "            # Unreadable or incomplete file: keep its slot with the placeholder.\n",
    "            mse, mae = 999, 999\n",
    "        mse_result.append(mse)\n",
    "        mae_result.append(mae)\n",
    "    return mse_result, mae_result"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_mse_mae2(PATH, settings_list, cw,patch_size, model_dim, tau_temp, load_epoch, ft_epoch):\n",
    "    \"\"\"Read the first-row 'mse' and 'mae' of every matching result CSV of one run.\n",
    "\n",
    "    The run directory is the first name in settings_list containing all of\n",
    "    'z3', 'cw{cw}', 'patch{patch_size}', '_D{model_dim}' and\n",
    "    'tau_temp{tau_temp}'. Inside it, files whose name contains 'acc',\n",
    "    'load_ep{load_epoch}' and 'ft_ep{ft_epoch}' are read in ascending order of\n",
    "    the integer that follows 'tw' in the first '_'-separated token of the\n",
    "    file name.\n",
    "\n",
    "    Every name test is a plain substring test, so 'tau_temp1' also matches a\n",
    "    name that contains 'tau_temp10'.\n",
    "\n",
    "    Args:\n",
    "        PATH: directory that holds the run directories.\n",
    "        settings_list: candidate run directory names (relative to PATH).\n",
    "        cw, patch_size, model_dim, tau_temp: values looked up in the\n",
    "            directory name.\n",
    "        load_epoch, ft_epoch: values looked up in the file names.\n",
    "\n",
    "    Returns:\n",
    "        (mse_result, mae_result), two lists with one value per matching file.\n",
    "        A file that cannot be read or lacks either column contributes 999 to\n",
    "        both lists. If no directory matches, or the directory is empty, both\n",
    "        lists are [999, 999, 999, 999]. If the directory has files but none\n",
    "        matches, both lists are empty.\n",
    "\n",
    "    Raises:\n",
    "        IndexError, ValueError: a matching file name has no integer after 'tw'.\n",
    "        OSError: the run directory cannot be listed.\n",
    "    \"\"\"\n",
    "    missing = [999,999,999,999]\n",
    "\n",
    "    setting_tags = ('z3', f'cw{cw}', f'patch{patch_size}', f'_D{model_dim}',\n",
    "                    f'tau_temp{tau_temp}')\n",
    "    matches = [s for s in settings_list if all(tag in s for tag in setting_tags)]\n",
    "    if not matches:\n",
    "        return list(missing), list(missing)\n",
    "    arch = os.path.join(PATH, matches[0])\n",
    "\n",
    "    files = os.listdir(arch)\n",
    "    if len(files)==0:\n",
    "        return list(missing), list(missing)\n",
    "    file_tags = ('acc', f'load_ep{load_epoch}', f'ft_ep{ft_epoch}')\n",
    "    files = [f for f in files if all(tag in f for tag in file_tags)]\n",
    "    # Numeric order, so that tw96 comes before tw192.\n",
    "    files.sort(key=lambda name: int(name.split('_')[0].split('tw')[1]))\n",
    "\n",
    "    mse_result = []\n",
    "    mae_result = []\n",
    "    for name in files:\n",
    "        try:\n",
    "            df = pd.read_csv(os.path.join(arch, name))\n",
    "            # Fetch both values before appending so the two lists stay aligned\n",
    "            # when only one of the columns is present.\n",
    "            mse, mae = df['mse'][0], df['mae'][0]\n",
    "        except Exception:\n",
    "            # Unreadable or incomplete file: keep its slot with the placeholder.\n",
    "            mse, mae = 999, 999\n",
    "        mse_result.append(mse)\n",
    "        mae_result.append(mae)\n",
    "    return mse_result, mae_result"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_mse_mae3(PATH, settings_list, cw,patch_size, model_dim, tau_temp,tau_inst, load_epoch, ft_epoch):\n",
    "    \"\"\"Read the first-row 'mse' and 'mae' of every matching result CSV of one run.\n",
    "\n",
    "    The run directory is the first name in settings_list containing all of\n",
    "    'z3', 'cw{cw}', 'patch{patch_size}', '_D{model_dim}',\n",
    "    'tau_temp{tau_temp}' and 'tau_inst{tau_inst}'. Inside it, files whose name\n",
    "    contains 'acc', 'load_ep{load_epoch}' and 'ft_ep{ft_epoch}' are read in\n",
    "    ascending order of the integer that follows 'tw' in the first\n",
    "    '_'-separated token of the file name.\n",
    "\n",
    "    Every name test is a plain substring test, so 'tau_inst1' also matches a\n",
    "    name that contains 'tau_inst10'.\n",
    "\n",
    "    Args:\n",
    "        PATH: directory that holds the run directories.\n",
    "        settings_list: candidate run directory names (relative to PATH).\n",
    "        cw, patch_size, model_dim, tau_temp, tau_inst: values looked up in\n",
    "            the directory name.\n",
    "        load_epoch, ft_epoch: values looked up in the file names.\n",
    "\n",
    "    Returns:\n",
    "        (mse_result, mae_result), two lists with one value per matching file.\n",
    "        A file that cannot be read or lacks either column contributes 999 to\n",
    "        both lists. If no directory matches, or the directory is empty, both\n",
    "        lists are [999, 999, 999, 999]. If the directory has files but none\n",
    "        matches, both lists are empty.\n",
    "\n",
    "    Raises:\n",
    "        IndexError, ValueError: a matching file name has no integer after 'tw'.\n",
    "        OSError: the run directory cannot be listed.\n",
    "    \"\"\"\n",
    "    missing = [999,999,999,999]\n",
    "\n",
    "    setting_tags = ('z3', f'cw{cw}', f'patch{patch_size}', f'_D{model_dim}',\n",
    "                    f'tau_temp{tau_temp}', f'tau_inst{tau_inst}')\n",
    "    matches = [s for s in settings_list if all(tag in s for tag in setting_tags)]\n",
    "    if not matches:\n",
    "        return list(missing), list(missing)\n",
    "    arch = os.path.join(PATH, matches[0])\n",
    "\n",
    "    files = os.listdir(arch)\n",
    "    if len(files)==0:\n",
    "        return list(missing), list(missing)\n",
    "    file_tags = ('acc', f'load_ep{load_epoch}', f'ft_ep{ft_epoch}')\n",
    "    files = [f for f in files if all(tag in f for tag in file_tags)]\n",
    "    # Numeric order, so that tw96 comes before tw192.\n",
    "    files.sort(key=lambda name: int(name.split('_')[0].split('tw')[1]))\n",
    "\n",
    "    mse_result = []\n",
    "    mae_result = []\n",
    "    for name in files:\n",
    "        try:\n",
    "            df = pd.read_csv(os.path.join(arch, name))\n",
    "            # Fetch both values before appending so the two lists stay aligned\n",
    "            # when only one of the columns is present.\n",
    "            mse, mae = df['mse'][0], df['mae'][0]\n",
    "        except Exception:\n",
    "            # Unreadable or incomplete file: keep its slot with the placeholder.\n",
    "            mse, mae = 999, 999\n",
    "        mse_result.append(mse)\n",
    "        mae_result.append(mae)\n",
    "    return mse_result, mae_result"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_summary(dataset_list, type_='hard',\n",
    "                saved_models_dir='/home/seunghan9613/PatchTST_sim/PatchTST_self_supervised/saved_models/'):\n",
    "    \"\"\"Print the stored MSE values of each dataset over a fixed hyper-parameter grid.\n",
    "\n",
    "    For every dataset the run directories under\n",
    "    <saved_models_dir>/<data>2<data>/masked_patchtst_sim_half_v3_mean_FC2_sep_R/based_model/max\n",
    "    are listed, names containing 'no_share' are dropped, and the rest is\n",
    "    narrowed by type_:\n",
    "\n",
    "    * 'hard'  - names without 'tau'; every combination whose first MSE is not\n",
    "      the 999 placeholder is printed.\n",
    "    * 'soft1' - names with 'tau' but without 'tau_inst'; per (cw, ps) only the\n",
    "      combinations that lower the running minimum of the summed MSE are printed.\n",
    "    * 'soft2' - names with 'tau_inst'; combinations with exactly four results\n",
    "      whose first MSE is not 999 are printed.\n",
    "\n",
    "    Any other type_ prints only the separator line of each dataset.\n",
    "\n",
    "    Args:\n",
    "        dataset_list: dataset names, e.g. ['etth1'].\n",
    "        type_: 'hard', 'soft1' or 'soft2'.\n",
    "        saved_models_dir: root directory of the saved models.\n",
    "\n",
    "    Raises:\n",
    "        OSError: the results directory of a dataset cannot be listed.\n",
    "    \"\"\"\n",
    "    cw_grid = [336,512,768]\n",
    "    ps_grid = [12,18,24]\n",
    "    dim_grid = [32,64,128,256]\n",
    "    tau_grid = [1,3,5]\n",
    "    epoch_grid = [(load_ep, ft_ep)\n",
    "                  for load_ep in [20,40,60,80,100,120,150]\n",
    "                  for ft_ep in [20,40]]\n",
    "\n",
    "    for data in dataset_list:\n",
    "        print('='*50)\n",
    "        PATH = os.path.join(saved_models_dir, f'{data}2{data}',\n",
    "                            'masked_patchtst_sim_half_v3_mean_FC2_sep_R/based_model/max')\n",
    "        settings = [x for x in os.listdir(PATH) if 'no_share' not in x]\n",
    "\n",
    "        if type_ == 'hard':\n",
    "            settings = [x for x in settings if 'tau' not in x]\n",
    "            for cw in cw_grid:\n",
    "                for ps in ps_grid:\n",
    "                    for dim in dim_grid:\n",
    "                        for load_ep, ft_ep in epoch_grid:\n",
    "                            mse_result, mae_result = get_mse_mae1(PATH=PATH, settings_list=settings,\n",
    "                                                                  cw=cw, patch_size=ps, model_dim=dim,\n",
    "                                                                  load_epoch=load_ep, ft_epoch=ft_ep)\n",
    "                            # An empty list means no file matched; a leading 999 is the\n",
    "                            # placeholder for a missing or unreadable result.\n",
    "                            if mse_result and mse_result[0] != 999:\n",
    "                                print([cw,ps,dim,load_ep,ft_ep],np.mean(mse_result).round(3), mse_result)\n",
    "\n",
    "        elif type_ == 'soft1':\n",
    "            settings = [x for x in settings if 'tau' in x and 'tau_inst' not in x]\n",
    "            for cw in cw_grid:\n",
    "                for ps in ps_grid:\n",
    "                    print(f'-------- cw={cw},ps={ps} ---------')\n",
    "                    min_val = 999\n",
    "                    for dim in dim_grid:\n",
    "                        for tau1 in tau_grid:\n",
    "                            for load_ep, ft_ep in epoch_grid:\n",
    "                                mse_result, mae_result = get_mse_mae2(PATH=PATH, settings_list=settings,\n",
    "                                                                      cw=cw, patch_size=ps,\n",
    "                                                                      model_dim=dim, tau_temp=tau1,\n",
    "                                                                      load_epoch=load_ep, ft_epoch=ft_ep)\n",
    "                                if mse_result and mse_result[0] != 999:\n",
    "                                    total = np.sum(mse_result)\n",
    "                                    # Only report combinations that improve on the best so far.\n",
    "                                    if total < min_val:\n",
    "                                        print([cw,ps,dim,tau1,load_ep,ft_ep],np.mean(mse_result).round(3),mse_result)\n",
    "                                        min_val = total\n",
    "\n",
    "        elif type_ == 'soft2':\n",
    "            # Every name containing 'tau_inst' also contains 'tau'.\n",
    "            settings = [x for x in settings if 'tau_inst' in x]\n",
    "            for cw in cw_grid:\n",
    "                for ps in ps_grid:\n",
    "                    for dim in dim_grid:\n",
    "                        for tau1 in tau_grid:\n",
    "                            for tau2 in tau_grid:\n",
    "                                for load_ep, ft_ep in epoch_grid:\n",
    "                                    mse_result, mae_result = get_mse_mae3(PATH=PATH, settings_list=settings,\n",
    "                                                                          cw=cw, patch_size=ps,\n",
    "                                                                          model_dim=dim,\n",
    "                                                                          tau_temp=tau1, tau_inst=tau2,\n",
    "                                                                          load_epoch=load_ep, ft_epoch=ft_ep)\n",
    "                                    if len(mse_result) == 4 and mse_result[0] != 999:\n",
    "                                        print([cw,ps,dim,tau1,tau2,load_ep,ft_ep],np.mean(mse_result).round(3),mse_result)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_summary_soft1(dataset_list, type_='soft1',\n",
    "                      saved_models_dir='/home/seunghan9613/PatchTST_sim/PatchTST_self_supervised/saved_models/'):\n",
    "    \"\"\"Print, for every grid combination, the stored MSE values of each dataset.\n",
    "\n",
    "    Only run directories whose name contains 'tau' but neither 'tau_inst' nor\n",
    "    'no_share' are considered; results are read with get_mse_mae2. For each\n",
    "    combination a separator and the combination are printed, followed by one\n",
    "    line per dataset that has at least one result (999 placeholders included).\n",
    "\n",
    "    Args:\n",
    "        dataset_list: dataset names, e.g. ['etth1'].\n",
    "        type_: accepted for backward compatibility; not used.\n",
    "        saved_models_dir: root directory of the saved models.\n",
    "    \"\"\"\n",
    "    # The directory listing does not depend on the grid, so read it once per dataset.\n",
    "    runs = []\n",
    "    for data in dataset_list:\n",
    "        PATH = os.path.join(saved_models_dir, f'{data}2{data}',\n",
    "                            'masked_patchtst_sim_half_v3_mean_FC2_sep_R/based_model/max')\n",
    "        try:\n",
    "            names = os.listdir(PATH)\n",
    "        except OSError:\n",
    "            # A dataset without a results directory is skipped.\n",
    "            continue\n",
    "        settings = [x for x in names\n",
    "                    if 'no_share' not in x and 'tau' in x and 'tau_inst' not in x]\n",
    "        runs.append((data, PATH, settings))\n",
    "\n",
    "    for cw in [336,512,768]:\n",
    "        for ps in [12,18,24]:\n",
    "            print(f'-------- cw={cw},ps={ps} ---------')\n",
    "            for dim in [32,64,128,256]:\n",
    "                for tau1 in [1,3,5]:\n",
    "                    for load_ep in [40,60,80,100,120,150]:\n",
    "                        for ft_ep in [20,40]:\n",
    "                            print('='*40)\n",
    "                            print([cw,ps,dim,tau1,load_ep,ft_ep])\n",
    "                            for data, PATH, settings in runs:\n",
    "                                try:\n",
    "                                    mse_result, mae_result = get_mse_mae2(PATH=PATH, settings_list=settings,\n",
    "                                                                          cw=cw, patch_size=ps,\n",
    "                                                                          model_dim=dim, tau_temp=tau1,\n",
    "                                                                          load_epoch=load_ep, ft_epoch=ft_ep)\n",
    "                                except (OSError, IndexError, ValueError):\n",
    "                                    # Unreadable run directory or unexpected file name:\n",
    "                                    # skip this dataset for this combination.\n",
    "                                    continue\n",
    "                                if len(mse_result)>0:\n",
    "                                    print(data, np.mean(mse_result).round(3), mse_result)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_summary_soft2(dataset_list, cw_list = [336,512,768],\n",
    "                      ps_list = [12,18,24], \n",
    "                      load_ep_list = [40,60,80,100,120,150],\n",
    "                      ft_ep_list = [20,40],\n",
    "                      type_='soft1',\n",
    "                      saved_models_dir='/home/seunghan9613/PatchTST_sim/PatchTST_self_supervised/saved_models/'):\n",
    "    \"\"\"Print, per (cw, ps), each combination that lowers the summed MSE so far.\n",
    "\n",
    "    Only run directories whose name contains 'tau' but neither 'tau_inst' nor\n",
    "    'no_share' are considered; results are read with get_mse_mae2. For every\n",
    "    (dim, tau1, load_ep, ft_ep) the MSE values of all datasets are summed, and\n",
    "    the combination is printed together with its per-dataset rows whenever the\n",
    "    sum is below the smallest sum seen so far for the current (cw, ps).\n",
    "\n",
    "    The 999 placeholders returned for missing runs are part of the sum, so a\n",
    "    combination with missing runs only wins when nothing better exists.\n",
    "    Combinations without any result at all are skipped.\n",
    "\n",
    "    Args:\n",
    "        dataset_list: dataset names, e.g. ['etth1'].\n",
    "        cw_list, ps_list, load_ep_list, ft_ep_list: grid values to sweep.\n",
    "        type_: accepted for backward compatibility; not used.\n",
    "        saved_models_dir: root directory of the saved models.\n",
    "    \"\"\"\n",
    "    # The directory listing does not depend on the grid, so read it once per dataset.\n",
    "    runs = []\n",
    "    for data in dataset_list:\n",
    "        PATH = os.path.join(saved_models_dir, f'{data}2{data}',\n",
    "                            'masked_patchtst_sim_half_v3_mean_FC2_sep_R/based_model/max')\n",
    "        try:\n",
    "            names = os.listdir(PATH)\n",
    "        except OSError:\n",
    "            # A dataset without a results directory is skipped.\n",
    "            continue\n",
    "        settings = [x for x in names\n",
    "                    if 'no_share' not in x and 'tau' in x and 'tau_inst' not in x]\n",
    "        runs.append((data, PATH, settings))\n",
    "\n",
    "    for cw in cw_list:\n",
    "        for ps in ps_list:\n",
    "            min_val = 999999\n",
    "            print('='*60)\n",
    "            print(f'-------- cw={cw},ps={ps} ---------')\n",
    "            print('='*60)\n",
    "            for dim in [32,64,128,256]:\n",
    "                for tau1 in [1,3,5]:\n",
    "                    for load_ep in load_ep_list:\n",
    "                        for ft_ep in ft_ep_list:\n",
    "                            data_sum = 0\n",
    "                            data_results = []\n",
    "                            for data, PATH, settings in runs:\n",
    "                                try:\n",
    "                                    mse_result, mae_result = get_mse_mae2(PATH=PATH, settings_list=settings,\n",
    "                                                                          cw=cw, patch_size=ps,\n",
    "                                                                          model_dim=dim, tau_temp=tau1,\n",
    "                                                                          load_epoch=load_ep, ft_epoch=ft_ep)\n",
    "                                except (OSError, IndexError, ValueError):\n",
    "                                    # Unreadable run directory or unexpected file name:\n",
    "                                    # skip this dataset for this combination.\n",
    "                                    continue\n",
    "                                if len(mse_result)>0:\n",
    "                                    data_sum += np.sum(mse_result)\n",
    "                                    data_results.append([data, np.mean(mse_result).round(3), mse_result])\n",
    "\n",
    "                            # Without this guard a combination with no results has sum 0,\n",
    "                            # becomes the minimum and hides every later real result.\n",
    "                            if not data_results:\n",
    "                                continue\n",
    "\n",
    "                            if min_val > data_sum:\n",
    "                                min_val = data_sum\n",
    "                                print('-'*50)\n",
    "                                print([dim,tau1,load_ep,ft_ep])\n",
    "                                for k in data_results:\n",
    "                                    print(k)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_summary_hard(dataset_list, cw_list = [336,512,768],\n",
    "                      ps_list = [12,18,24], \n",
    "                      load_ep_list = [40,60,80,100,120,150],\n",
    "                      ft_ep_list = [20,40],\n",
    "                      type_='soft1',\n",
    "                      saved_models_dir='/home/seunghan9613/PatchTST_sim/PatchTST_self_supervised/saved_models/'):\n",
    "    \"\"\"Print, per (cw, ps), each combination that lowers the summed MSE so far.\n",
    "\n",
    "    Only run directories whose name contains neither 'tau' nor 'no_share' are\n",
    "    considered; results are read with get_mse_mae1. For every\n",
    "    (dim, load_ep, ft_ep) the MSE values of all datasets are summed, and the\n",
    "    combination is printed together with its per-dataset rows whenever the sum\n",
    "    is below the smallest sum seen so far for the current (cw, ps).\n",
    "\n",
    "    The 999 placeholders returned for missing runs are part of the sum, so a\n",
    "    combination with missing runs only wins when nothing better exists.\n",
    "    Combinations without any result at all are skipped.\n",
    "\n",
    "    Args:\n",
    "        dataset_list: dataset names, e.g. ['etth1'].\n",
    "        cw_list, ps_list, load_ep_list, ft_ep_list: grid values to sweep.\n",
    "        type_: accepted for backward compatibility; not used.\n",
    "        saved_models_dir: root directory of the saved models.\n",
    "    \"\"\"\n",
    "    # The directory listing does not depend on the grid, so read it once per dataset.\n",
    "    runs = []\n",
    "    for data in dataset_list:\n",
    "        PATH = os.path.join(saved_models_dir, f'{data}2{data}',\n",
    "                            'masked_patchtst_sim_half_v3_mean_FC2_sep_R/based_model/max')\n",
    "        try:\n",
    "            names = os.listdir(PATH)\n",
    "        except OSError:\n",
    "            # A dataset without a results directory is skipped.\n",
    "            continue\n",
    "        settings = [x for x in names if 'no_share' not in x and 'tau' not in x]\n",
    "        runs.append((data, PATH, settings))\n",
    "\n",
    "    for cw in cw_list:\n",
    "        for ps in ps_list:\n",
    "            min_val = 999999\n",
    "            print('='*60)\n",
    "            print(f'-------- cw={cw},ps={ps} ---------')\n",
    "            print('='*60)\n",
    "            for dim in [32,64,128,256]:\n",
    "                for load_ep in load_ep_list:\n",
    "                    for ft_ep in ft_ep_list:\n",
    "                        data_sum = 0\n",
    "                        data_results = []\n",
    "                        for data, PATH, settings in runs:\n",
    "                            try:\n",
    "                                mse_result, mae_result = get_mse_mae1(PATH=PATH, settings_list=settings,\n",
    "                                                                      cw=cw, patch_size=ps,\n",
    "                                                                      model_dim=dim,\n",
    "                                                                      load_epoch=load_ep, ft_epoch=ft_ep)\n",
    "                            except (OSError, IndexError, ValueError):\n",
    "                                # Unreadable run directory or unexpected file name:\n",
    "                                # skip this dataset for this combination.\n",
    "                                continue\n",
    "                            if len(mse_result)>0:\n",
    "                                data_sum += np.sum(mse_result)\n",
    "                                data_results.append([data, np.mean(mse_result).round(3), mse_result])\n",
    "\n",
    "                        # Without this guard a combination with no results has sum 0,\n",
    "                        # becomes the minimum and hides every later real result.\n",
    "                        if not data_results:\n",
    "                            continue\n",
    "\n",
    "                        if min_val > data_sum:\n",
    "                            min_val = data_sum\n",
    "                            print('-'*50)\n",
    "                            print([dim,load_ep,ft_ep])\n",
    "                            for k in data_results:\n",
    "                                print(k)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============================================================\n",
      "-------- cw=512,ps=18 ---------\n",
      "============================================================\n",
      "--------------------------------------------------\n",
      "[32, 40, 20]\n",
      "['etth1', 0.423, [0.368087, 0.413445, 0.435895, 0.474134]]\n",
      "--------------------------------------------------\n",
      "[32, 40, 40]\n",
      "['etth1', 0.422, [0.369745, 0.408623, 0.428604, 0.482521]]\n",
      "--------------------------------------------------\n",
      "[32, 100, 20]\n",
      "['etth1', 0.422, [0.371667, 0.410078, 0.431848, 0.475518]]\n",
      "--------------------------------------------------\n",
      "[32, 120, 20]\n",
      "['etth1', 0.422, [0.372146, 0.404445, 0.436103, 0.475426]]\n",
      "--------------------------------------------------\n",
      "[32, 150, 20]\n",
      "['etth1', 0.421, [0.37102, 0.404673, 0.431576, 0.476186]]\n",
      "--------------------------------------------------\n",
      "[64, 40, 40]\n",
      "['etth1', 0.415, [0.368505, 0.402619, 0.427971, 0.460174]]\n"
     ]
    }
   ],
   "source": [
    "# Sweep the stored etth1 runs for cw=512 and patch size 18 with get_summary_hard.\n",
    "dataset_list = ['etth1']\n",
    "\n",
    "get_summary_hard(\n",
    "    dataset_list,\n",
    "    cw_list=[512],\n",
    "    ps_list=[18],\n",
    "    load_ep_list=[40, 60, 80, 100, 120, 150],\n",
    "    ft_ep_list=[20, 40],\n",
    "    type_='soft1',\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============================================================\n",
      "-------- cw=512,ps=18 ---------\n",
      "============================================================\n",
      "--------------------------------------------------\n",
      "[32, 1, 40, 20]\n",
      "['etth1', 0.419, [0.368108, 0.40973, 0.42676, 0.46984]]\n",
      "--------------------------------------------------\n",
      "[64, 1, 40, 40]\n",
      "['etth1', 0.418, [0.373071, 0.406397, 0.423118, 0.467908]]\n"
     ]
    }
   ],
   "source": [
    "# Sweep the stored etth1 runs for cw=512 and patch size 18 with get_summary_soft2.\n",
    "dataset_list = ['etth1']\n",
    "\n",
    "get_summary_soft2(\n",
    "    dataset_list,\n",
    "    cw_list=[512],\n",
    "    ps_list=[18],\n",
    "    load_ep_list=[40, 60, 80, 100, 120, 150],\n",
    "    ft_ep_list=[20, 40],\n",
    "    type_='soft1',\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============================================================\n",
      "-------- cw=512,ps=18 ---------\n",
      "============================================================\n",
      "--------------------------------------------------\n",
      "[32, 1, 40, 20]\n",
      "['ettm1', 999.0, [999, 999, 999, 999]]\n"
     ]
    }
   ],
   "source": [
    "# Sweep the stored ettm1 runs for cw=512 and patch size 18 with get_summary_soft2.\n",
    "dataset_list = ['ettm1']\n",
    "\n",
    "get_summary_soft2(\n",
    "    dataset_list,\n",
    "    cw_list=[512],\n",
    "    ps_list=[18],\n",
    "    load_ep_list=[40, 60, 80, 100, 120, 150],\n",
    "    ft_ep_list=[20, 40],\n",
    "    type_='soft1',\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "ssl_ts",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.11"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
