{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import re\n",
    "import pdb"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [],
   "source": [
    "names = ['Sparse GPVAE', 'VAE', 'GPVAE with linear likelihood', 'Sparse GP-VAE 100']\n",
    "models = ['SGPVAE-250', 'VAE', 'SGPVAE-LL-100', 'SGPVAE-100']\n",
    "rounds = ['1', '2', '3']\n",
    "years = ['1980', '1981']\n",
    "variables = ['TMAX', 'TMIN', 'TAVG']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {},
   "outputs": [],
   "source": [
    "file = 'large_japan_results.txt'\n",
    "\n",
    "model_texts = {}\n",
    "for name in names:\n",
    "    model_texts[name] = ''\n",
    "\n",
    "with open(file, 'r') as f:\n",
    "    text = f.readlines()\n",
    "    \n",
    "    for line in text:\n",
    "        for i, name in enumerate(names):\n",
    "            if (name + '\\n') == line:\n",
    "                k = i\n",
    "                \n",
    "        model_texts[names[k]] += line"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'Sparse GPVAE': 'Sparse GPVAE\\nRound 1\\n1980:\\nTMAX: 3.736, 2.833\\nTMIN: 2.967, 2.585\\nTAVG: 2.258, 2.418\\n\\n1981:\\nTMAX: 3.367, 2.698\\nTMIN: 2.871, 2.580\\nTAVG: 2.119, 2.398\\n\\nRound 2\\n1980:\\nTMAX: 4.197, 2.945\\nTMIN: 3.008, 2.597\\nTAVG: 2.566, 2.460\\n\\n1981:\\nTMAX: 3.480, 2.650\\nTMIN: 3.142, 2.511\\nTAVG: 2.183, 3.246\\n\\nRound 3\\n1980:\\nTMAX: 4.249, 3.054\\nTMIN: 3.206, 2.646\\nTAVG: 2.269, 2.414\\n\\n1981:\\nTMAX: 3.292, 2.694\\nTMIN: 3.085, 2.591\\nTAVG: 2.100, 2.336\\n\\n',\n",
       " 'VAE': 'VAE\\nRound 1\\n1980:\\nTMAX: 5.046, 3.574\\nTMIN: 4.775, 3.365\\nTAVG: 2.895, 2.612\\n\\n1981:\\nTMAX: 5.041, 3.657\\nTMIN: 5.178, 3.579\\nTAVG: 3.634, 2.891\\n\\nRound 2\\n1980:\\nTMAX: 5.234, 3.302\\nTMIN: 5.072, 3.234\\nTAVG: 3.668, 2.857\\n\\n1981: \\nTMAX: 5.058, 3.306\\nTMIN: 5.379, 3.342\\nTAVG: 3.893, 2.937\\n\\nRound 3\\n1980: \\nTMAX: 6.139, 3.584\\nTMIN: 4.543, 3.170\\nTAVG: 3.404, 2.733\\n\\n1981: \\nTMAX: 4.850, 3.259\\nTMIN: 5.087, 3.383\\nTAVG: 3.581, 2.876\\n\\n',\n",
       " 'GPVAE with linear likelihood': 'GPVAE with linear likelihood\\nRound 1\\n1980:\\nTMAX: 4.088, 4.553\\nTMIN: 3.338, 3.320\\nTAVG: 2.388, 2.508\\n\\n1981:\\u2028TMAX: 3.787, 3.745\\nTMIN: 3.258, 3.078\\nTAVG: 2.602, 2.563\\n\\nRound 2\\n1980:\\u2028TMAX: 4.154, 3.362\\nTMIN: 3.247, 2.743\\nTAVG: 2.269, 2.290\\n\\n1981:\\nTMAX: 3.441, 2.875\\nTMIN: 3.331, 2.749\\nTAVG: 2.319, 2.335\\n\\nRound 3\\n1980:\\nTMAX: 3.218, 3.161\\nTMIN: 3.330, 2.699\\nTAVG: 2.409, 2.378\\n\\n1981:\\nTMAX: 4.282, 3.181\\nTMIN: 4.027, 2.992\\nTAVG: 3.603, 2.857\\n\\n\\n',\n",
       " 'Sparse GP-VAE 100': 'Sparse GP-VAE 100\\nRound 1\\n1980:\\nTMAX: 3.938, 2.837\\nTMIN: 3.175, 2.631\\nTAVG: 2.680, 2.521\\n\\n1981:\\nTMAX: 3.992, 2.882\\nTMIN: 3.628, 2.781\\nTAVG: 3.350, 2.700\\n\\nRound 2\\n1980:\\nTMAX: 3.998, 3.226\\nTMIN: 3.729, 2.967\\nTAVG: 2.802, 2.556\\n\\n1981: \\nTMAX: 3.553, 2.768\\nTMIN: 3.374, 2.740\\nTAVG: 3.172, 2.688\\n\\nRound 3\\n\\n'}"
      ]
     },
     "execution_count": 29,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model_texts"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "> <ipython-input-34-2c9ab8acc096>(2)<module>()\n",
      "-> for name, text in model_texts.items():\n",
      "(Pdb) good_numbers\n",
      "[3.736, 2.833, 2.967, 2.585, 2.258, 2.418, 3.367, 2.698, 2.871, 2.58, 2.119, 2.398, 4.197, 2.945, 3.008, 2.597, 2.566, 2.46, 3.48, 2.65, 3.142, 2.511, 2.183, 3.246, 4.249, 3.054, 3.206, 2.646, 2.269, 2.414, 3.292, 2.694, 3.085, 2.591, 2.1, 2.336]\n",
      "(Pdb) q\n"
     ]
    },
    {
     "ename": "BdbQuit",
     "evalue": "",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mBdbQuit\u001b[0m                                   Traceback (most recent call last)",
      "\u001b[0;32m<ipython-input-34-2c9ab8acc096>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[1;32m      1\u001b[0m \u001b[0mbad_numbers\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0;36m1.0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m2.0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m3.0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m1980.0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m1981.0\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 2\u001b[0;31m \u001b[0;32mfor\u001b[0m \u001b[0mname\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtext\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mmodel_texts\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m      3\u001b[0m     \u001b[0mnewstr\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m''\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mjoin\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mch\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mch\u001b[0m \u001b[0;32min\u001b[0m \u001b[0;34m'0123456789.'\u001b[0m \u001b[0;32melse\u001b[0m \u001b[0;34m' '\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mch\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mtext\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      4\u001b[0m     \u001b[0mnumber_list\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0mfloat\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mi\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mi\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mnewstr\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msplit\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      5\u001b[0m     \u001b[0mgood_numbers\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0mi\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mi\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mnumber_list\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mi\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mbad_numbers\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m<ipython-input-34-2c9ab8acc096>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[1;32m      1\u001b[0m \u001b[0mbad_numbers\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0;36m1.0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m2.0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m3.0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m1980.0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m1981.0\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 2\u001b[0;31m \u001b[0;32mfor\u001b[0m \u001b[0mname\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtext\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mmodel_texts\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m      3\u001b[0m     \u001b[0mnewstr\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m''\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mjoin\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mch\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mch\u001b[0m \u001b[0;32min\u001b[0m \u001b[0;34m'0123456789.'\u001b[0m \u001b[0;32melse\u001b[0m \u001b[0;34m' '\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mch\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mtext\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      4\u001b[0m     \u001b[0mnumber_list\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0mfloat\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mi\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mi\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mnewstr\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msplit\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      5\u001b[0m     \u001b[0mgood_numbers\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0mi\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mi\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mnumber_list\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mi\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mbad_numbers\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m/Library/Frameworks/Python.framework/Versions/3.7/lib/python3.7/bdb.py\u001b[0m in \u001b[0;36mtrace_dispatch\u001b[0;34m(self, frame, event, arg)\u001b[0m\n\u001b[1;32m     86\u001b[0m             \u001b[0;32mreturn\u001b[0m \u001b[0;31m# None\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     87\u001b[0m         \u001b[0;32mif\u001b[0m \u001b[0mevent\u001b[0m \u001b[0;34m==\u001b[0m \u001b[0;34m'line'\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 88\u001b[0;31m             \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mdispatch_line\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mframe\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m     89\u001b[0m         \u001b[0;32mif\u001b[0m \u001b[0mevent\u001b[0m \u001b[0;34m==\u001b[0m \u001b[0;34m'call'\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     90\u001b[0m             \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mdispatch_call\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mframe\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0marg\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m/Library/Frameworks/Python.framework/Versions/3.7/lib/python3.7/bdb.py\u001b[0m in \u001b[0;36mdispatch_line\u001b[0;34m(self, frame)\u001b[0m\n\u001b[1;32m    111\u001b[0m         \u001b[0;32mif\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstop_here\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mframe\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mor\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbreak_here\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mframe\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    112\u001b[0m             \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0muser_line\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mframe\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 113\u001b[0;31m             \u001b[0;32mif\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mquitting\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0;32mraise\u001b[0m \u001b[0mBdbQuit\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    114\u001b[0m         \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mtrace_dispatch\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    115\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;31mBdbQuit\u001b[0m: "
     ]
    }
   ],
   "source": [
    "bad_numbers = [1.0, 2.0, 3.0, 1980.0, 1981.0]\n",
    "\n",
    "base_idx = [0, 12, 24]\n",
    "\n",
    "tmax_rmse_idx = [0, 12, 24]\n",
    "tmax_mll_idx = [1, 13, 25]\n",
    "tmin_rmse_idx = [2, 14, 26]\n",
    "tmin_mll_idx = [3, 15, 27]\n",
    "tavg_rmse_idx = [4, 16, 28]\n",
    "tavg_mll_idx = [5, 17, 29]\n",
    "\n",
    "for i, (name, text) in enumerate(model_texts.items()):\n",
    "    model = models[i]\n",
    "    newstr = ''.join((ch if ch in '0123456789.' else ' ') for ch in text)\n",
    "    number_list = [float(i) for i in newstr.split()]\n",
    "    good_numbers = [i for i in number_list if i not in bad_numbers]\n",
    "    \n",
    "    for i, year in enumerate(years):\n",
    "        for j, metric in enumerate(['rmse', 'mll'])\n",
    "            for k, variable in enumerate(variables):\n",
    "                offset = 6*i + j + 2*k\n",
    "                idx = [k + offset for k in base_idx]\n",
    "                results[model][year][metric] = good_numbers[idx]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
