{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "67576132",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Couldn't import dot_parser, loading of dot files will not be possible.\n"
     ]
    }
   ],
   "source": [
    "from math import inf\n",
    "import numpy as np\n",
    "import scipy\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "import torch.optim as optim\n",
    "import gymnasium as gym\n",
    "import pandas as pd\n",
    "from datetime import datetime\n",
    "from sklearn.base import BaseEstimator\n",
    "from realkd.boosting import WeightUpdateMethod\n",
    "from pandas import qcut\n",
    "from realkd.rules import SquaredLoss, AdditiveRuleEnsemble, Rule\n",
    "from realkd.search import Context\n",
    "\n",
    "import warnings\n",
    "warnings.filterwarnings(\"ignore\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "62024ef9-a84a-414f-92db-e46f22bde7bb",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import gymnasium as gym\n",
    "import numpy as np\n",
    "import random\n",
    "from collections import deque\n",
    "from realkd.boosting import GradientBoostingObjectiveMWG, GradientBoostingObjectiveGPE, OrthogonalBoostingObjective, \\\n",
    "    FullyCorrective, LineSearch, GeneralRuleBoostingEstimator, \\\n",
    "    OrthogonalBoostingObjectiveShorter\n",
    "from realkd.rules import SquaredLoss, AdditiveRuleEnsemble, Rule\n",
    "import pandas as pd\n",
    "import matplotlib.pyplot as plt\n",
    "# import matplotlib.colors as mcolors\n",
    "# import matplotlib.patches as patches\n",
    "import warnings\n",
    "\n",
    "# Set EnergyPlus path - modify this to your installation path\n",
    "os.environ['EPLUS_PATH'] = \"/Applications/EnergyPlus-24-2-0\"  # Modify this path\n",
    "\n",
    "# Import sinergym after setting EPLUS_PATH\n",
    "import sinergym\n",
    "from gymnasium.spaces import Discrete\n",
    "\n",
    "# Suppress warnings\n",
    "warnings.filterwarnings('ignore')\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "08221e5a-32a6-4e8d-ad37-0755b3d82dd6",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['/opt/anaconda3/envs/sinergym/lib/python312.zip', '/opt/anaconda3/envs/sinergym/lib/python3.12', '/opt/anaconda3/envs/sinergym/lib/python3.12/lib-dynload', '', '/opt/anaconda3/envs/sinergym/lib/python3.12/site-packages', '/Users/fanyang/Downloads/sinergym-main', '/Applications/EnergyPlus-24-2-0', '/Applications/EnergyPlus-24-2-0/pyenergyplus']\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "import sys\n",
    "\n",
    "# Take the EnergyPlus location from EPLUS_PATH (set in the imports cell above) so the\n",
    "# install directory is configured in one place; fall back to the previous literal.\n",
    "eplus_root = os.environ.get('EPLUS_PATH', \"/Applications/EnergyPlus-24-2-0\")\n",
    "for eplus_dir in (eplus_root, os.path.join(eplus_root, \"pyenergyplus\")):\n",
    "    # Only append missing entries so that re-running this cell does not grow sys.path\n",
    "    if eplus_dir not in sys.path:\n",
    "        sys.path.append(eplus_dir)\n",
    "\n",
    "print(sys.path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "87e6fae7-baea-435d-8e3a-97ec683d49d7",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Separate control wrapper for heating and cooling\n",
    "class DualTemperatureControl(gym.Wrapper):\n",
    "    \"\"\"Discrete action wrapper around an env with a [heating, cooling] setpoint action.\n",
    "\n",
    "    With H heating and C cooling setpoints the wrapper exposes H + C actions:\n",
    "    actions 0..H-1 select a heating setpoint (paired with the middle cooling\n",
    "    setpoint) and actions H..H+C-1 select a cooling setpoint (paired with the\n",
    "    middle heating setpoint).\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, env, heating_steps=7, cooling_steps=7):\n",
    "        \"\"\"\n",
    "        Initialize the dual temperature control wrapper with separate heating and cooling actions.\n",
    "\n",
    "        Args:\n",
    "            env: The environment to wrap; index 0 of its action bounds is read as the\n",
    "                heating range and index 1 as the cooling range\n",
    "            heating_steps: Number of discrete heating temperature values\n",
    "            cooling_steps: Number of discrete cooling temperature values\n",
    "\n",
    "        Raises:\n",
    "            AssertionError: If some heating setpoint is not below every cooling setpoint\n",
    "        \"\"\"\n",
    "        super(DualTemperatureControl, self).__init__(env)\n",
    "\n",
    "        # Get action space bounds\n",
    "        self.heating_low = env.action_space.low[0]\n",
    "        self.heating_high = env.action_space.high[0]\n",
    "        self.cooling_low = env.action_space.low[1]\n",
    "        self.cooling_high = env.action_space.high[1]\n",
    "\n",
    "        # Important: Ensure cooling is always higher than heating\n",
    "        # In EnergyPlus, we must maintain cooling_setpoint > heating_setpoint\n",
    "        min_gap = 0.5  # Minimum gap between heating and cooling\n",
    "\n",
    "        # Evenly spaced grids rounded to whole degrees; the rounding can make the\n",
    "        # spacing between neighbouring setpoints uneven\n",
    "        self.heating_setpoints = np.round(np.linspace(self.heating_low, self.heating_high - min_gap, heating_steps))\n",
    "        self.cooling_setpoints = np.round(np.linspace(self.cooling_low + min_gap, self.cooling_high, cooling_steps))\n",
    "\n",
    "        # Ensure all heating setpoints are less than all cooling setpoints\n",
    "        assert np.max(self.heating_setpoints) < np.min(self.cooling_setpoints), \\\n",
    "            \"Heating setpoints must be less than cooling setpoints\"\n",
    "\n",
    "        # Create separate action spaces for heating and cooling\n",
    "        self.heating_action_space = Discrete(len(self.heating_setpoints))\n",
    "        self.cooling_action_space = Discrete(len(self.cooling_setpoints))\n",
    "\n",
    "        # Create a combined action space (for convenience)\n",
    "        self.action_space = Discrete(len(self.heating_setpoints) + len(self.cooling_setpoints))\n",
    "\n",
    "        # Print action space information\n",
    "        print(f\"Heating setpoints: {self.heating_setpoints}\")\n",
    "        print(f\"Cooling setpoints: {self.cooling_setpoints}\")\n",
    "        print(f\"Total action space size: {self.action_space.n}\")\n",
    "\n",
    "    def step(self, action):\n",
    "        \"\"\"Translate a discrete action into [heating, cooling] and step the wrapped env.\n",
    "\n",
    "        Args:\n",
    "            action: Index into the combined action space, 0 <= action < H + C\n",
    "\n",
    "        Returns:\n",
    "            The (obs, reward, terminated, truncated, info) tuple of the wrapped env\n",
    "\n",
    "        Raises:\n",
    "            IndexError: If the action index is outside the combined action space\n",
    "        \"\"\"\n",
    "        num_heating = len(self.heating_setpoints)\n",
    "        num_actions = num_heating + len(self.cooling_setpoints)\n",
    "\n",
    "        # Reject out-of-range indices explicitly: a negative index would otherwise\n",
    "        # silently wrap around and pick a setpoint from the other end of the grid\n",
    "        action = int(action)\n",
    "        if not 0 <= action < num_actions:\n",
    "            raise IndexError(f\"Action {action} is outside of the discrete action space [0, {num_actions})\")\n",
    "\n",
    "        # Determine if this is a heating or cooling action\n",
    "        if action < num_heating:\n",
    "            # This is a heating action\n",
    "            heating_setpoint = self.heating_setpoints[action]\n",
    "            # Use the middle cooling setpoint by default\n",
    "            cooling_setpoint = self.cooling_setpoints[len(self.cooling_setpoints) // 2]\n",
    "        else:\n",
    "            # This is a cooling action\n",
    "            cooling_setpoint = self.cooling_setpoints[action - num_heating]\n",
    "            # Use the middle heating setpoint by default\n",
    "            heating_setpoint = self.heating_setpoints[num_heating // 2]\n",
    "\n",
    "        # Ensure the values are within the allowed range and of the correct type\n",
    "        heating_setpoint = float(np.clip(heating_setpoint, self.heating_low, self.heating_high))\n",
    "        cooling_setpoint = float(np.clip(cooling_setpoint, self.cooling_low, self.cooling_high))\n",
    "\n",
    "        # Format according to environment's expected action format\n",
    "        actual_action = np.array([heating_setpoint, cooling_setpoint], dtype=np.float32)\n",
    "\n",
    "        # Ensure the action is within bounds\n",
    "        if not self.env.action_space.contains(actual_action):\n",
    "            print(f\"Warning: Action {actual_action} is outside of bounds {self.env.action_space.low} - {self.env.action_space.high}\")\n",
    "            actual_action = np.clip(actual_action, self.env.action_space.low, self.env.action_space.high)\n",
    "\n",
    "        try:\n",
    "            # Pass the converted action to the environment\n",
    "            obs, reward, terminated, truncated, info = self.env.step(actual_action)\n",
    "            return obs, reward, terminated, truncated, info\n",
    "        except (AssertionError, TypeError) as e:\n",
    "            # Report why the action was rejected instead of discarding the exception\n",
    "            print(f\"Error with action {actual_action}: {e!r}. Trying with a safe action instead.\")\n",
    "            # Use a safe middle action as fallback\n",
    "            safe_action = np.array([\n",
    "                (self.heating_low + self.heating_high) / 2,\n",
    "                (self.cooling_low + self.cooling_high) / 2\n",
    "            ], dtype=np.float32)\n",
    "            obs, reward, terminated, truncated, info = self.env.step(safe_action)\n",
    "            return obs, reward, terminated, truncated, info\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "dc43db5a-8ac7-48da-85da-97fab6666ecc",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Define an observation normalization wrapper\n",
    "class SimpleNormalizeObservation(gym.Wrapper):\n",
    "    \"\"\"Wrapper that standardizes observations with fixed statistics.\n",
    "\n",
    "    The statistics are created on the first ``reset`` as a zero mean and a unit\n",
    "    standard deviation and are never updated by this class, so observations are\n",
    "    returned essentially unchanged (divided by ``1 + 1e-8``).\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, env):\n",
    "        \"\"\"Wrap ``env``; the statistics stay unset until the first ``reset``.\"\"\"\n",
    "        super().__init__(env)\n",
    "        self.obs_mean = None\n",
    "        self.obs_std = None\n",
    "\n",
    "    def _normalize(self, obs):\n",
    "        \"\"\"Return ``(obs - mean) / (std + 1e-8)`` using the stored statistics.\"\"\"\n",
    "        centered = obs - self.obs_mean\n",
    "        return centered / (self.obs_std + 1e-8)\n",
    "\n",
    "    def reset(self, **kwargs):\n",
    "        \"\"\"Reset the wrapped env and return the normalized observation and the info.\"\"\"\n",
    "        raw_obs, info = self.env.reset(**kwargs)\n",
    "        if self.obs_mean is None:\n",
    "            # First reset: the statistics take the shape and dtype of the observation\n",
    "            self.obs_mean = np.zeros_like(raw_obs)\n",
    "            self.obs_std = np.ones_like(raw_obs)\n",
    "        return self._normalize(raw_obs), info\n",
    "\n",
    "    def step(self, action):\n",
    "        \"\"\"Step the wrapped env and normalize only the observation of the result.\"\"\"\n",
    "        raw_obs, reward, terminated, truncated, info = self.env.step(action)\n",
    "        return self._normalize(raw_obs), reward, terminated, truncated, info\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9ae9604e-9a8a-436d-bcbc-3613d7d2a53e",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ad244c21-e8b9-44aa-8d21-782a3cfef9f1",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "10619434-39c2-4625-9f7c-11dc7e1be7aa",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "8b8f01e2",
   "metadata": {},
   "outputs": [],
   "source": [
    "# !pip install \"gymnasium[box2d]\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "db545637",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "#==============================================================================================#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Creating Gymnasium environment.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Name: demo-v1\u001b[0m\n",
      "#==============================================================================================#\n",
      "\u001b[38;20m[MODEL] (INFO) : Experiment working directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Working directory: /Users/fanyang/FIT_Research/FCOGB/Eplus-env-demo-v1-res16\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Model Config is correct.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Update building model Output:Variable with variable names.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Update building model Output:Meter with meter names.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Extra config: runperiod updated to {'apply_weekend_holiday_rule': 'No', 'begin_day_of_month': 1, 'begin_month': 1, 'begin_year': 1991, 'day_of_week_for_start_day': 'Monday', 'end_day_of_month': 1, 'end_month': 3, 'end_year': 1991, 'use_weather_file_daylight_saving_period': 'Yes', 'use_weather_file_holidays_and_special_days': 'Yes', 'use_weather_file_rain_indicators': 'Yes', 'use_weather_file_snow_indicators': 'Yes'}\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Updated episode length (seconds): 5184000.0\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Updated timestep size (seconds): 3600.0\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Updated timesteps per episode: 1440\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Runperiod established.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode length (seconds): 5184000.0\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : timestep size (seconds): 3600.0\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : timesteps per episode: 1440\u001b[0m\n",
      "\u001b[38;20m[REWARD] (INFO) : Reward function initialized.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Environment created successfully.\u001b[0m\n",
      "cpu\n"
     ]
    }
   ],
   "source": [
    "# Create the Eplus-demo-v1 environment and select the torch device\n",
    "env = gym.make(\"Eplus-demo-v1\")\n",
    "device = torch.device(\"cpu\" if not torch.cuda.is_available() else \"cuda\")\n",
    "print(device)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "49645347-408b-4608-b016-e42773559aea",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Heating range: 15.0 to 22.5\n",
      "Cooling range: 22.5 to 30.0\n",
      "Heating setpoints: [15. 16. 17. 18. 20. 21. 22.]\n",
      "Cooling setpoints: [23. 24. 25. 26. 28. 29. 30.]\n",
      "Total action space size: 14\n"
     ]
    }
   ],
   "source": [
    "# Read the continuous bounds before the env is wrapped (index 0: heating, index 1: cooling)\n",
    "heating_low, cooling_low = env.action_space.low[0], env.action_space.low[1]\n",
    "heating_high, cooling_high = env.action_space.high[0], env.action_space.high[1]\n",
    "print(f\"Heating range: {heating_low} to {heating_high}\")\n",
    "print(f\"Cooling range: {cooling_low} to {cooling_high}\")\n",
    "\n",
    "# Discretize the actions first, then put the observation normalization on top\n",
    "env = SimpleNormalizeObservation(\n",
    "    DualTemperatureControl(env, heating_steps=7, cooling_steps=7))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "a4c5a856-c0c2-4c8d-ac16-dcd35680f419",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 1: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 1 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers initialized.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Observation dimension: 9\n",
      "Action dimension: 14\n",
      "Creating rule-based models...\n",
      "Simulation Progress [Episode 1]: 100%|█| 100/100 [00:00<00:00, 257.33%/s, 100% c"
     ]
    }
   ],
   "source": [
    "state, _ = env.reset()\n",
    "state_dim = len(state)\n",
    "action_dim = env.action_space.n  # Number of discrete actions (now includes both heating and cooling)\n",
    "\n",
    "print(f\"Observation dimension: {state_dim}\")\n",
    "print(f\"Action dimension: {action_dim}\")\n",
    "\n",
    "# Define feature names for the DataFrame\n",
    "features = [f'obs_{i}' for i in range(state_dim)]\n",
    "\n",
    "print(\"Creating rule-based models...\")\n",
    "# Create models for each action (now includes both heating and cooling actions)\n",
    "num_rules = 30  # Number of rules per model\n",
    "\n",
    "\n",
    "def make_rule_models(n_models, n_rules):\n",
    "    \"\"\"Build a list of identically configured rule boosting estimators.\n",
    "\n",
    "    :param n_models: number of estimators to create (one per discrete action)\n",
    "    :param n_rules: value passed as ``num_rules`` to every estimator\n",
    "    :return: list of ``n_models`` separately constructed estimators, each with its\n",
    "        own weight update and loss objects\n",
    "    \"\"\"\n",
    "    return [GeneralRuleBoostingEstimator(\n",
    "        num_rules=n_rules,\n",
    "        objective_function=OrthogonalBoostingObjective,\n",
    "        weight_update_method=FullyCorrective(),\n",
    "        loss=SquaredLoss(),\n",
    "        reg=25.0,\n",
    "        search='greedy',\n",
    "        max_col_attr=20,  # Reduced from 500 for better performance\n",
    "        verbose=False) for _ in range(n_models)]\n",
    "\n",
    "\n",
    "# Main models used for training\n",
    "models = make_rule_models(action_dim, num_rules)\n",
    "\n",
    "# Secondary models for exploration\n",
    "models2 = make_rule_models(action_dim, num_rules)\n",
    "\n",
    "# Best models to track best performance\n",
    "best_models = make_rule_models(action_dim, num_rules)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "732ec4cd-97de-4bd9-ba45-d9d12c223b7e",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Alias: column_names refers to the same list object as features\n",
    "column_names = features"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4bc82cb4-ea0f-4735-99b4-b5caf36fbea0",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "7aa6c889",
   "metadata": {},
   "outputs": [],
   "source": [
    "# column_names = ['x', 'y', 'vx', 'vy', 'ax', 'ay', 'wx', 'wy']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "24f75485",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Seed the NumPy, PyTorch and Python random number generators\n",
    "np.random.seed(56470569)\n",
    "torch.manual_seed(84078709)\n",
    "random.seed(235870535)\n",
    "\n",
    "# Hyper-parameters (num_rules is rebound here; it was 30 when the model lists were built)\n",
    "num_rules = 20\n",
    "action_space = action_dim\n",
    "reg = 250.0\n",
    "nn_actor_train_iterations = 200\n",
    "rule_actor_train_iterations = 50\n",
    "# state_dim=8\n",
    "node_num = 128"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "84732b72",
   "metadata": {},
   "outputs": [],
   "source": [
    "def orthonormalization(Q):\n",
    "    \"\"\"Orthonormalize the columns of ``Q`` with the Gram-Schmidt procedure.\n",
    "\n",
    "    Every column has its projection onto the previously produced columns removed\n",
    "    and is then divided by its L-2 norm plus ``1e-6``. The offset avoids a division\n",
    "    by zero for a column that lies in the span of the earlier ones, so the result\n",
    "    columns are very slightly shorter than unit length.\n",
    "\n",
    "    :param Q: 2-d array whose columns are to be orthonormalized\n",
    "    :return: float array with the shape of ``Q`` holding the orthonormalized columns;\n",
    "        a matrix without columns yields an empty result instead of an IndexError\n",
    "    \"\"\"\n",
    "    n, k = Q.shape\n",
    "    O = np.zeros(shape=(n, k))\n",
    "    for i in range(k):\n",
    "        q = Q[:, i]\n",
    "        if i > 0:\n",
    "            # Remove the components along the columns produced so far\n",
    "            O_i = O[:, :i]\n",
    "            q = q - O_i.dot(O_i.T.dot(q))\n",
    "        # L-2 norm written inline so that the function is self-contained\n",
    "        O[:, i] = q / ((q * q).sum() ** 0.5 + 1e-6)\n",
    "    return O"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "973f1f9b",
   "metadata": {},
   "outputs": [],
   "source": [
    "def softmax1(action, values, other_values, location):\n",
    "    \"\"\"Softmax probability of ``action`` in every row.\n",
    "\n",
    "    ``values`` is inserted as column ``location`` into ``other_values`` to form the\n",
    "    full score matrix; the softmax is taken along each row.\n",
    "\n",
    "    :param action: column index (scalar or one index per row) whose probability is returned\n",
    "    :param values: 1-d array with one score per row for column ``location``\n",
    "    :param other_values: 2-d array with the scores of the remaining columns\n",
    "    :param location: column position at which ``values`` is inserted\n",
    "    :return: 1-d array with the selected softmax probability of every row\n",
    "    \"\"\"\n",
    "    all_values = np.insert(other_values, location, values, axis=1)\n",
    "    # Subtracting the row maximum leaves the softmax unchanged but keeps np.exp from\n",
    "    # overflowing to inf (which made the result nan for large scores)\n",
    "    shifted = all_values - np.max(all_values, axis=1, keepdims=True)\n",
    "    exps = np.exp(shifted)\n",
    "    res = exps[np.arange(values.shape[0]), action] / np.sum(exps, axis=1)\n",
    "    return res\n",
    "\n",
    "def norm(x):\n",
    "    \"\"\"\n",
    "    Euclidean (L-2) length of a vector.\n",
    "\n",
    "    :param x: array supporting element-wise multiplication and ``.sum()``\n",
    "    :return: square root of the sum of the squared entries of ``x``\n",
    "    \"\"\"\n",
    "    squared_sum = (x * x).sum()\n",
    "    return squared_sum ** 0.5\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "5b0af6ac",
   "metadata": {},
   "outputs": [],
   "source": [
    "class PiLoss:\n",
    "    \"\"\"Singleton policy loss: advantage-weighted negative log softmax probability.\n",
    "\n",
    "    All methods are static; ``values`` are the scores of the model for action\n",
    "    ``current`` and ``other_values`` the scores of the remaining actions.\n",
    "    \"\"\"\n",
    "    _instance = None\n",
    "\n",
    "    def __new__(cls):\n",
    "        # Create the shared instance on first use and hand it out afterwards\n",
    "        if cls._instance is None:\n",
    "            cls._instance = super().__new__(cls)\n",
    "        return cls._instance\n",
    "\n",
    "    @staticmethod\n",
    "    def __call__(action, values, advantage, other_values, current):\n",
    "        \"\"\"\n",
    "        Loss value per row: ``-log(p_action + 1e-6) * advantage``.\n",
    "\n",
    "        :param action: the action chosen\n",
    "        :param values: the values provided by current model\n",
    "        :param advantage: factor multiplied onto the negative log probability\n",
    "        :param other_values: the output by other models\n",
    "        :param current: the action represented by the current model\n",
    "        \"\"\"\n",
    "        prob_action = softmax1(action, values, other_values, current) + 1e-6\n",
    "        return -np.log(prob_action) * advantage\n",
    "\n",
    "    @staticmethod\n",
    "    def g(action, values, advantage, other_values, current):\n",
    "        \"\"\"First derivative with respect to ``values``, one entry per row.\"\"\"\n",
    "        prob_current = softmax1(current, values, other_values, current)\n",
    "        grad_if_chosen = -advantage * (1 - prob_current)\n",
    "        grad_otherwise = advantage * prob_current\n",
    "        return np.where(action == current, grad_if_chosen, grad_otherwise)\n",
    "\n",
    "    @staticmethod\n",
    "    def h(action, values, advantage, other_values, current):\n",
    "        \"\"\"Second derivative with respect to ``values``: ``advantage * p * (1 - p)``.\"\"\"\n",
    "        prob_current = softmax1(current, values, other_values, current)\n",
    "        return advantage * prob_current * (1 - prob_current)\n",
    "\n",
    "    @staticmethod\n",
    "    def __repr__():\n",
    "        return 'pi_loss'\n",
    "\n",
    "    @staticmethod\n",
    "    def __str__():\n",
    "        return 'pi_loss'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "67942365",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Registry mapping string identifiers to loss function objects\n",
    "loss_functions = {'pi_loss': PiLoss()}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "693287f4",
   "metadata": {},
   "outputs": [],
   "source": [
    "def loss_function(loss):\n",
    "    \"\"\"Resolve a loss specification to a loss function object.\n",
    "\n",
    "    :param loss: a callable (returned unchanged) or a string key of ``loss_functions``\n",
    "    :return: the callable itself, or the object registered under the given key\n",
    "    :raises KeyError: if ``loss`` is not callable and not a key of ``loss_functions``\n",
    "    \"\"\"\n",
    "    return loss if callable(loss) else loss_functions[loss]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "ae0af97c",
   "metadata": {},
   "outputs": [],
   "source": [
    "def calc_risk(loss, action, rules, states, reg, advantage, others, current):\n",
    "    \"\"\"Regularized risk of a rule ensemble.\n",
    "\n",
    "    :param loss: callable ``loss(action, predictions, advantage, others, current)``\n",
    "        returning one loss value per row\n",
    "    :param action: forwarded to ``loss``\n",
    "    :param rules: ensemble that is iterable over rules with a weight ``y`` and\n",
    "        callable on ``states`` to produce the predictions\n",
    "    :param states: input passed to ``rules``\n",
    "    :param reg: regularization strength\n",
    "    :param advantage: forwarded to ``loss``\n",
    "    :param others: forwarded to ``loss``\n",
    "    :param current: forwarded to ``loss``\n",
    "    :return: summed loss plus ``reg`` times half the sum of the squared rule weights\n",
    "    \"\"\"\n",
    "    rule_weights = np.array([member.y for member in rules])\n",
    "    summed_loss = sum(loss(action, rules(states), advantage, others, current))\n",
    "    penalty = reg * sum(rule_weights * rule_weights) / 2\n",
    "    return summed_loss + penalty"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "d06dc96b",
   "metadata": {},
   "outputs": [],
   "source": [
    "class FullyCorrectiveA2C:\n",
    "    \"\"\"Fully corrective weight update: re-fits the weights of all rules at once.\n",
    "\n",
    "    The minimized risk is the loss summed over all rows for the ensemble output\n",
    "    ``q_mat.dot(weights)`` plus the penalty ``reg * sum(weights ** 2) / 2``.\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, loss='pi_loss', reg=reg, solver='L-BFGS-B'):\n",
    "        \"\"\"\n",
    "        :param loss: loss object or string identifier resolved by ``loss_function``\n",
    "        :param reg: regularization strength (the default is the module-level ``reg``\n",
    "            as it was when this class was defined)\n",
    "        :param solver: 'GD', 'Line', or a ``method`` name for ``scipy.optimize.minimize``\n",
    "        \"\"\"\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        self.solver = solver\n",
    "\n",
    "    @staticmethod\n",
    "    def get_risk(loss, action, q_mat, reg, advantage, others, current):\n",
    "        \"\"\"Return a function that maps a weight vector to the regularized risk.\"\"\"\n",
    "        def sum_loss(weights):\n",
    "            return sum(loss(action, q_mat.dot(weights), advantage, others, current)) + reg * sum(weights * weights) / 2\n",
    "\n",
    "        return sum_loss\n",
    "\n",
    "    @staticmethod\n",
    "    def get_gradient(g, action, q_mat, reg, advantage, other, current):\n",
    "        \"\"\"Return a function that maps a weight vector to ``q_mat.T.dot(g) + reg * weights``.\"\"\"\n",
    "        def gradient(weights):\n",
    "            grad_vec = g(action, q_mat.dot(weights), advantage, other, current)\n",
    "            return q_mat.T.dot(grad_vec) + reg * weights\n",
    "\n",
    "        return gradient\n",
    "\n",
    "    @staticmethod\n",
    "    def get_hessian(h, action, q_mat, reg, advantage, other, current):\n",
    "        \"\"\"Return a function that maps a weight vector to ``q_mat.T diag(h) q_mat + reg * I``.\"\"\"\n",
    "        def hessian(weights):\n",
    "            h_vec = np.asarray(h(action, q_mat.dot(weights), advantage, other, current))\n",
    "            # Scale the columns of q_mat.T by h_vec instead of materializing the\n",
    "            # n x n matrix np.diag(h_vec); the product is the same\n",
    "            return (q_mat.T * h_vec).dot(q_mat) + reg * np.eye(len(weights))\n",
    "\n",
    "        return hessian\n",
    "\n",
    "    def calc_weight(self, data, action, rules, advantage, other, current):\n",
    "        \"\"\"Compute new weights for all rules.\n",
    "\n",
    "        :param data: input passed to the query ``q`` of every rule to build one\n",
    "            column of the query matrix per rule\n",
    "        :param action: chosen actions (converted with ``np.array``)\n",
    "        :param rules: indexable collection of rules providing ``q`` and the weight ``y``\n",
    "        :param advantage: forwarded to the loss\n",
    "        :param other: forwarded to the loss as the values of the other models\n",
    "        :param current: forwarded to the loss\n",
    "        :return: array with one weight per rule\n",
    "        \"\"\"\n",
    "        loss = self.loss\n",
    "        y = np.array(action)\n",
    "        # Adding a float zero vector turns each query result into a float column\n",
    "        q_mat = np.column_stack(\n",
    "            [rules[i].q(data) + np.zeros(len(data)) for i in range(len(rules))])\n",
    "        sum_loss = self.get_risk(loss, y, q_mat, self.reg, advantage, other, current)\n",
    "        gradient = self.get_gradient(loss.g, y, q_mat, self.reg, advantage, other, current)\n",
    "        # Start from the current rule weights; float dtype so in-place updates work\n",
    "        w = np.array([r.y for r in rules], dtype=float)\n",
    "\n",
    "        # NOTE(review): GoldenRatioSearch is not defined in the part of the notebook\n",
    "        # reviewed here; it has to exist before the 'GD' or 'Line' solver is used.\n",
    "        if self.solver == 'GD':  # Gradient descent\n",
    "            # Any vector different from w lets the first iteration run\n",
    "            old_w = w + 1.0\n",
    "            i = 0\n",
    "            while norm(old_w - w) > 1e-3 and i < 50:\n",
    "                old_w = np.array(w)\n",
    "                grad = gradient(w)\n",
    "                grad_norm = norm(grad)\n",
    "                if grad_norm == 0:\n",
    "                    break\n",
    "                p = -grad / grad_norm\n",
    "                w += GoldenRatioSearch(sum_loss, old_w, p, gradient).run() * p\n",
    "                i += 1\n",
    "        elif self.solver == 'Line':\n",
    "            grad = gradient(w)\n",
    "            grad_norm = norm(grad)\n",
    "            if grad_norm != 0:\n",
    "                p = -grad / grad_norm\n",
    "                distance = GoldenRatioSearch(sum_loss, w, p, gradient).run()\n",
    "                w += distance * p\n",
    "        else:\n",
    "            # Import the submodule explicitly: a bare ``import scipy`` does not\n",
    "            # guarantee that ``scipy.optimize`` is loaded in every SciPy version\n",
    "            from scipy.optimize import minimize\n",
    "            # get_hessian is available for solvers that accept ``hess``; it is not passed here\n",
    "            w = minimize(sum_loss, w, method=self.solver, jac=gradient,\n",
    "                         options={'disp': False}).x\n",
    "\n",
    "        return w"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "2d0c04a8",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ObjectFunction:\n",
    "    \"\"\"Base class of rule search objectives built from the derivatives of a loss.\n",
    "\n",
    "    The constructor evaluates the first (``g``) and second (``h``) derivative of the\n",
    "    loss per row and stores them, together with ``data`` and ``target``, sorted by\n",
    "    descending ``g / h``. Subclasses provide ``__call__`` and ``bound``.\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, data, target, predictions, loss, reg, advantage, other_values, current, rules=None):\n",
    "        \"\"\"\n",
    "        :param data: object supporting ``.iloc`` row selection (e.g. a DataFrame)\n",
    "        :param target: object supporting ``.iloc`` row selection (e.g. a Series)\n",
    "        :param predictions: current model output, zeros shaped like ``target`` when None\n",
    "        :param loss: loss object or string identifier resolved by ``loss_function``\n",
    "        :param reg: regularization strength (stored only)\n",
    "        :param advantage: forwarded to the loss derivatives\n",
    "        :param other_values: forwarded to the loss derivatives\n",
    "        :param current: forwarded to the loss derivatives\n",
    "        :param rules: accepted but not used by this base class\n",
    "        \"\"\"\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        if predictions is None:\n",
    "            predictions = np.zeros_like(target)\n",
    "        grad = np.array(self.loss.g(target, predictions, advantage, other_values, current))\n",
    "        # The small offset keeps the ratio below finite where the second derivative is zero\n",
    "        hess = np.array(self.loss.h(target, predictions, advantage, other_values, current)) + 1e-6\n",
    "        order = np.argsort(grad / hess)[::-1]\n",
    "        self.g, self.h = grad[order], hess[order]\n",
    "        # Rows are re-indexed 0..n-1 in the new order\n",
    "        self.data = data.iloc[order].reset_index(drop=True)\n",
    "        self.target = target.iloc[order].reset_index(drop=True)\n",
    "        self.n = len(target)\n",
    "\n",
    "    def __call__(self, ext):\n",
    "        \"\"\"Objective value of an extension; must be implemented by subclasses.\"\"\"\n",
    "        raise NotImplementedError()\n",
    "\n",
    "    def bound(self, ext):\n",
    "        \"\"\"Bound used by the search; must be implemented by subclasses.\"\"\"\n",
    "        raise NotImplementedError()\n",
    "\n",
    "    def search(self, method='greedy', verbose=False, **search_params):\n",
    "        \"\"\"Run a realkd search for a query optimizing this objective.\n",
    "\n",
    "        :param method: key into ``realkd.search.search_methods``\n",
    "        :param verbose: verbosity; a value of 2 or more prints the context size\n",
    "        :param search_params: passed to both ``Context.from_df`` and the search method\n",
    "        :return: result of the ``run()`` call of the selected search method\n",
    "        \"\"\"\n",
    "        from realkd.search import search_methods\n",
    "        ctx = Context.from_df(self.data, **search_params)\n",
    "        if verbose >= 2:\n",
    "            print(f'Created search context with {len(ctx.attributes)} attributes')\n",
    "        searcher = search_methods[method](ctx, self, self.bound, verbose=verbose, **search_params)\n",
    "        return searcher.run()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "eaec4413",
   "metadata": {},
   "outputs": [],
   "source": [
    "class OrthogonalBoostingObjective(ObjectFunction):\n",
    "    \"\"\"Objective scoring a query by its absolute gradient sum divided by the norm of\n",
    "    the part of the query vector that is orthogonal to the already selected rules.\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, data, target, advantage, other_values, current, predictions=None, loss=SquaredLoss, reg=1.0,\n",
    "                 rules=None,\n",
    "                 epsilon=1e-4, **kwargs):\n",
    "        \"\"\"\n",
    "        :param data: object supporting ``.iloc`` row selection (e.g. a DataFrame)\n",
    "        :param target: object supporting ``.iloc`` row selection (e.g. a Series)\n",
    "        :param advantage: forwarded to the loss gradient\n",
    "        :param other_values: forwarded to the loss gradient\n",
    "        :param current: forwarded to the loss gradient\n",
    "        :param predictions: current model output, zeros shaped like ``target`` when None\n",
    "        :param loss: loss object or string identifier resolved by ``loss_function``\n",
    "        :param reg: regularization strength (stored only)\n",
    "        :param rules: rules selected so far; None is treated as no rules\n",
    "        :param epsilon: added to the denominator of the objective value\n",
    "        :param kwargs: must contain ``orth_basis`` (indexed by data row) when ``rules``\n",
    "            is not empty\n",
    "        \"\"\"\n",
    "        super().__init__(data, target, predictions, loss, reg, advantage, other_values, current, rules)\n",
    "        self.rules = [] if rules is None else rules\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        self.epsilon = epsilon\n",
    "        predictions = np.zeros_like(\n",
    "            target) if predictions is None else predictions\n",
    "        g = np.array(self.loss.g(target, predictions, advantage, other_values, current))\n",
    "        self.n = len(target)\n",
    "        # Unlike the base class, rows are sorted by descending gradient only\n",
    "        order = np.argsort(g)[::-1]\n",
    "        self.g = g[order]\n",
    "        self.data = data.iloc[order].reset_index(drop=True)\n",
    "        self.target = target.iloc[order].reset_index(drop=True)\n",
    "        # Use self.rules so that the default rules=None does not fail in len()\n",
    "        if len(self.rules) != 0:\n",
    "            orth_basis = kwargs['orth_basis']\n",
    "            self.orth_basis = orth_basis[order]\n",
    "            # Project the gradient onto the orthogonal complement of the basis; the\n",
    "            # parentheses avoid forming the n x n matrix orth_basis @ orth_basis.T\n",
    "            self.g = self.g - self.orth_basis @ (self.orth_basis.T @ self.g)\n",
    "        else:\n",
    "            self.orth_basis = np.zeros(self.n)\n",
    "\n",
    "    def __call__(self, ext):\n",
    "        \"\"\"Objective value of the query selecting the rows ``ext``.\n",
    "\n",
    "        :param ext: array of selected row indices\n",
    "        :return: ``-inf`` for an empty selection, otherwise the absolute gradient sum\n",
    "            over the rows divided by the (orthogonal) norm of the query vector\n",
    "        \"\"\"\n",
    "        if len(ext) == 0:\n",
    "            return -inf\n",
    "        g_q = self.g[ext]\n",
    "        if len(self.rules) == 0:\n",
    "            # The norm of a 0/1 query vector is the square root of the number of\n",
    "            # selected rows (len(ext), as in fast_orth_norm), not of the index sum\n",
    "            return abs(g_q.sum()) / np.sqrt(len(ext))\n",
    "        length = self.fast_orth_norm(ext)\n",
    "        if length > 1e-4:\n",
    "            return abs(g_q.sum()) / (length + self.epsilon)\n",
    "        # Queries (almost) inside the span of the selected rules get no score\n",
    "        return 0\n",
    "\n",
    "    def fast_orth_norm(self, ext):\n",
    "        \"\"\"Norm of the component of the query vector orthogonal to ``orth_basis``.\n",
    "\n",
    "        Computed as ``sqrt(|len(ext) - sum_k (sum of basis column k over ext) ** 2|)``.\n",
    "        \"\"\"\n",
    "        deltas = self.orth_basis[ext]\n",
    "        length = len(ext)\n",
    "        okqi = abs(np.sum(deltas, axis=0))\n",
    "        q_para_norms = (okqi ** 2).sum()\n",
    "        q_orth_norms_sq = np.abs(length - q_para_norms)\n",
    "        return np.sqrt(q_orth_norms_sq)\n",
    "\n",
    "    def fast_para_norms_prefix(self, ext):\n",
    "        \"\"\"Orthogonal norms of all prefixes ``ext[:1], ext[:2], ...`` of ``ext``.\n",
    "\n",
    "        Same quantity as ``fast_orth_norm`` but evaluated for every prefix at once\n",
    "        through cumulative sums of the basis rows.\n",
    "        \"\"\"\n",
    "        deltas = self.orth_basis[ext]\n",
    "        length = len(ext)\n",
    "        okqi = np.cumsum(deltas, axis=0)\n",
    "        q_para_norms = (okqi ** 2).sum(axis=1)\n",
    "        q_orth_norms_sq = np.abs(np.arange(1, length + 1) - q_para_norms)\n",
    "        q_orth_norms = np.sqrt(q_orth_norms_sq)\n",
    "        return q_orth_norms\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "626cceb7",
   "metadata": {},
   "outputs": [],
   "source": [
    "class GeneralRuleBoostingEstimator(BaseEstimator):\n",
    "    \"\"\"Additive rule ensemble that is grown greedily, one rule per boosting round.\n",
    "\n",
    "    In every round the objective is instantiated on the current ensemble scores and\n",
    "    searched for a query; the query is appended as a new rule and the weights of all\n",
    "    rules are then recomputed by the weight update method.\n",
    "\n",
    "    :param num_rules: upper bound on the number of rules held by the ensemble\n",
    "    :param objective_function: callable that builds the objective of a round; it is called as\n",
    "        objective_function(data, target, advantage, other_values, current, predictions=...,\n",
    "        loss=..., reg=..., rules=..., orth_basis=...) and the result must offer search()\n",
    "    :param weight_update_method: object whose calc_weight(data, target, rules, advantage,\n",
    "        other_values, current) returns one weight per rule; its loss and reg attributes\n",
    "        are overwritten by this constructor\n",
    "    :param loss: loss specification, resolved through loss_function\n",
    "    :param reg: regularisation value; the default is the module-level reg captured when\n",
    "        this class is defined\n",
    "    :param search: search method name forwarded to the search() of the objective\n",
    "    :param max_col_attr: stored, and used to build the default search_params\n",
    "    :param search_params: keyword arguments forwarded to the search() of the objective\n",
    "    :param verbose: if true, every newly created rule is printed during fit\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, num_rules, objective_function, weight_update_method, loss='squared', reg=reg,\n",
    "                 search='greedy', max_col_attr=10,\n",
    "                 search_params=None, verbose=False):\n",
    "        if search_params is None:\n",
    "            search_params = {'order': 'bestboundfirst', 'apx': 1.0, 'max_depth': None, 'discretization': qcut,\n",
    "                             'max_col_attr': max_col_attr}\n",
    "        self.num_rules = num_rules\n",
    "        # Budget for the accumulated (1 + len(q)) of the rules added within one fit call.\n",
    "        self.num_components = 500\n",
    "        self.objective = objective_function\n",
    "        self.objective_function = objective_function\n",
    "        self.max_col_attr = max_col_attr\n",
    "        self.weight_update_method = weight_update_method\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        self.weight_update_method.loss = loss\n",
    "        self.weight_update_method.reg = reg\n",
    "        self.verbose = verbose\n",
    "        self.search = search\n",
    "        self.rules_ = AdditiveRuleEnsemble([])\n",
    "        self.search_params = search_params\n",
    "        self.history = []\n",
    "        self.time = []\n",
    "\n",
    "    def set_reg(self, reg):\n",
    "        \"\"\"Store reg on the estimator, on the objective and on the weight update method.\"\"\"\n",
    "        self.reg = reg\n",
    "        self.objective.reg = reg\n",
    "        self.weight_update_method.reg = reg\n",
    "\n",
    "    def fit(self, data, target, advantage, other_values, current, has_origin_rules=False, verbose=False):\n",
    "        \"\"\"Add rules until num_rules rules exist or the component budget is exhausted.\n",
    "\n",
    "        data, target, advantage, other_values and current are forwarded unchanged to the\n",
    "        objective and to the calc_weight of the weight update method.\n",
    "\n",
    "        :param has_origin_rules: if false, history, timings and existing rules are dropped\n",
    "            first; if true, boosting resumes from the rules already stored in rules_\n",
    "        :param verbose: forwarded to the search() of the objective\n",
    "        :return: self\n",
    "        \"\"\"\n",
    "        if has_origin_rules and len(self.rules_) > 0:\n",
    "            q_mat = np.column_stack(\n",
    "                [self.rules_[i].q(data) + np.zeros(len(data)) for i in range(len(self.rules_))])\n",
    "            orth_basis = orthonormalization(q_mat)\n",
    "        else:\n",
    "            # Also reached when resuming from an empty ensemble: np.column_stack raises on\n",
    "            # an empty list, so boosting then simply starts without a basis.\n",
    "            if not has_origin_rules:\n",
    "                self.history = []\n",
    "                self.time = []\n",
    "                self.rules_.members = []\n",
    "            orth_basis = np.array([])\n",
    "        num_components = 0\n",
    "        while len(self.rules_) < self.num_rules and num_components < self.num_components:\n",
    "            start_time = datetime.now()\n",
    "            # Search for a rule\n",
    "            scores = self.rules_(data)\n",
    "            obj = self.objective(data, target, advantage, other_values, current, predictions=scores,\n",
    "                                 loss=self.loss, reg=self.reg, rules=self.rules_, orth_basis=orth_basis)\n",
    "            q = obj.search(method=self.search, verbose=verbose,\n",
    "                           **self.search_params)\n",
    "            if hasattr(self.objective, 'opt_weight') and callable(getattr(self.objective, 'opt_weight')):\n",
    "                y = obj.opt_weight(q)\n",
    "            else:\n",
    "                y = 1.0  # np.random.random()\n",
    "            q_vec = q(data)\n",
    "            num_components += (1 + len(q))\n",
    "            if len(orth_basis) == 0:\n",
    "                # A query selecting no row has zero norm; dividing by 1 instead keeps the\n",
    "                # basis vector at zero rather than filling it with NaN.\n",
    "                q_norm = norm(q_vec)\n",
    "                basis = q_vec / (q_norm if q_norm > 0 else 1.0)\n",
    "                orth_basis = np.array([basis]).T\n",
    "            else:\n",
    "                # Remove the part already spanned by the basis, then normalise the rest.\n",
    "                basis = q_vec - orth_basis.dot(orth_basis.T.dot(q_vec))\n",
    "                basis = basis / (norm(basis) + 1e-6)\n",
    "                orth_basis = np.hstack((orth_basis, np.array([basis]).T))\n",
    "            rule = Rule(q, y)\n",
    "            if self.verbose:\n",
    "                print(rule)\n",
    "            self.rules_.append(rule)\n",
    "            # Calculate weights\n",
    "            weights = self.weight_update_method.calc_weight(\n",
    "                data, target, self.rules_, advantage, other_values, current)\n",
    "            for i in range(len(self.rules_)):\n",
    "                self.rules_[i].y = weights[i]\n",
    "            # Keep a snapshot copy of the ensemble as it looks after this round.\n",
    "            self.history.append(AdditiveRuleEnsemble(\n",
    "                [Rule(q=rule.q, y=rule.y) for rule in self.rules_.members]))\n",
    "            end_time = datetime.now()\n",
    "            self.time.append(str(end_time - start_time))\n",
    "        return self\n",
    "\n",
    "    def predict(self, data):\n",
    "        \"\"\"Return the ensemble scores for data mapped through the predictions of the loss.\"\"\"\n",
    "        loss = loss_function(self.loss)\n",
    "        to_predictions = getattr(loss, 'predictions', None)\n",
    "        if to_predictions is None:\n",
    "            # Fall back to the misspelled name this method used to call, in case a\n",
    "            # custom loss only provides that one.\n",
    "            to_predictions = loss.preidictions\n",
    "        return to_predictions(self.rules_(data))\n",
    "\n",
    "    def decision_function(self, data):\n",
    "        \"\"\"Return the raw ensemble scores for data.\"\"\"\n",
    "        return self.rules_(data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "b50ce787",
   "metadata": {},
   "outputs": [],
   "source": [
    "# class Actor(nn.Module):\n",
    "#     def __init__(self, action_space, node=16):\n",
    "#         super(Actor, self).__init__()\n",
    "#         self.fc1 = nn.Linear(4, node)  \n",
    "# #         self.fc1_ = nn.Linear(node, node)\n",
    "#         self.fc2 = nn.Linear(node, action_space)\n",
    "\n",
    "#     def forward(self, state):\n",
    "#         x = F.relu(self.fc1(state))\n",
    "# #         x = F.relu(self.fc1_(x))\n",
    "#         x = self.fc2(x)\n",
    "#         return x"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "id": "84b0ee0a",
   "metadata": {},
   "outputs": [],
   "source": [
    "def copy_rules(origin_rules):\n",
    "    \"\"\"Return a new AdditiveRuleEnsemble holding a fresh Rule(q, y) for every input rule.\n",
    "\n",
    "    The Rule objects are new, while each q and y is passed on as is.\n",
    "    \"\"\"\n",
    "    return AdditiveRuleEnsemble(\n",
    "        [Rule(q=origin_rules[idx].q, y=origin_rules[idx].y) for idx in range(len(origin_rules))])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "id": "bb3fcc8c",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ActorRule():\n",
    "    \"\"\"Actor made of two parallel lists of rule-boosting estimators.\n",
    "\n",
    "    model and best_model each hold one GeneralRuleBoostingEstimator per index in\n",
    "    range(action_space). Calling the instance scores a state with model, while\n",
    "    predict scores it with best_model.\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, action_space=action_space, num_rules=num_rules):\n",
    "        def build_estimator():\n",
    "            # Every estimator receives its own weight-update and loss objects.\n",
    "            return GeneralRuleBoostingEstimator(\n",
    "                num_rules=num_rules, objective_function=OrthogonalBoostingObjective,\n",
    "                weight_update_method=FullyCorrectiveA2C(), loss=PiLoss(),\n",
    "                reg=reg, search='greedy', max_col_attr=80, verbose=False)\n",
    "\n",
    "        self.action_space = action_space\n",
    "        self.model = [build_estimator() for _ in range(action_space)]\n",
    "        self.best_model = [build_estimator() for _ in range(action_space)]\n",
    "\n",
    "    def __call__(self, state):\n",
    "        \"\"\"Return an array with the rule-ensemble output of every estimator in model.\"\"\"\n",
    "        return np.array([self.model[idx].rules_(state) for idx in range(len(self.model))])\n",
    "\n",
    "    def predict(self, state):\n",
    "        \"\"\"Return an array with the rule-ensemble output of every estimator in best_model.\"\"\"\n",
    "        # The index range is deliberately taken from model, as before.\n",
    "        return np.array([self.best_model[idx].rules_(state) for idx in range(len(self.model))])\n",
    "\n",
    "\n",
    "def update_rules(estimator: GeneralRuleBoostingEstimator, x, y, adv, other_values, current):\n",
    "    \"\"\"Try to improve an estimator by dropping its weakest rule and boosting again.\n",
    "\n",
    "    Rules sharing the same query (compared through str) are merged by summing their\n",
    "    weights. The merged rule with the smallest absolute weight is removed, the weights\n",
    "    of the remaining rules are recomputed and estimator.fit is resumed from them. If the\n",
    "    resulting risk is larger than the risk before the update, the previous ensemble is\n",
    "    restored.\n",
    "\n",
    "    x, y, adv, other_values and current are forwarded to calc_risk, calc_weight and fit.\n",
    "\n",
    "    :param estimator: estimator whose rules_ are updated in place\n",
    "    :return: the same estimator object\n",
    "    \"\"\"\n",
    "    original_rules = copy_rules(estimator.rules_)\n",
    "    origin_risk = calc_risk(PiLoss(), y, original_rules, x, estimator.reg, adv, other_values, current)\n",
    "\n",
    "    # Merge duplicates: signed weight sum per distinct query, in first-seen order.\n",
    "    merged_weights = {}\n",
    "    distinct_queries = []\n",
    "    for i in range(len(estimator.rules_)):\n",
    "        rule = estimator.rules_[i]\n",
    "        q_str = str(rule.q)\n",
    "        if q_str in merged_weights:\n",
    "            merged_weights[q_str] += rule.y\n",
    "        else:\n",
    "            merged_weights[q_str] = rule.y\n",
    "            distinct_queries.append(rule.q)\n",
    "\n",
    "    # Only the ranking uses the magnitude. The retained rules keep their signed weights,\n",
    "    # whereas previously the weights were replaced by their absolute values before being\n",
    "    # handed to the weight update.\n",
    "    min_weight_query = min(merged_weights, key=lambda q_str: abs(merged_weights[q_str]))\n",
    "    rules = [Rule(q=query, y=merged_weights[str(query)])\n",
    "             for query in distinct_queries if str(query) != min_weight_query]\n",
    "    if len(rules) == 0:\n",
    "        # A single distinct query: keep it rather than leaving the ensemble empty.\n",
    "        rules = [Rule(q=distinct_queries[0], y=merged_weights[str(distinct_queries[0])])]\n",
    "    new_rules = AdditiveRuleEnsemble(rules)\n",
    "    weights = FullyCorrectiveA2C(loss_function('pi_loss'), estimator.reg).calc_weight(x, y, new_rules, adv,\n",
    "                                                                                      other_values, current)\n",
    "    for i in range(len(new_rules)):\n",
    "        new_rules[i].y = weights[i]\n",
    "    estimator.rules_ = new_rules\n",
    "    estimator.fit(x, y, adv, other_values, current, has_origin_rules=True)\n",
    "    weights = FullyCorrectiveA2C(loss_function('pi_loss'), estimator.reg).calc_weight(x, y, estimator.rules_, adv,\n",
    "                                                                                      other_values, current)\n",
    "    for i in range(len(estimator.rules_)):\n",
    "        estimator.rules_[i].y = weights[i]\n",
    "    new_risk = calc_risk(PiLoss(), y, estimator.rules_, x, estimator.reg, adv, other_values, current)\n",
    "    if new_risk > origin_risk:\n",
    "        # The update made things worse: roll back to the ensemble saved at the start.\n",
    "        estimator.rules_ = copy_rules(original_rules)\n",
    "    return estimator"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "id": "2824981f",
   "metadata": {},
   "outputs": [],
   "source": [
    "class Critic(nn.Module):\n",
    "    \"\"\"Two-layer network: Linear(state_dim, node), tanh, then Linear(node, 1).\"\"\"\n",
    "\n",
    "    def __init__(self, node=node_num):\n",
    "        super().__init__()\n",
    "        self.fc1 = nn.Linear(state_dim, node)\n",
    "        self.fc2 = nn.Linear(node, 1)\n",
    "\n",
    "    def forward(self, state):\n",
    "        \"\"\"Return the single-unit output of fc2 for the given state tensor.\"\"\"\n",
    "        hidden = torch.tanh(self.fc1(state))\n",
    "        return self.fc2(hidden)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "id": "6b6e2dd7",
   "metadata": {},
   "outputs": [],
   "source": [
    "gamma = 0.99  # presumably the reward discount factor -- confirm against the training loop\n",
    "actor = ActorRule()\n",
    "# nn.Module.to returns the module itself, so the two-step form yields the same object.\n",
    "critic = Critic()\n",
    "critic = critic.to(device)\n",
    "critic_optimizer = optim.AdamW(params=critic.parameters(), lr=5e-4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "id": "ae072cc5",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ActorNet(nn.Module):\n",
    "    \"\"\"Two-layer network: Linear(state_dim, hidden_dim), ReLU, then Linear(hidden_dim, action_space).\"\"\"\n",
    "\n",
    "    def __init__(self, hidden_dim=node_num):\n",
    "        super(ActorNet, self).__init__()\n",
    "        self.hidden = nn.Linear(state_dim, hidden_dim)\n",
    "        self.output = nn.Linear(hidden_dim, action_space)\n",
    "\n",
    "    def forward(self, s):\n",
    "        \"\"\"Return the un-normalised outputs (logits) of the output layer for input s.\"\"\"\n",
    "        activated = F.relu(self.hidden(s))\n",
    "        return self.output(activated)\n",
    "\n",
    "\n",
    "# nn.Module.to returns the module itself, so the two-step form yields the same object.\n",
    "actor_func = ActorNet()\n",
    "actor_func = actor_func.to(device)\n",
    "value_func = critic  # second name for the existing critic object, not a copy"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "id": "e18bebc8",
   "metadata": {},
   "outputs": [],
   "source": [
    "def position_to_index(position, width=12):\n",
    "    \"\"\"Split a flat position into [position % width, position // width].\n",
    "\n",
    "    Note the order of the result: the remainder (offset inside a stride of width)\n",
    "    comes first and the quotient (number of complete strides) second.\n",
    "\n",
    "    :param position: flat position\n",
    "    :param width: stride of the flat layout; the default 12 is the value that used to\n",
    "        be hard-coded here\n",
    "    :return: two-element list [position % width, position // width]\n",
    "    \"\"\"\n",
    "    return [position % width, position // width]\n",
    "\n",
    "def one_hot_state(s, state_dim=8):\n",
    "    \"\"\"Return a float32 vector of length state_dim that is 1.0 at index s and 0.0 elsewhere.\"\"\"\n",
    "    encoding = np.zeros(state_dim, dtype=np.float32)\n",
    "    encoding[s] = 1.0\n",
    "    return encoding"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "id": "c565d5ef",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m                      \n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 2: demo-v1\u001b[0m                           \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m                         \n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m                \n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m                  \n",
      "Simulation Progress [Episode 1]: 100%|█| 100/100 [00:00<00:00, 169.32%/s, 100% c\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 2 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 0 with rewards -1899716.9293954847 with 1440 steps 98.20%/s, 100% co\n",
      "Simulation Progress [Episode 2]: 100%|█| 100/100 [00:02<00:00, 33.52%/s, 100% co\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 3: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 3 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 1 with rewards -1899716.9293954847 with 1440 steps 99.53%/s, 100% co\n",
      "Simulation Progress [Episode 3]: 100%|█| 100/100 [00:03<00:00, 32.82%/s, 100% co\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 4: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 4 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 2 with rewards -1899716.9293954847 with 1440 steps 86.31%/s, 100% co\n",
      "Simulation Progress [Episode 4]: 100%|█| 100/100 [00:03<00:00, 32.28%/s, 100% co\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 5: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 5 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 3 with rewards -1899716.9293954847 with 1440 steps 91.56%/s, 100% co\n",
      "Simulation Progress [Episode 5]: 100%|█| 100/100 [00:03<00:00, 32.77%/s, 100% co\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 6: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 6 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 4 with rewards -1899716.9293954847 with 1440 steps 91.93%/s, 100% co\n",
      "Simulation Progress [Episode 6]: 100%|█| 100/100 [00:03<00:00, 32.81%/s, 100% co\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 7: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 7 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 5 with rewards -1899716.9293954847 with 1440 steps 91.70%/s, 100% co\n",
      "Simulation Progress [Episode 7]: 100%|█| 100/100 [00:03<00:00, 32.37%/s, 100% co\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 8: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 8 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 6 with rewards -1899716.9293954847 with 1440 steps 84.91%/s, 100% co\n",
      "Simulation Progress [Episode 8]: 100%|█| 100/100 [00:03<00:00, 32.64%/s, 100% co\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 9: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 9 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 7 with rewards -1899716.9293954847 with 1440 steps 92.57%/s, 100% co\n",
      "Simulation Progress [Episode 9]: 100%|█| 100/100 [00:03<00:00, 32.63%/s, 100% co\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 10: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 10 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 8 with rewards -1899716.9293954847 with 1440 steps, 88.61%/s, 100% c\n",
      "Simulation Progress [Episode 10]: 100%|█| 100/100 [00:03<00:00, 32.20%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 11: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 11 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 9 with rewards -1899716.9293954847 with 1440 steps, 91.39%/s, 100% c\n",
      "Simulation Progress [Episode 11]: 100%|█| 100/100 [00:03<00:00, 32.65%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 12: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 12 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 10 with rewards -1899716.9293954847 with 1440 steps 90.12%/s, 100% c\n",
      "Simulation Progress [Episode 12]: 100%|█| 100/100 [00:03<00:00, 32.24%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 13: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 13 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 11 with rewards -1899716.9293954847 with 1440 steps 105.24%/s, 100% \n",
      "Simulation Progress [Episode 13]: 100%|█| 100/100 [00:02<00:00, 34.30%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 14: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 14 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 12 with rewards -1899716.9293954847 with 1440 steps 96.17%/s, 100% c\n",
      "Simulation Progress [Episode 14]: 100%|█| 100/100 [00:03<00:00, 33.03%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 15: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 15 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 13 with rewards -1899716.9293954847 with 1440 steps 99.00%/s, 100% c\n",
      "Simulation Progress [Episode 15]: 100%|█| 100/100 [00:02<00:00, 33.41%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 16: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 16 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 14 with rewards -1899716.9293954847 with 1440 steps 104.97%/s, 100% \n",
      "Simulation Progress [Episode 16]: 100%|█| 100/100 [00:02<00:00, 33.90%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 17: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 17 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 15 with rewards -1899716.9293954847 with 1440 steps 103.81%/s, 100% \n",
      "Simulation Progress [Episode 17]: 100%|█| 100/100 [00:02<00:00, 34.18%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 18: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 18 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 16 with rewards -1899716.9293954847 with 1440 steps 104.31%/s, 100% \n",
      "Simulation Progress [Episode 18]: 100%|█| 100/100 [00:03<00:00, 32.93%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 19: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 19 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 17 with rewards -1899716.9293954847 with 1440 steps 93.74%/s, 100% c\n",
      "Simulation Progress [Episode 19]: 100%|█| 100/100 [00:03<00:00, 32.99%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 20: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 20 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 18 with rewards -1899716.9293954847 with 1440 steps 95.79%/s, 100% c\n",
      "Simulation Progress [Episode 20]: 100%|█| 100/100 [00:02<00:00, 33.36%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 21: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 21 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 19 with rewards -1899716.9293954847 with 1440 steps 89.30%/s, 100% c\n",
      "Simulation Progress [Episode 21]: 100%|█| 100/100 [00:03<00:00, 32.63%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 22: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 22 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 20 with rewards -1899716.9293954847 with 1440 steps 101.24%/s, 100% \n",
      "Simulation Progress [Episode 22]: 100%|█| 100/100 [00:02<00:00, 33.50%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 23: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 23 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 21 with rewards -1899716.9293954847 with 1440 steps 106.05%/s, 100% \n",
      "Simulation Progress [Episode 23]: 100%|█| 100/100 [00:02<00:00, 34.18%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 24: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 24 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 22 with rewards -1899716.9293954847 with 1440 steps 95.94%/s, 100% c\n",
      "Simulation Progress [Episode 24]: 100%|█| 100/100 [00:02<00:00, 33.79%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 25: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 25 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 23 with rewards -1899716.9293954847 with 1440 steps 103.52%/s, 100% \n",
      "Simulation Progress [Episode 25]: 100%|█| 100/100 [00:02<00:00, 33.60%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 26: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 26 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 24 with rewards -1899716.9293954847 with 1440 steps 104.81%/s, 100% \n",
      "Simulation Progress [Episode 26]: 100%|█| 100/100 [00:02<00:00, 34.24%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 27: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 27 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 25 with rewards -1899716.9293954847 with 1440 steps 103.20%/s, 100% \n",
      "Simulation Progress [Episode 27]: 100%|█| 100/100 [00:02<00:00, 34.00%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 28: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 28 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 26 with rewards -1899716.9293954847 with 1440 steps 99.59%/s, 100% c\n",
      "Simulation Progress [Episode 28]: 100%|█| 100/100 [00:02<00:00, 34.12%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 29: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 29 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 27 with rewards -1899716.9293954847 with 1440 steps 100.64%/s, 100% \n",
      "Simulation Progress [Episode 29]: 100%|█| 100/100 [00:02<00:00, 34.12%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 30: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 30 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 28 with rewards -1899716.9293954847 with 1440 steps 103.61%/s, 100% \n",
      "Simulation Progress [Episode 30]: 100%|█| 100/100 [00:02<00:00, 34.26%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 31: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 31 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 29 with rewards -1899716.9293954847 with 1440 steps 96.68%/s, 100% c\n",
      "Simulation Progress [Episode 31]: 100%|█| 100/100 [00:02<00:00, 33.99%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 32: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 32 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 30 with rewards -1899716.9293954847 with 1440 steps 105.16%/s, 100% \n",
      "Simulation Progress [Episode 32]: 100%|█| 100/100 [00:02<00:00, 34.32%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 33: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 33 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 31 with rewards -1899716.9293954847 with 1440 steps 101.59%/s, 100% \n",
      "Simulation Progress [Episode 33]: 100%|█| 100/100 [00:02<00:00, 34.17%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 34: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 34 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 32 with rewards -1899716.9293954847 with 1440 steps 102.60%/s, 100% \n",
      "Simulation Progress [Episode 34]: 100%|█| 100/100 [00:02<00:00, 33.74%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 35: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 35 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 33 with rewards -1899716.9293954847 with 1440 steps 101.39%/s, 100% \n",
      "Simulation Progress [Episode 35]: 100%|█| 100/100 [00:02<00:00, 34.15%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 36: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 36 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 34 with rewards -1899716.9293954847 with 1440 steps 103.67%/s, 100% \n",
      "Simulation Progress [Episode 36]: 100%|█| 100/100 [00:02<00:00, 34.32%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 37: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 37 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 35 with rewards -1899716.9293954847 with 1440 steps 103.83%/s, 100% \n",
      "Simulation Progress [Episode 37]: 100%|█| 100/100 [00:02<00:00, 34.17%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 38: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 38 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 36 with rewards -1899716.9293954847 with 1440 steps 104.54%/s, 100% \n",
      "Simulation Progress [Episode 38]: 100%|█| 100/100 [00:02<00:00, 34.24%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 39: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 39 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 37 with rewards -1899716.9293954847 with 1440 steps 104.11%/s, 100% \n",
      "Simulation Progress [Episode 39]: 100%|█| 100/100 [00:02<00:00, 34.21%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 40: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 40 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 38 with rewards -1899716.9293954847 with 1440 steps 94.46%/s, 100% c\n",
      "Simulation Progress [Episode 40]: 100%|█| 100/100 [00:02<00:00, 33.47%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 41: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 41 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 39 with rewards -1899716.9293954847 with 1440 steps 104.19%/s, 100% \n",
      "Simulation Progress [Episode 41]: 100%|█| 100/100 [00:02<00:00, 34.29%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 42: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 42 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 40 with rewards -1899716.9293954847 with 1440 steps 104.49%/s, 100% \n",
      "Simulation Progress [Episode 42]: 100%|█| 100/100 [00:02<00:00, 34.42%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 43: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 43 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 41 with rewards -1899716.9293954847 with 1440 steps 104.81%/s, 100% \n",
      "Simulation Progress [Episode 43]: 100%|█| 100/100 [00:02<00:00, 34.33%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 44: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 44 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 42 with rewards -1899716.9293954847 with 1440 steps 104.19%/s, 100% \n",
      "Simulation Progress [Episode 44]: 100%|█| 100/100 [00:02<00:00, 34.04%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 45: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 45 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 43 with rewards -1899716.9293954847 with 1440 steps 102.15%/s, 100% \n",
      "Simulation Progress [Episode 45]: 100%|█| 100/100 [00:02<00:00, 34.32%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 46: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 46 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 44 with rewards -1899716.9293954847 with 1440 steps 103.02%/s, 100% \n",
      "Simulation Progress [Episode 46]: 100%|█| 100/100 [00:02<00:00, 34.19%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 47: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 47 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 45 with rewards -1899716.9293954847 with 1440 steps 104.13%/s, 100% \n",
      "Simulation Progress [Episode 47]: 100%|█| 100/100 [00:02<00:00, 34.42%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 48: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 48 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 46 with rewards -1899716.9293954847 with 1440 steps 105.49%/s, 100% \n",
      "Simulation Progress [Episode 48]: 100%|█| 100/100 [00:02<00:00, 34.38%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 49: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 49 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 47 with rewards -1899716.9293954847 with 1440 steps 103.10%/s, 100% \n",
      "Simulation Progress [Episode 49]: 100%|█| 100/100 [00:02<00:00, 34.23%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 50: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 50 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 48 with rewards -1899716.9293954847 with 1440 steps 103.98%/s, 100% \n",
      "Simulation Progress [Episode 50]: 100%|█| 100/100 [00:02<00:00, 34.40%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 51: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 51 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 49 with rewards -1899716.9293954847 with 1440 steps 103.30%/s, 100% \n",
      "Simulation Progress [Episode 51]: 100%|█| 100/100 [00:02<00:00, 34.26%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 52: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 52 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 50 with rewards -1899716.9293954847 with 1440 steps 104.08%/s, 100% \n",
      "Simulation Progress [Episode 52]: 100%|█| 100/100 [00:02<00:00, 34.27%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 53: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 53 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 51 with rewards -1899716.9293954847 with 1440 steps 106.20%/s, 100% \n",
      "Simulation Progress [Episode 53]: 100%|█| 100/100 [00:02<00:00, 34.29%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 54: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 54 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 52 with rewards -1899716.9293954847 with 1440 steps 105.65%/s, 100% \n",
      "Simulation Progress [Episode 54]: 100%|█| 100/100 [00:02<00:00, 34.50%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 55: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 55 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 53 with rewards -1899716.9293954847 with 1440 steps 104.22%/s, 100% \n",
      "Simulation Progress [Episode 55]: 100%|█| 100/100 [00:02<00:00, 34.35%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 56: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 56 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 54 with rewards -1899716.9293954847 with 1440 steps 105.19%/s, 100% \n",
      "Simulation Progress [Episode 56]: 100%|█| 100/100 [00:02<00:00, 34.42%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 57: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 57 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 55 with rewards -1899716.9293954847 with 1440 steps 104.90%/s, 100% \n",
      "Simulation Progress [Episode 57]: 100%|█| 100/100 [00:02<00:00, 34.40%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 58: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 58 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 56 with rewards -1899716.9293954847 with 1440 steps 105.32%/s, 100% \n",
      "Simulation Progress [Episode 58]: 100%|█| 100/100 [00:02<00:00, 34.39%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 59: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 59 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 57 with rewards -1899716.9293954847 with 1440 steps 97.89%/s, 100% c\n",
      "Simulation Progress [Episode 59]: 100%|█| 100/100 [00:02<00:00, 33.58%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 60: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 60 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 58 with rewards -1899716.9293954847 with 1440 steps 107.01%/s, 100% \n",
      "Simulation Progress [Episode 60]: 100%|█| 100/100 [00:02<00:00, 34.46%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 61: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 61 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 59 with rewards -1899716.9293954847 with 1440 steps 106.30%/s, 100% \n",
      "Simulation Progress [Episode 61]: 100%|█| 100/100 [00:02<00:00, 34.42%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 62: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 62 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 60 with rewards -1899716.9293954847 with 1440 steps 108.38%/s, 100% \n",
      "Simulation Progress [Episode 62]: 100%|█| 100/100 [00:02<00:00, 34.41%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 63: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 63 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 61 with rewards -1899716.9293954847 with 1440 steps 109.84%/s, 100% \n",
      "Simulation Progress [Episode 63]: 100%|█| 100/100 [00:02<00:00, 34.54%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 64: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 64 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 62 with rewards -1899716.9293954847 with 1440 steps 108.28%/s, 100% \n",
      "Simulation Progress [Episode 64]: 100%|█| 100/100 [00:02<00:00, 34.42%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 65: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 65 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 63 with rewards -1899716.9293954847 with 1440 steps 108.05%/s, 100% \n",
      "Simulation Progress [Episode 65]: 100%|█| 100/100 [00:02<00:00, 34.39%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 66: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 66 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 64 with rewards -1899716.9293954847 with 1440 steps 108.85%/s, 100% \n",
      "Simulation Progress [Episode 66]: 100%|█| 100/100 [00:02<00:00, 34.48%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 67: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 67 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 65 with rewards -1899716.9293954847 with 1440 steps 107.85%/s, 100% \n",
      "Simulation Progress [Episode 67]: 100%|█| 100/100 [00:02<00:00, 34.31%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 68: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 68 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 66 with rewards -1899716.9293954847 with 1440 steps 109.56%/s, 100% \n",
      "Simulation Progress [Episode 68]: 100%|█| 100/100 [00:02<00:00, 34.46%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 69: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 69 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 67 with rewards -1899716.9293954847 with 1440 steps 105.76%/s, 100% \n",
      "Simulation Progress [Episode 69]: 100%|█| 100/100 [00:02<00:00, 34.38%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 70: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 70 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 68 with rewards -1899716.9293954847 with 1440 steps 106.09%/s, 100% \n",
      "Simulation Progress [Episode 70]: 100%|█| 100/100 [00:02<00:00, 34.48%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 71: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 71 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 69 with rewards -1899716.9293954847 with 1440 steps 107.98%/s, 100% \n",
      "Simulation Progress [Episode 71]: 100%|█| 100/100 [00:02<00:00, 34.35%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 72: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 72 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 70 with rewards -1899716.9293954847 with 1440 steps 107.94%/s, 100% \n",
      "Simulation Progress [Episode 72]: 100%|█| 100/100 [00:02<00:00, 34.51%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 73: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 73 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 71 with rewards -1899716.9293954847 with 1440 steps 107.02%/s, 100% \n",
      "Simulation Progress [Episode 73]: 100%|█| 100/100 [00:02<00:00, 34.53%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 74: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 74 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 72 with rewards -1899716.9293954847 with 1440 steps 106.79%/s, 100% \n",
      "Simulation Progress [Episode 74]: 100%|█| 100/100 [00:02<00:00, 34.58%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 75: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 75 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 73 with rewards -1899716.9293954847 with 1440 steps 105.94%/s, 100% \n",
      "Simulation Progress [Episode 75]: 100%|█| 100/100 [00:02<00:00, 34.50%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 76: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 76 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 74 with rewards -1899716.9293954847 with 1440 steps 109.54%/s, 100% \n",
      "Simulation Progress [Episode 76]: 100%|█| 100/100 [00:02<00:00, 34.79%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 77: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 77 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 75 with rewards -1899716.9293954847 with 1440 steps 108.52%/s, 100% \n",
      "Simulation Progress [Episode 77]: 100%|█| 100/100 [00:02<00:00, 34.42%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 78: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 78 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 76 with rewards -1899716.9293954847 with 1440 steps 102.20%/s, 100% \n",
      "Simulation Progress [Episode 78]: 100%|█| 100/100 [00:02<00:00, 33.81%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 79: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 79 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 77 with rewards -1899716.9293954847 with 1440 steps 107.56%/s, 100% \n",
      "Simulation Progress [Episode 79]: 100%|█| 100/100 [00:02<00:00, 34.58%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 80: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 80 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 78 with rewards -1899716.9293954847 with 1440 steps 101.33%/s, 100% \n",
      "Simulation Progress [Episode 80]: 100%|█| 100/100 [00:02<00:00, 33.86%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 81: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 81 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 79 with rewards -1899716.9293954847 with 1440 steps 110.41%/s, 100% \n",
      "Simulation Progress [Episode 81]: 100%|█| 100/100 [00:02<00:00, 34.84%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 82: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 82 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 80 with rewards -1899716.9293954847 with 1440 steps 103.01%/s, 100% \n",
      "Simulation Progress [Episode 82]: 100%|█| 100/100 [00:02<00:00, 34.27%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 83: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 83 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 81 with rewards -1899716.9293954847 with 1440 steps 105.28%/s, 100% \n",
      "Simulation Progress [Episode 83]: 100%|█| 100/100 [00:02<00:00, 34.34%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 84: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 84 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 82 with rewards -1899716.9293954847 with 1440 steps 104.29%/s, 100% \n",
      "Simulation Progress [Episode 84]: 100%|█| 100/100 [00:02<00:00, 34.29%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 85: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 85 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 83 with rewards -1899716.9293954847 with 1440 steps 108.60%/s, 100% \n",
      "Simulation Progress [Episode 85]: 100%|█| 100/100 [00:02<00:00, 34.61%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 86: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 86 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 84 with rewards -1899716.9293954847 with 1440 steps 104.51%/s, 100% \n",
      "Simulation Progress [Episode 86]: 100%|█| 100/100 [00:02<00:00, 34.43%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 87: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 87 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 85 with rewards -1899716.9293954847 with 1440 steps 101.23%/s, 100% \n",
      "Simulation Progress [Episode 87]: 100%|█| 100/100 [00:02<00:00, 34.39%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 88: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 88 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 86 with rewards -1899716.9293954847 with 1440 steps 108.78%/s, 100% \n",
      "Simulation Progress [Episode 88]: 100%|█| 100/100 [00:02<00:00, 34.68%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 89: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 89 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 87 with rewards -1899716.9293954847 with 1440 steps 105.33%/s, 100% \n",
      "Simulation Progress [Episode 89]: 100%|█| 100/100 [00:02<00:00, 34.40%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 90: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 90 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 88 with rewards -1899716.9293954847 with 1440 steps 105.72%/s, 100% \n",
      "Simulation Progress [Episode 90]: 100%|█| 100/100 [00:02<00:00, 34.55%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 91: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 91 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 89 with rewards -1899716.9293954847 with 1440 steps 105.26%/s, 100% \n",
      "Simulation Progress [Episode 91]: 100%|█| 100/100 [00:02<00:00, 34.38%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 92: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 92 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 90 with rewards -1899716.9293954847 with 1440 steps 109.82%/s, 100% \n",
      "Simulation Progress [Episode 92]: 100%|█| 100/100 [00:02<00:00, 34.57%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 93: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 93 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 91 with rewards -1899716.9293954847 with 1440 steps 107.43%/s, 100% \n",
      "Simulation Progress [Episode 93]: 100%|█| 100/100 [00:02<00:00, 34.52%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 94: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 94 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 92 with rewards -1899716.9293954847 with 1440 steps 112.24%/s, 100% \n",
      "Simulation Progress [Episode 94]: 100%|█| 100/100 [00:02<00:00, 34.81%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 95: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 95 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 93 with rewards -1899716.9293954847 with 1440 steps 109.26%/s, 100% \n",
      "Simulation Progress [Episode 95]: 100%|█| 100/100 [00:02<00:00, 34.51%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 96: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 96 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 94 with rewards -1899716.9293954847 with 1440 steps 105.05%/s, 100% \n",
      "Simulation Progress [Episode 96]: 100%|█| 100/100 [00:02<00:00, 34.36%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 97: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 97 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 95 with rewards -1899716.9293954847 with 1440 steps 98.17%/s, 100% c\n",
      "Simulation Progress [Episode 97]: 100%|█| 100/100 [00:02<00:00, 33.62%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 98: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 98 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 96 with rewards -1899716.9293954847 with 1440 steps 108.98%/s, 100% \n",
      "Simulation Progress [Episode 98]: 100%|█| 100/100 [00:02<00:00, 34.55%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 99: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 99 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 97 with rewards -1899716.9293954847 with 1440 steps 109.61%/s, 100% \n",
      "Simulation Progress [Episode 99]: 100%|█| 100/100 [00:02<00:00, 34.72%/s, 100% c\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 100: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 100 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 98 with rewards -1899716.9293954847 with 1440 steps, 103.05%/s, 100%\n",
      "Simulation Progress [Episode 100]: 100%|█| 100/100 [00:02<00:00, 34.47%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 101: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 101 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 99 with rewards -1899716.9293954847 with 1440 steps, 109.86%/s, 100%\n",
      "Simulation Progress [Episode 101]: 100%|█| 100/100 [00:02<00:00, 34.48%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 102: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 102 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 100 with rewards -1899716.9293954847 with 1440 steps 110.28%/s, 100%\n",
      "Simulation Progress [Episode 102]: 100%|█| 100/100 [00:02<00:00, 34.84%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 103: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 103 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 101 with rewards -1899716.9293954847 with 1440 steps 109.38%/s, 100%\n",
      "Simulation Progress [Episode 103]: 100%|█| 100/100 [00:02<00:00, 34.46%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 104: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 104 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 102 with rewards -1899716.9293954847 with 1440 steps 107.36%/s, 100%\n",
      "Simulation Progress [Episode 104]: 100%|█| 100/100 [00:02<00:00, 34.56%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 105: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 105 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 103 with rewards -1899716.9293954847 with 1440 steps 105.81%/s, 100%\n",
      "Simulation Progress [Episode 105]: 100%|█| 100/100 [00:02<00:00, 34.60%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 106: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 106 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 104 with rewards -1899716.9293954847 with 1440 steps 110.45%/s, 100%\n",
      "Simulation Progress [Episode 106]: 100%|█| 100/100 [00:02<00:00, 34.60%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 107: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 107 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 105 with rewards -1899716.9293954847 with 1440 steps 109.83%/s, 100%\n",
      "Simulation Progress [Episode 107]: 100%|█| 100/100 [00:02<00:00, 34.79%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 108: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 108 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 106 with rewards -1899716.9293954847 with 1440 steps 111.26%/s, 100%\n",
      "Simulation Progress [Episode 108]: 100%|█| 100/100 [00:02<00:00, 34.52%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 109: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 109 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 107 with rewards -1899716.9293954847 with 1440 steps 109.60%/s, 100%\n",
      "Simulation Progress [Episode 109]: 100%|█| 100/100 [00:02<00:00, 34.71%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 110: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 110 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 108 with rewards -1899716.9293954847 with 1440 steps 106.24%/s, 100%\n",
      "Simulation Progress [Episode 110]: 100%|█| 100/100 [00:02<00:00, 34.28%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 111: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 111 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 109 with rewards -1899716.9293954847 with 1440 steps 107.19%/s, 100%\n",
      "Simulation Progress [Episode 111]: 100%|█| 100/100 [00:02<00:00, 34.56%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 112: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 112 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 110 with rewards -1899716.9293954847 with 1440 steps 108.01%/s, 100%\n",
      "Simulation Progress [Episode 112]: 100%|█| 100/100 [00:02<00:00, 34.47%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 113: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 113 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 111 with rewards -1899716.9293954847 with 1440 steps 107.54%/s, 100%\n",
      "Simulation Progress [Episode 113]: 100%|█| 100/100 [00:02<00:00, 34.53%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 114: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 114 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 112 with rewards -1899716.9293954847 with 1440 steps 107.26%/s, 100%\n",
      "Simulation Progress [Episode 114]: 100%|█| 100/100 [00:02<00:00, 34.44%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 115: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 115 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 113 with rewards -1899716.9293954847 with 1440 steps 105.49%/s, 100%\n",
      "Simulation Progress [Episode 115]: 100%|█| 100/100 [00:02<00:00, 34.14%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 116: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 116 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 114 with rewards -1899716.9293954847 with 1440 steps 99.40%/s, 100% \n",
      "Simulation Progress [Episode 116]: 100%|█| 100/100 [00:02<00:00, 33.92%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 117: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 117 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 115 with rewards -1899716.9293954847 with 1440 steps 106.45%/s, 100%\n",
      "Simulation Progress [Episode 117]: 100%|█| 100/100 [00:02<00:00, 34.55%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 118: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 118 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 116 with rewards -1899716.9293954847 with 1440 steps 102.78%/s, 100%\n",
      "Simulation Progress [Episode 118]: 100%|█| 100/100 [00:02<00:00, 34.61%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 119: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 119 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 117 with rewards -1899716.9293954847 with 1440 steps 110.28%/s, 100%\n",
      "Simulation Progress [Episode 119]: 100%|█| 100/100 [00:02<00:00, 34.79%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 120: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 120 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 118 with rewards -1899716.9293954847 with 1440 steps 109.04%/s, 100%\n",
      "Simulation Progress [Episode 120]: 100%|█| 100/100 [00:02<00:00, 34.74%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 121: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 121 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 119 with rewards -1899716.9293954847 with 1440 steps 107.22%/s, 100%\n",
      "Simulation Progress [Episode 121]: 100%|█| 100/100 [00:02<00:00, 34.42%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 122: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 122 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 120 with rewards -1899716.9293954847 with 1440 steps 103.64%/s, 100%\n",
      "Simulation Progress [Episode 122]: 100%|█| 100/100 [00:02<00:00, 34.29%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 123: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 123 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 121 with rewards -1899716.9293954847 with 1440 steps 108.08%/s, 100%\n",
      "Simulation Progress [Episode 123]: 100%|█| 100/100 [00:02<00:00, 34.59%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 124: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 124 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 122 with rewards -1899716.9293954847 with 1440 steps 109.47%/s, 100%\n",
      "Simulation Progress [Episode 124]: 100%|█| 100/100 [00:02<00:00, 34.48%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 125: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 125 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 123 with rewards -1899716.9293954847 with 1440 steps 107.54%/s, 100%\n",
      "Simulation Progress [Episode 125]: 100%|█| 100/100 [00:02<00:00, 34.47%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 126: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 126 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 124 with rewards -1899716.9293954847 with 1440 steps 106.00%/s, 100%\n",
      "Simulation Progress [Episode 126]: 100%|█| 100/100 [00:02<00:00, 34.40%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 127: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 127 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 125 with rewards -1899716.9293954847 with 1440 steps 103.63%/s, 100%\n",
      "Simulation Progress [Episode 127]: 100%|█| 100/100 [00:02<00:00, 34.35%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 128: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 128 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 126 with rewards -1899716.9293954847 with 1440 steps 105.69%/s, 100%\n",
      "Simulation Progress [Episode 128]: 100%|█| 100/100 [00:02<00:00, 34.44%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 129: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 129 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 127 with rewards -1899716.9293954847 with 1440 steps 99.28%/s, 100% \n",
      "Simulation Progress [Episode 129]: 100%|█| 100/100 [00:02<00:00, 33.99%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 130: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 130 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 128 with rewards -1899716.9293954847 with 1440 steps 105.00%/s, 100%\n",
      "Simulation Progress [Episode 130]: 100%|█| 100/100 [00:02<00:00, 34.39%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 131: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 131 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 129 with rewards -1899716.9293954847 with 1440 steps 105.69%/s, 100%\n",
      "Simulation Progress [Episode 131]: 100%|█| 100/100 [00:02<00:00, 34.59%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 132: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 132 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 130 with rewards -1899716.9293954847 with 1440 steps 103.57%/s, 100%\n",
      "Simulation Progress [Episode 132]: 100%|█| 100/100 [00:02<00:00, 34.30%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 133: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 133 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 131 with rewards -1899716.9293954847 with 1440 steps 100.63%/s, 100%\n",
      "Simulation Progress [Episode 133]: 100%|█| 100/100 [00:02<00:00, 34.19%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 134: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 134 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 132 with rewards -1899716.9293954847 with 1440 steps 106.14%/s, 100%\n",
      "Simulation Progress [Episode 134]: 100%|█| 100/100 [00:02<00:00, 34.36%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 135: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 135 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 133 with rewards -1899716.9293954847 with 1440 steps 98.56%/s, 100% \n",
      "Simulation Progress [Episode 135]: 100%|█| 100/100 [00:02<00:00, 33.61%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 136: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 136 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 134 with rewards -1899716.9293954847 with 1440 steps 100.73%/s, 100%\n",
      "Simulation Progress [Episode 136]: 100%|█| 100/100 [00:02<00:00, 33.85%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 137: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 137 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 135 with rewards -1899716.9293954847 with 1440 steps 103.80%/s, 100%\n",
      "Simulation Progress [Episode 137]: 100%|█| 100/100 [00:02<00:00, 34.32%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 138: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 138 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 136 with rewards -1899716.9293954847 with 1440 steps 103.27%/s, 100%\n",
      "Simulation Progress [Episode 138]: 100%|█| 100/100 [00:02<00:00, 34.37%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 139: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 139 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 137 with rewards -1899716.9293954847 with 1440 steps 105.53%/s, 100%\n",
      "Simulation Progress [Episode 139]: 100%|█| 100/100 [00:02<00:00, 34.38%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 140: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 140 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 138 with rewards -1899716.9293954847 with 1440 steps 106.23%/s, 100%\n",
      "Simulation Progress [Episode 140]: 100%|█| 100/100 [00:02<00:00, 34.62%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 141: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 141 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 139 with rewards -1899716.9293954847 with 1440 steps 103.56%/s, 100%\n",
      "Simulation Progress [Episode 141]: 100%|█| 100/100 [00:02<00:00, 34.31%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 142: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 142 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 140 with rewards -1899716.9293954847 with 1440 steps 105.87%/s, 100%\n",
      "Simulation Progress [Episode 142]: 100%|█| 100/100 [00:02<00:00, 34.27%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 143: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 143 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 141 with rewards -1899716.9293954847 with 1440 steps 100.94%/s, 100%\n",
      "Simulation Progress [Episode 143]: 100%|█| 100/100 [00:02<00:00, 34.38%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 144: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 144 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 142 with rewards -1899716.9293954847 with 1440 steps 106.72%/s, 100%\n",
      "Simulation Progress [Episode 144]: 100%|█| 100/100 [00:02<00:00, 34.63%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 145: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 145 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 143 with rewards -1899716.9293954847 with 1440 steps 105.04%/s, 100%\n",
      "Simulation Progress [Episode 145]: 100%|█| 100/100 [00:02<00:00, 34.54%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 146: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 146 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 144 with rewards -1899716.9293954847 with 1440 steps 102.41%/s, 100%\n",
      "Simulation Progress [Episode 146]: 100%|█| 100/100 [00:02<00:00, 34.26%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 147: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 147 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 145 with rewards -1899716.9293954847 with 1440 steps 101.88%/s, 100%\n",
      "Simulation Progress [Episode 147]: 100%|█| 100/100 [00:02<00:00, 34.26%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 148: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 148 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 146 with rewards -1899716.9293954847 with 1440 steps 102.80%/s, 100%\n",
      "Simulation Progress [Episode 148]: 100%|█| 100/100 [00:02<00:00, 34.08%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 149: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 149 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 147 with rewards -1899716.9293954847 with 1440 steps 103.07%/s, 100%\n",
      "Simulation Progress [Episode 149]: 100%|█| 100/100 [00:02<00:00, 34.06%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 150: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 150 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 148 with rewards -1899716.9293954847 with 1440 steps 101.65%/s, 100%\n",
      "Simulation Progress [Episode 150]: 100%|█| 100/100 [00:02<00:00, 34.02%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 151: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 151 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 149 with rewards -1899716.9293954847 with 1440 steps 101.16%/s, 100%\n",
      "Simulation Progress [Episode 151]: 100%|█| 100/100 [00:02<00:00, 34.07%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 152: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 152 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 150 with rewards -1899716.9293954847 with 1440 steps 107.78%/s, 100%\n",
      "Simulation Progress [Episode 152]: 100%|█| 100/100 [00:02<00:00, 34.11%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 153: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 153 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 151 with rewards -1899716.9293954847 with 1440 steps 107.10%/s, 100%\n",
      "Simulation Progress [Episode 153]: 100%|█| 100/100 [00:02<00:00, 34.31%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 154: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 154 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 152 with rewards -1899716.9293954847 with 1440 steps 96.86%/s, 100% \n",
      "Simulation Progress [Episode 154]: 100%|█| 100/100 [00:02<00:00, 33.41%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 155: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 155 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 153 with rewards -1899716.9293954847 with 1440 steps 104.44%/s, 100%\n",
      "Simulation Progress [Episode 155]: 100%|█| 100/100 [00:02<00:00, 34.15%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 156: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 156 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 154 with rewards -1899716.9293954847 with 1440 steps 98.53%/s, 100% \n",
      "Simulation Progress [Episode 156]: 100%|█| 100/100 [00:02<00:00, 34.18%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 157: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 157 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 155 with rewards -1899716.9293954847 with 1440 steps 106.40%/s, 100%\n",
      "Simulation Progress [Episode 157]: 100%|█| 100/100 [00:02<00:00, 34.60%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 158: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 158 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 156 with rewards -1899716.9293954847 with 1440 steps 106.11%/s, 100%\n",
      "Simulation Progress [Episode 158]: 100%|█| 100/100 [00:02<00:00, 34.38%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 159: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 159 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 157 with rewards -1899716.9293954847 with 1440 steps 107.67%/s, 100%\n",
      "Simulation Progress [Episode 159]: 100%|█| 100/100 [00:02<00:00, 34.63%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 160: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 160 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 158 with rewards -1899716.9293954847 with 1440 steps 107.50%/s, 100%\n",
      "Simulation Progress [Episode 160]: 100%|█| 100/100 [00:02<00:00, 34.41%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 161: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 161 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 159 with rewards -1899716.9293954847 with 1440 steps 105.29%/s, 100%\n",
      "Simulation Progress [Episode 161]: 100%|█| 100/100 [00:02<00:00, 34.53%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 162: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 162 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 160 with rewards -1899716.9293954847 with 1440 steps 109.97%/s, 100%\n",
      "Simulation Progress [Episode 162]: 100%|█| 100/100 [00:02<00:00, 34.58%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 163: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 163 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 161 with rewards -1899716.9293954847 with 1440 steps 109.01%/s, 100%\n",
      "Simulation Progress [Episode 163]: 100%|█| 100/100 [00:02<00:00, 34.52%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 164: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 164 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 162 with rewards -1899716.9293954847 with 1440 steps 106.39%/s, 100%\n",
      "Simulation Progress [Episode 164]: 100%|█| 100/100 [00:02<00:00, 34.42%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 165: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 165 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 163 with rewards -1899716.9293954847 with 1440 steps 106.33%/s, 100%\n",
      "Simulation Progress [Episode 165]: 100%|█| 100/100 [00:02<00:00, 34.56%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 166: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 166 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 164 with rewards -1899716.9293954847 with 1440 steps 107.38%/s, 100%\n",
      "Simulation Progress [Episode 166]: 100%|█| 100/100 [00:02<00:00, 34.64%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 167: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 167 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 165 with rewards -1899716.9293954847 with 1440 steps 107.49%/s, 100%\n",
      "Simulation Progress [Episode 167]: 100%|█| 100/100 [00:02<00:00, 34.47%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 168: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 168 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 166 with rewards -1899716.9293954847 with 1440 steps 105.15%/s, 100%\n",
      "Simulation Progress [Episode 168]: 100%|█| 100/100 [00:02<00:00, 34.50%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 169: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 169 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 167 with rewards -1899716.9293954847 with 1440 steps 106.02%/s, 100%\n",
      "Simulation Progress [Episode 169]: 100%|█| 100/100 [00:02<00:00, 34.59%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 170: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 170 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 168 with rewards -1899716.9293954847 with 1440 steps 106.42%/s, 100%\n",
      "Simulation Progress [Episode 170]: 100%|█| 100/100 [00:02<00:00, 34.47%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 171: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 171 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 169 with rewards -1899716.9293954847 with 1440 steps 105.77%/s, 100%\n",
      "Simulation Progress [Episode 171]: 100%|█| 100/100 [00:02<00:00, 34.47%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 172: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 172 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 170 with rewards -1899716.9293954847 with 1440 steps 106.12%/s, 100%\n",
      "Simulation Progress [Episode 172]: 100%|█| 100/100 [00:02<00:00, 34.55%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 173: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 173 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 171 with rewards -1899716.9293954847 with 1440 steps 98.40%/s, 100% \n",
      "Simulation Progress [Episode 173]: 100%|█| 100/100 [00:02<00:00, 33.79%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 174: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 174 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 172 with rewards -1899716.9293954847 with 1440 steps 107.49%/s, 100%\n",
      "Simulation Progress [Episode 174]: 100%|█| 100/100 [00:02<00:00, 34.56%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 175: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 175 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 173 with rewards -1899716.9293954847 with 1440 steps 102.68%/s, 100%\n",
      "Simulation Progress [Episode 175]: 100%|█| 100/100 [00:02<00:00, 34.49%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 176: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 176 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 174 with rewards -1899716.9293954847 with 1440 steps 107.36%/s, 100%\n",
      "Simulation Progress [Episode 176]: 100%|█| 100/100 [00:02<00:00, 34.48%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 177: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 177 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 175 with rewards -1899716.9293954847 with 1440 steps 102.45%/s, 100%\n",
      "Simulation Progress [Episode 177]: 100%|█| 100/100 [00:02<00:00, 34.53%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 178: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 178 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 176 with rewards -1899716.9293954847 with 1440 steps 105.59%/s, 100%\n",
      "Simulation Progress [Episode 178]: 100%|█| 100/100 [00:02<00:00, 34.44%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 179: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 179 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 177 with rewards -1899716.9293954847 with 1440 steps 106.56%/s, 100%\n",
      "Simulation Progress [Episode 179]: 100%|█| 100/100 [00:02<00:00, 34.41%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 180: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 180 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 178 with rewards -1899716.9293954847 with 1440 steps 106.60%/s, 100%\n",
      "Simulation Progress [Episode 180]: 100%|█| 100/100 [00:02<00:00, 34.44%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 181: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 181 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 179 with rewards -1899716.9293954847 with 1440 steps 108.79%/s, 100%\n",
      "Simulation Progress [Episode 181]: 100%|█| 100/100 [00:02<00:00, 34.24%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 182: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 182 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 180 with rewards -1899716.9293954847 with 1440 steps 108.98%/s, 100%\n",
      "Simulation Progress [Episode 182]: 100%|█| 100/100 [00:02<00:00, 34.73%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 183: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 183 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 181 with rewards -1899716.9293954847 with 1440 steps 105.42%/s, 100%\n",
      "Simulation Progress [Episode 183]: 100%|█| 100/100 [00:02<00:00, 34.53%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 184: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 184 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 182 with rewards -1899716.9293954847 with 1440 steps 106.74%/s, 100%\n",
      "Simulation Progress [Episode 184]: 100%|█| 100/100 [00:02<00:00, 34.26%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 185: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 185 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 183 with rewards -1899716.9293954847 with 1440 steps 105.45%/s, 100%\n",
      "Simulation Progress [Episode 185]: 100%|█| 100/100 [00:02<00:00, 34.47%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 186: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 186 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 184 with rewards -1899716.9293954847 with 1440 steps 100.64%/s, 100%\n",
      "Simulation Progress [Episode 186]: 100%|█| 100/100 [00:02<00:00, 34.29%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 187: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 187 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 185 with rewards -1899716.9293954847 with 1440 steps 107.20%/s, 100%\n",
      "Simulation Progress [Episode 187]: 100%|█| 100/100 [00:02<00:00, 34.69%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 188: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 188 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 186 with rewards -1899716.9293954847 with 1440 steps 107.55%/s, 100%\n",
      "Simulation Progress [Episode 188]: 100%|█| 100/100 [00:02<00:00, 34.65%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 189: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 189 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 187 with rewards -1899716.9293954847 with 1440 steps 106.66%/s, 100%\n",
      "Simulation Progress [Episode 189]: 100%|█| 100/100 [00:02<00:00, 34.43%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 190: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 190 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 188 with rewards -1899716.9293954847 with 1440 steps 109.89%/s, 100%\n",
      "Simulation Progress [Episode 190]: 100%|█| 100/100 [00:02<00:00, 34.39%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 191: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 191 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 189 with rewards -1899716.9293954847 with 1440 steps 105.19%/s, 100%\n",
      "Simulation Progress [Episode 191]: 100%|█| 100/100 [00:02<00:00, 34.39%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 192: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 192 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 190 with rewards -1899716.9293954847 with 1440 steps 99.03%/s, 100% \n",
      "Simulation Progress [Episode 192]: 100%|█| 100/100 [00:02<00:00, 33.77%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 193: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 193 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 191 with rewards -1899716.9293954847 with 1440 steps 104.06%/s, 100%\n",
      "Simulation Progress [Episode 193]: 100%|█| 100/100 [00:02<00:00, 34.55%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 194: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 194 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 192 with rewards -1899716.9293954847 with 1440 steps 101.25%/s, 100%\n",
      "Simulation Progress [Episode 194]: 100%|█| 100/100 [00:02<00:00, 34.44%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 195: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 195 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 193 with rewards -1899716.9293954847 with 1440 steps 101.53%/s, 100%\n",
      "Simulation Progress [Episode 195]: 100%|█| 100/100 [00:02<00:00, 34.38%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 196: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 196 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 194 with rewards -1899716.9293954847 with 1440 steps 108.86%/s, 100%\n",
      "Simulation Progress [Episode 196]: 100%|█| 100/100 [00:02<00:00, 34.72%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 197: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 197 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 195 with rewards -1899716.9293954847 with 1440 steps 105.20%/s, 100%\n",
      "Simulation Progress [Episode 197]: 100%|█| 100/100 [00:02<00:00, 34.44%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 198: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 198 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 196 with rewards -1899716.9293954847 with 1440 steps 101.95%/s, 100%\n",
      "Simulation Progress [Episode 198]: 100%|█| 100/100 [00:02<00:00, 34.46%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 199: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 199 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 197 with rewards -1899716.9293954847 with 1440 steps 101.22%/s, 100%\n",
      "Simulation Progress [Episode 199]: 100%|█| 100/100 [00:02<00:00, 34.45%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 200: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 200 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 198 with rewards -1899716.9293954847 with 1440 steps 101.73%/s, 100%\n",
      "Simulation Progress [Episode 200]: 100%|█| 100/100 [00:02<00:00, 34.39%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 201: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 201 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 199 with rewards -1899716.9293954847 with 1440 steps 100.24%/s, 100%\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 246 with rewards -244.2465385815842 with 347 steps, done\n",
      "Run episode 247 with rewards -31.006678544073196 with 366 steps, done\n",
      "Run episode 248 with rewards 234.06211793920582 with 438 steps, done\n",
      "Run episode 249 with rewards 257.416519274365 with 404 steps, done\n",
      "Run episode 250 with rewards -207.25224578637676 with 317 steps, done\n",
      "Run episode 251 with rewards -77.66199676750053 with 233 steps, done\n",
      "Run episode 252 with rewards -50.059639407754844 with 284 steps, done\n",
      "Run episode 253 with rewards -25.637406142059433 with 219 steps, done\n",
      "Run episode 254 with rewards -211.04986133483774 with 389 steps, done\n",
      "Run episode 255 with rewards -185.58244049154754 with 257 steps, done\n",
      "Run episode 256 with rewards -248.81314196124123 with 292 steps, done\n",
      "Run episode 257 with rewards 124.39431083202021 with 728 steps, done\n",
      "Run episode 258 with rewards 204.21369471963015 with 785 steps, done\n",
      "Run episode 260 with rewards 177.75477378850746 with 780 steps, done\n",
      "Run episode 261 with rewards -238.21693198890597 with 256 steps, done\n",
      "Run episode 262 with rewards -30.731398806317245 with 365 steps, done\n",
      "Run episode 263 with rewards 28.655058994896734 with 306 steps, done\n",
      "Run episode 264 with rewards 278.98567912535157 with 831 steps, done\n",
      "Run episode 265 with rewards -168.24450572996807 with 241 steps, done\n",
      "Run episode 266 with rewards -37.66702064353167 with 220 steps, done\n",
      "Run episode 267 with rewards -178.14300303184712 with 247 steps, done\n",
      "Run episode 268 with rewards -176.0757166786907 with 265 steps, done\n",
      "Run episode 269 with rewards -256.12054966712606 with 336 steps, done\n",
      "Run episode 270 with rewards -59.66322952035947 with 226 steps, done\n",
      "Run episode 271 with rewards 32.58733809139983 with 175 steps, done\n",
      "Run episode 272 with rewards -19.32903481550828 with 329 steps, done\n",
      "Run episode 273 with rewards -189.2514832048664 with 357 steps, done\n",
      "Run episode 274 with rewards -55.594473651245195 with 273 steps, done\n",
      "Run episode 275 with rewards -184.13387622083957 with 342 steps, done\n",
      "Run episode 276 with rewards 9.134317671466746 with 192 steps, done\n",
      "Run episode 277 with rewards -236.20993457525447 with 310 steps, done\n",
      "Run episode 278 with rewards -42.04629382779699 with 242 steps, done\n",
      "Run episode 279 with rewards -259.69836970206586 with 297 steps, done\n",
      "Run episode 280 with rewards -154.64069015182312 with 235 steps, done\n",
      "Run episode 281 with rewards 34.79384545551477 with 318 steps, done\n",
      "Run episode 282 with rewards -36.47286037710879 with 203 steps, done\n",
      "Run episode 283 with rewards -36.79908423540414 with 267 steps, done\n",
      "Run episode 284 with rewards -103.6595431781962 with 241 steps, done\n",
      "Run episode 285 with rewards 215.0247232767742 with 518 steps, done\n",
      "Run episode 286 with rewards -52.0088088039725 with 313 steps, done\n",
      "Run episode 287 with rewards -219.16264201584227 with 215 steps, done\n",
      "Run episode 288 with rewards -55.03163319953982 with 234 steps, done\n",
      "Run episode 289 with rewards -249.87109720717513 with 321 steps, done\n",
      "Run episode 290 with rewards -214.96715465816186 with 251 steps, done\n",
      "Run episode 291 with rewards -48.04295385786992 with 267 steps, done\n",
      "Run episode 292 with rewards -163.70308029492455 with 350 steps, done\n",
      "Run episode 293 with rewards 151.4317360417223 with 570 steps, done\n",
      "Run episode 294 with rewards -178.27432992747936 with 265 steps, done\n",
      "Run episode 295 with rewards -77.21628922917375 with 243 steps, done\n",
      "Run episode 296 with rewards -147.9267520246837 with 299 steps, done\n",
      "Run episode 297 with rewards -217.68753136290763 with 304 steps, done\n",
      "Run episode 298 with rewards -170.55398054889324 with 251 steps, done\n",
      "Run episode 299 with rewards 209.3158566516995 with 453 steps, done\n",
      "Run episode 300 with rewards -240.02434956807886 with 245 steps, done\n",
      "Run episode 301 with rewards -31.65473128631585 with 245 steps, done\n",
      "Run episode 302 with rewards 3.1187086818034544 with 258 steps, done\n",
      "Run episode 303 with rewards -175.26964963460608 with 307 steps, done\n",
      "Run episode 304 with rewards -133.5561604938311 with 285 steps, done\n",
      "Run episode 305 with rewards -39.332747662606224 with 274 steps, done\n",
      "Run episode 306 with rewards -274.24992882917593 with 318 steps, done\n",
      "Run episode 307 with rewards -232.69724914616592 with 398 steps, done\n",
      "Run episode 308 with rewards -182.76401864118543 with 281 steps, done\n",
      "Run episode 309 with rewards -184.9297459050511 with 245 steps, done\n",
      "Run episode 310 with rewards -35.024920383297214 with 317 steps, done\n",
      "Run episode 311 with rewards -75.90482960447353 with 370 steps, done\n",
      "Run episode 312 with rewards -241.48999904303957 with 281 steps, done\n",
      "Run episode 313 with rewards -28.2391010279471 with 262 steps, done\n",
      "Run episode 314 with rewards -2.8728539858909414 with 245 steps, done\n",
      "Run episode 315 with rewards -249.625363181883 with 395 steps, done\n",
      "Run episode 316 with rewards -220.6411860424547 with 437 steps, done\n",
      "Run episode 317 with rewards 233.33490822089024 with 568 steps, done\n",
      "Run episode 318 with rewards -167.00624825862687 with 295 steps, done\n",
      "Run episode 319 with rewards 8.777040559255866 with 196 steps, done\n",
      "Run episode 320 with rewards -43.283914175930356 with 303 steps, done\n",
      "Run episode 321 with rewards -190.2543051307646 with 301 steps, done\n",
      "Run episode 322 with rewards -167.08874614212397 with 309 steps, done\n",
      "Run episode 323 with rewards -106.04723207431032 with 325 steps, done\n",
      "Run episode 324 with rewards -186.10576906748105 with 220 steps, done\n",
      "Run episode 325 with rewards -235.12556073375885 with 301 steps, done\n",
      "Run episode 326 with rewards -68.3601675241952 with 241 steps, done\n",
      "Run episode 327 with rewards -72.46691415997566 with 402 steps, done\n",
      "Run episode 328 with rewards -210.4446901220499 with 513 steps, done\n",
      "Run episode 329 with rewards -26.162081904564715 with 302 steps, done\n",
      "Run episode 330 with rewards -206.1579012072595 with 295 steps, done\n",
      "Run episode 331 with rewards 197.10147440474603 with 892 steps, done\n",
      "Run episode 332 with rewards 240.45225774326374 with 409 steps, done\n",
      "Run episode 333 with rewards -97.93217811901216 with 379 steps, done\n",
      "Run episode 334 with rewards -190.2295074779645 with 314 steps, done\n",
      "Run episode 335 with rewards -207.24384503228373 with 310 steps, done\n",
      "Run episode 336 with rewards -192.23554854446894 with 244 steps, done\n",
      "Run episode 337 with rewards 182.74506043474992 with 765 steps, done\n",
      "Run episode 338 with rewards 212.75115537029092 with 718 steps, done\n",
      "Run episode 339 with rewards -72.8389372614992 with 173 steps, done\n",
      "Run episode 340 with rewards -178.78303382790085 with 322 steps, done\n",
      "Run episode 341 with rewards -48.2012490279366 with 230 steps, done\n",
      "Run episode 342 with rewards -26.8083809368363 with 222 steps, done\n",
      "Run episode 343 with rewards -56.88623634161195 with 246 steps, done\n",
      "Run episode 344 with rewards -185.1710796498661 with 295 steps, done\n",
      "Run episode 345 with rewards -223.28418044936933 with 354 steps, done\n",
      "Run episode 346 with rewards -13.013778857530468 with 250 steps, done\n",
      "Run episode 347 with rewards -57.6037435259405 with 254 steps, done\n",
      "Run episode 348 with rewards -214.29105902394662 with 291 steps, done\n",
      "Run episode 349 with rewards -77.80228868046795 with 314 steps, done\n",
      "Run episode 350 with rewards -20.043204701876434 with 251 steps, done\n",
      "Run episode 351 with rewards -195.4769881002441 with 229 steps, done\n",
      "Run episode 352 with rewards -20.302832114290226 with 180 steps, done\n",
      "Run episode 353 with rewards 181.40838807826705 with 716 steps, done\n",
      "Run episode 354 with rewards 220.33567020398152 with 625 steps, done\n",
      "Run episode 355 with rewards -166.2179338046505 with 277 steps, done\n",
      "Run episode 356 with rewards -42.59729572632081 with 254 steps, done\n",
      "Run episode 357 with rewards -250.71629103857904 with 347 steps, done\n",
      "Run episode 358 with rewards -24.355244771574377 with 267 steps, done\n",
      "Run episode 359 with rewards -33.230977365929945 with 261 steps, done\n",
      "Run episode 360 with rewards -227.14202569509186 with 367 steps, done\n",
      "Run episode 361 with rewards -27.231696393631765 with 284 steps, done\n",
      "Run episode 362 with rewards -191.67269135885203 with 281 steps, done\n",
      "Run episode 363 with rewards 275.02766124749735 with 433 steps, done\n",
      "Run episode 364 with rewards -38.58309829819113 with 332 steps, done\n",
      "Run episode 365 with rewards -175.57254326514175 with 308 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 366 with rewards -48.44371582130563 with 361 steps, done\n",
      "Run episode 367 with rewards -202.04529337530425 with 221 steps, done\n",
      "Run episode 368 with rewards -17.176491653213304 with 201 steps, done\n",
      "Run episode 369 with rewards -234.77965840017097 with 276 steps, done\n",
      "Run episode 370 with rewards 211.77539410807992 with 416 steps, done\n",
      "Run episode 371 with rewards -204.51895391359886 with 226 steps, done\n",
      "Run episode 372 with rewards -48.86977679315119 with 168 steps, done\n",
      "Run episode 373 with rewards 41.375290033365815 with 252 steps, done\n",
      "Run episode 374 with rewards -68.59738069908633 with 235 steps, done\n",
      "Run episode 375 with rewards -14.414449491708169 with 263 steps, done\n",
      "Run episode 376 with rewards -146.32943051693857 with 462 steps, done\n",
      "Run episode 377 with rewards 223.58780566095825 with 424 steps, done\n",
      "Run episode 378 with rewards 195.76246947111778 with 478 steps, done\n",
      "Run episode 379 with rewards -47.99715427876442 with 228 steps, done\n",
      "Run episode 380 with rewards -18.186689962849044 with 248 steps, done\n",
      "Run episode 381 with rewards -155.48362691837266 with 313 steps, done\n",
      "Run episode 382 with rewards 215.43011728355455 with 485 steps, done\n",
      "Run episode 383 with rewards -30.477667284951394 with 222 steps, done\n",
      "Run episode 384 with rewards -213.13025661218518 with 268 steps, done\n",
      "Run episode 385 with rewards -30.85623815655289 with 264 steps, done\n",
      "Run episode 386 with rewards -207.26961687041305 with 319 steps, done\n",
      "Run episode 387 with rewards 259.9107522855444 with 377 steps, done\n",
      "Run episode 388 with rewards -213.28163022411167 with 253 steps, done\n",
      "Run episode 389 with rewards -33.033443402246974 with 271 steps, done\n",
      "Run episode 390 with rewards -42.914755702407625 with 363 steps, done\n",
      "Run episode 391 with rewards 11.081663655332093 with 180 steps, done\n",
      "Run episode 392 with rewards 2.770688463442923 with 291 steps, done\n",
      "Run episode 393 with rewards -155.37465423529204 with 281 steps, done\n",
      "Run episode 394 with rewards -17.338562812030787 with 224 steps, done\n",
      "Run episode 395 with rewards -44.94911463694095 with 287 steps, done\n",
      "Run episode 396 with rewards -202.97166096702065 with 152 steps, done\n",
      "Run episode 397 with rewards 270.3670760355457 with 327 steps, done\n",
      "Run episode 398 with rewards -197.51891298095148 with 220 steps, done\n",
      "Run episode 399 with rewards -206.7660120668284 with 289 steps, done\n",
      "Run episode 400 with rewards -218.88230382793353 with 273 steps, done\n",
      "Run episode 401 with rewards -197.68306617166144 with 251 steps, done\n",
      "Run episode 402 with rewards -151.28492149249428 with 313 steps, done\n",
      "Run episode 403 with rewards -34.323900832215855 with 258 steps, done\n",
      "Run episode 404 with rewards 222.75847005555946 with 411 steps, done\n",
      "Run episode 405 with rewards 255.56453933560863 with 472 steps, done\n",
      "Run episode 406 with rewards -4.6525354608802445 with 252 steps, done\n",
      "Run episode 407 with rewards -181.5768493915313 with 296 steps, done\n",
      "Run episode 408 with rewards 244.78220640721096 with 514 steps, done\n",
      "Run episode 409 with rewards -190.18379581087186 with 233 steps, done\n",
      "Run episode 410 with rewards 169.16768208385486 with 992 steps, done\n",
      "Run episode 412 with rewards -247.9991949983724 with 281 steps, done\n",
      "Run episode 413 with rewards -59.21957094710206 with 362 steps, done\n",
      "Run episode 414 with rewards -56.751088154927224 with 249 steps, done\n",
      "Run episode 415 with rewards -235.59834894299163 with 330 steps, done\n",
      "Run episode 416 with rewards -187.71099872614315 with 275 steps, done\n",
      "Run episode 417 with rewards 229.64219260058908 with 477 steps, done\n",
      "Run episode 418 with rewards 206.6187517786325 with 317 steps, done\n",
      "Run episode 419 with rewards -209.4481474012535 with 231 steps, done\n",
      "Run episode 420 with rewards -22.283879023162214 with 243 steps, done\n",
      "Run episode 421 with rewards -28.615185808515392 with 395 steps, done\n",
      "Run episode 422 with rewards 21.961083240851508 with 258 steps, done\n",
      "Run episode 423 with rewards -219.4634617561546 with 275 steps, done\n",
      "Run episode 424 with rewards -213.88407691390066 with 266 steps, done\n",
      "Run episode 425 with rewards -201.78986621738426 with 214 steps, done\n",
      "Run episode 426 with rewards 247.7256901225623 with 669 steps, done\n",
      "Run episode 427 with rewards -169.64356047454748 with 209 steps, done\n",
      "Run episode 428 with rewards -196.17931653729994 with 305 steps, done\n",
      "Run episode 429 with rewards -3.697400652282809 with 326 steps, done\n",
      "Run episode 431 with rewards -170.29932126742102 with 264 steps, done\n",
      "Run episode 432 with rewards -243.96085010600305 with 376 steps, done\n",
      "Run episode 433 with rewards 231.64607540902708 with 406 steps, done\n",
      "Run episode 434 with rewards 200.9306845140354 with 445 steps, done\n",
      "Run episode 435 with rewards -181.14318195129027 with 297 steps, done\n",
      "Run episode 436 with rewards 234.90342249299948 with 466 steps, done\n",
      "Run episode 437 with rewards 156.2106911171348 with 522 steps, done\n",
      "Run episode 438 with rewards -3.7198139016883403 with 250 steps, done\n",
      "Run episode 439 with rewards 23.54116352901049 with 276 steps, done\n",
      "Run episode 440 with rewards -57.21267845374936 with 286 steps, done\n",
      "Run episode 441 with rewards -200.41525143516105 with 281 steps, done\n",
      "Run episode 442 with rewards 230.20830579147946 with 428 steps, done\n",
      "Run episode 443 with rewards -243.41660307301552 with 349 steps, done\n",
      "Run episode 444 with rewards 7.602364275254629 with 283 steps, done\n",
      "Run episode 445 with rewards -110.39966925332585 with 323 steps, done\n",
      "Run episode 446 with rewards -237.3320563758705 with 284 steps, done\n",
      "Run episode 447 with rewards 234.8188811609295 with 419 steps, done\n",
      "Run episode 448 with rewards -17.678682776891236 with 196 steps, done\n",
      "Run episode 449 with rewards 203.03730832110375 with 445 steps, done\n",
      "Run episode 450 with rewards -47.555241255669856 with 273 steps, done\n",
      "Run episode 451 with rewards -157.9587446817854 with 212 steps, done\n",
      "Run episode 452 with rewards -151.08595914303496 with 309 steps, done\n",
      "Run episode 453 with rewards -229.2809114651153 with 399 steps, done\n",
      "Run episode 454 with rewards 256.4188158133843 with 522 steps, done\n",
      "Run episode 455 with rewards -185.87722137194282 with 244 steps, done\n",
      "Run episode 456 with rewards -171.6149137609924 with 291 steps, done\n",
      "Run episode 457 with rewards 229.68434192467356 with 491 steps, done\n",
      "Run episode 458 with rewards -193.8378617801393 with 243 steps, done\n",
      "Run episode 459 with rewards -180.0726641530449 with 250 steps, done\n",
      "Run episode 460 with rewards 266.3561207984869 with 321 steps, done\n",
      "Run episode 461 with rewards -213.15333293184 with 226 steps, done\n",
      "Run episode 462 with rewards -60.96946188928059 with 343 steps, done\n",
      "Run episode 463 with rewards -40.00903302726189 with 235 steps, done\n",
      "Run episode 464 with rewards -217.5919117534575 with 287 steps, done\n",
      "Run episode 465 with rewards 12.327950241146453 with 324 steps, done\n",
      "Run episode 466 with rewards -141.93655015550286 with 233 steps, done\n",
      "Run episode 467 with rewards -186.89560265207834 with 301 steps, done\n",
      "Run episode 468 with rewards -9.955118617833335 with 247 steps, done\n",
      "Run episode 469 with rewards -185.94548250184397 with 369 steps, done\n",
      "Run episode 470 with rewards -207.27461978234314 with 403 steps, done\n",
      "Run episode 471 with rewards 225.8193262921259 with 484 steps, done\n",
      "Run episode 472 with rewards 221.36936256501033 with 409 steps, done\n",
      "Run episode 473 with rewards -29.053628445525533 with 253 steps, done\n",
      "Run episode 474 with rewards -12.035417091793349 with 248 steps, done\n",
      "Run episode 475 with rewards 29.254463340165955 with 231 steps, done\n",
      "Run episode 476 with rewards -32.88727075268358 with 264 steps, done\n",
      "Run episode 477 with rewards -5.348219119021053 with 250 steps, done\n",
      "Run episode 478 with rewards -215.24673085923519 with 217 steps, done\n",
      "Run episode 479 with rewards -219.39221520203353 with 358 steps, done\n",
      "Run episode 480 with rewards -217.93500369403057 with 370 steps, done\n",
      "Run episode 481 with rewards -222.02038850166147 with 315 steps, done\n",
      "Run episode 482 with rewards -193.36471034077368 with 313 steps, done\n",
      "Run episode 483 with rewards 206.02721893000205 with 325 steps, done\n",
      "Run episode 484 with rewards -184.09350238008932 with 343 steps, done\n",
      "Run episode 485 with rewards -8.592702957705754 with 255 steps, done\n",
      "Run episode 486 with rewards 0.21780898288656658 with 240 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 487 with rewards 277.2292388008925 with 271 steps, done\n",
      "Run episode 488 with rewards -21.429443670133864 with 345 steps, done\n",
      "Run episode 489 with rewards -74.83399916873474 with 338 steps, done\n",
      "Run episode 490 with rewards -64.82309784368846 with 338 steps, done\n",
      "Run episode 491 with rewards -58.88477789845844 with 348 steps, done\n",
      "Run episode 492 with rewards 48.13300656327243 with 266 steps, done\n",
      "Run episode 493 with rewards 224.16384194527194 with 978 steps, done\n",
      "Run episode 494 with rewards -40.98547173972675 with 318 steps, done\n",
      "Run episode 495 with rewards 289.8448226645586 with 394 steps, done\n",
      "Run episode 496 with rewards 17.94295990740605 with 302 steps, done\n",
      "Run episode 497 with rewards -229.8436769565745 with 304 steps, done\n",
      "Run episode 498 with rewards -55.85254480772765 with 329 steps, done\n",
      "Run episode 499 with rewards -99.87815534651025 with 314 steps, done\n",
      "Run episode 500 with rewards 221.5808546450197 with 803 steps, done\n",
      "Run episode 501 with rewards -153.4676085940006 with 207 steps, done\n",
      "Run episode 502 with rewards -229.2581507451816 with 315 steps, done\n",
      "Run episode 503 with rewards -173.66347600768609 with 340 steps, done\n",
      "Run episode 504 with rewards -190.46953130915222 with 217 steps, done\n",
      "Run episode 505 with rewards -82.31276307204405 with 355 steps, done\n",
      "Run episode 506 with rewards -255.4524613609664 with 339 steps, done\n",
      "Run episode 507 with rewards -213.30001399443478 with 243 steps, done\n",
      "Run episode 508 with rewards -224.64024352165708 with 474 steps, done\n",
      "Run episode 509 with rewards -187.67686434620094 with 282 steps, done\n",
      "Run episode 510 with rewards -73.31368554644442 with 352 steps, done\n",
      "Run episode 511 with rewards -193.6938827058392 with 315 steps, done\n",
      "Run episode 512 with rewards -31.283639693709887 with 245 steps, done\n",
      "Run episode 513 with rewards -172.82720354341092 with 311 steps, done\n",
      "Run episode 514 with rewards 203.35916456873005 with 720 steps, done\n",
      "Run episode 515 with rewards -199.88221329761222 with 305 steps, done\n",
      "Run episode 516 with rewards -193.31733115222238 with 271 steps, done\n",
      "Run episode 517 with rewards 233.50019507856115 with 380 steps, done\n",
      "Run episode 518 with rewards -119.15057987827404 with 241 steps, done\n",
      "Run episode 519 with rewards -96.48239189454925 with 404 steps, done\n",
      "Run episode 520 with rewards -48.733029862615126 with 250 steps, done\n",
      "Run episode 521 with rewards -40.86142126982671 with 267 steps, done\n",
      "Run episode 522 with rewards -159.9678671367988 with 229 steps, done\n",
      "Run episode 523 with rewards 207.54680942733464 with 517 steps, done\n",
      "Run episode 524 with rewards -78.96409201418889 with 309 steps, done\n",
      "Run episode 525 with rewards -182.9546650984813 with 343 steps, done\n",
      "Run episode 526 with rewards -45.790949422333014 with 311 steps, done\n",
      "Run episode 527 with rewards -242.84207594659983 with 342 steps, done\n",
      "Run episode 528 with rewards -53.02833908804685 with 314 steps, done\n",
      "Run episode 529 with rewards 218.51953875587594 with 434 steps, done\n",
      "Run episode 530 with rewards -200.93637145159659 with 283 steps, done\n",
      "Run episode 531 with rewards 6.287902787812897 with 341 steps, done\n",
      "Run episode 532 with rewards -234.65891866678004 with 295 steps, done\n",
      "Run episode 533 with rewards -233.04213441287845 with 365 steps, done\n",
      "Run episode 534 with rewards 39.3507012627862 with 199 steps, done\n",
      "Run episode 535 with rewards -19.897934711679 with 301 steps, done\n",
      "Run episode 536 with rewards -199.91036075421775 with 288 steps, done\n",
      "Run episode 537 with rewards -15.748662256422818 with 311 steps, done\n",
      "Run episode 538 with rewards 221.81036114081436 with 467 steps, done\n",
      "Run episode 539 with rewards -30.878330137384694 with 250 steps, done\n",
      "Run episode 540 with rewards -59.58665268838701 with 278 steps, done\n",
      "Run episode 541 with rewards -52.87106639285652 with 283 steps, done\n",
      "Run episode 542 with rewards -207.31136079510532 with 359 steps, done\n",
      "Run episode 543 with rewards 269.0735201532712 with 361 steps, done\n",
      "Run episode 544 with rewards -46.47382916289795 with 292 steps, done\n",
      "Run episode 545 with rewards -109.41887579755665 with 352 steps, done\n",
      "Run episode 546 with rewards -10.689716125996739 with 225 steps, done\n",
      "Run episode 547 with rewards -209.44130111066346 with 350 steps, done\n",
      "Run episode 548 with rewards -227.96809478265564 with 289 steps, done\n",
      "Run episode 549 with rewards -199.3542283604993 with 321 steps, done\n",
      "Run episode 550 with rewards -2.178113870629346 with 241 steps, done\n",
      "Run episode 551 with rewards -95.03228120071168 with 347 steps, done\n",
      "Run episode 552 with rewards 208.69030285861697 with 365 steps, done\n",
      "Run episode 553 with rewards -230.42882449230459 with 439 steps, done\n",
      "Run episode 554 with rewards -24.92361794151917 with 235 steps, done\n",
      "Run episode 555 with rewards -194.8944894445226 with 249 steps, done\n",
      "Run episode 556 with rewards -141.76449329829603 with 223 steps, done\n",
      "Run episode 557 with rewards -214.28021265375133 with 336 steps, done\n",
      "Run episode 558 with rewards 183.06641947213507 with 369 steps, done\n",
      "Run episode 559 with rewards -29.366515314525543 with 237 steps, done\n",
      "Run episode 560 with rewards -53.05784667465059 with 251 steps, done\n",
      "Run episode 561 with rewards -161.95281677994524 with 219 steps, done\n",
      "Run episode 562 with rewards -212.18678270522986 with 294 steps, done\n",
      "Run episode 563 with rewards -223.42235533441777 with 218 steps, done\n",
      "Run episode 564 with rewards -55.03380706260357 with 313 steps, done\n",
      "Run episode 565 with rewards -194.61547411084715 with 239 steps, done\n",
      "Run episode 566 with rewards -15.187200344052954 with 240 steps, done\n",
      "Run episode 567 with rewards -25.67717778775794 with 231 steps, done\n",
      "Run episode 568 with rewards -38.139365909114005 with 269 steps, done\n",
      "Run episode 569 with rewards 178.4775036580232 with 743 steps, done\n",
      "Run episode 570 with rewards -175.22858111546248 with 247 steps, done\n",
      "Run episode 571 with rewards 162.40974541659813 with 547 steps, done\n",
      "Run episode 572 with rewards 272.7263377638899 with 409 steps, done\n",
      "Run episode 573 with rewards -179.9529363325306 with 278 steps, done\n",
      "Run episode 574 with rewards -72.50290991706497 with 221 steps, done\n",
      "Run episode 575 with rewards -11.348741073677104 with 182 steps, done\n",
      "Run episode 576 with rewards -30.140446720502624 with 288 steps, done\n",
      "Run episode 577 with rewards -194.30582004792026 with 300 steps, done\n",
      "Run episode 578 with rewards -107.56025843766278 with 285 steps, done\n",
      "Run episode 579 with rewards -210.02343764662595 with 379 steps, done\n",
      "Run episode 580 with rewards -163.46192043636245 with 288 steps, done\n",
      "Run episode 581 with rewards -192.3475399203897 with 263 steps, done\n",
      "Run episode 582 with rewards -201.40465399783096 with 232 steps, done\n",
      "Run episode 583 with rewards -151.40637659028198 with 298 steps, done\n",
      "Run episode 584 with rewards 23.31546102606916 with 292 steps, done\n",
      "Run episode 585 with rewards -8.055906623968028 with 298 steps, done\n",
      "Run episode 586 with rewards -31.08365794949161 with 246 steps, done\n",
      "Run episode 587 with rewards -3.0744703647942515 with 244 steps, done\n",
      "Run episode 588 with rewards 256.71794190770413 with 443 steps, done\n",
      "Run episode 589 with rewards -16.32565665020026 with 369 steps, done\n",
      "Run episode 590 with rewards 221.33342776602694 with 755 steps, done\n",
      "Run episode 591 with rewards 209.66077778468872 with 816 steps, done\n",
      "Run episode 592 with rewards -203.65691394702844 with 307 steps, done\n",
      "Run episode 593 with rewards -171.40947686334448 with 218 steps, done\n",
      "Run episode 594 with rewards -38.718255346446966 with 371 steps, done\n",
      "Run episode 595 with rewards 206.06234949459775 with 823 steps, done\n",
      "Run episode 596 with rewards -42.4154010041874 with 277 steps, done\n",
      "Run episode 597 with rewards -170.89873759767636 with 246 steps, done\n",
      "Run episode 598 with rewards 251.6145003594563 with 422 steps, done\n",
      "Run episode 599 with rewards -207.5056143974765 with 287 steps, done\n",
      "Run episode 600 with rewards 255.05417774236747 with 332 steps, done\n",
      "Run episode 601 with rewards -49.06806218714627 with 316 steps, done\n",
      "Run episode 602 with rewards 268.2348532359259 with 390 steps, done\n",
      "Run episode 603 with rewards -62.74270658014756 with 326 steps, done\n",
      "Run episode 604 with rewards -242.7734375784077 with 382 steps, done\n",
      "Run episode 605 with rewards -165.86990035092694 with 233 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 606 with rewards -157.5815992070482 with 305 steps, done\n",
      "Run episode 607 with rewards -53.20747149624078 with 246 steps, done\n",
      "Run episode 608 with rewards -36.73833135397046 with 264 steps, done\n",
      "Run episode 609 with rewards -224.3292836813523 with 399 steps, done\n",
      "Run episode 610 with rewards 222.19351971197045 with 464 steps, done\n",
      "Run episode 611 with rewards 226.1896506858136 with 393 steps, done\n",
      "Run episode 612 with rewards -177.84556821171964 with 312 steps, done\n",
      "Run episode 613 with rewards -44.19227971120334 with 283 steps, done\n",
      "Run episode 614 with rewards -63.375520161089085 with 292 steps, done\n",
      "Run episode 615 with rewards -97.66653314750229 with 344 steps, done\n",
      "Run episode 616 with rewards 179.71727426372286 with 640 steps, done\n",
      "Run episode 617 with rewards -190.6874998994025 with 223 steps, done\n",
      "Run episode 618 with rewards -194.32202902923427 with 304 steps, done\n",
      "Run episode 619 with rewards -173.65292136657922 with 241 steps, done\n",
      "Run episode 620 with rewards -37.585594241403925 with 243 steps, done\n",
      "Run episode 621 with rewards 242.0654515654267 with 338 steps, done\n",
      "Run episode 622 with rewards -81.22575594936588 with 312 steps, done\n",
      "Run episode 623 with rewards -51.4840696470189 with 316 steps, done\n",
      "Run episode 624 with rewards 17.09249142607591 with 249 steps, done\n",
      "Run episode 625 with rewards -229.08113856332676 with 249 steps, done\n",
      "Run episode 626 with rewards -29.31723213845069 with 237 steps, done\n",
      "Run episode 627 with rewards -5.619303911656289 with 248 steps, done\n",
      "Run episode 628 with rewards -156.0995213772103 with 203 steps, done\n",
      "Run episode 629 with rewards -188.38789515421493 with 219 steps, done\n",
      "Run episode 630 with rewards -153.46064908429702 with 242 steps, done\n",
      "Run episode 631 with rewards -207.02674060450784 with 288 steps, done\n",
      "Run episode 632 with rewards -202.0663205834128 with 230 steps, done\n",
      "Run episode 633 with rewards -23.533354951647 with 236 steps, done\n",
      "Run episode 634 with rewards -182.72805654215938 with 215 steps, done\n",
      "Run episode 635 with rewards 299.7850159275119 with 350 steps, done\n",
      "Run episode 636 with rewards -14.913070331562736 with 251 steps, done\n",
      "Run episode 637 with rewards 247.49635088830507 with 383 steps, done\n",
      "Run episode 638 with rewards -31.727275894824842 with 239 steps, done\n",
      "Run episode 639 with rewards -42.91027969290869 with 262 steps, done\n",
      "Run episode 640 with rewards 243.02600317273212 with 412 steps, done\n",
      "Run episode 641 with rewards 158.67715042659773 with 523 steps, done\n",
      "Run episode 642 with rewards 222.05721035799561 with 474 steps, done\n",
      "Run episode 643 with rewards -44.460637357170654 with 254 steps, done\n",
      "Run episode 644 with rewards -36.691235494998736 with 239 steps, done\n",
      "Run episode 645 with rewards 204.22147031367152 with 511 steps, done\n",
      "Run episode 646 with rewards -232.31848550094585 with 405 steps, done\n",
      "Run episode 647 with rewards -14.520423631786059 with 267 steps, done\n",
      "Run episode 648 with rewards -137.36688511898348 with 251 steps, done\n",
      "Run episode 649 with rewards -185.66873751701416 with 238 steps, done\n",
      "Run episode 650 with rewards -26.262215138650916 with 255 steps, done\n",
      "Run episode 651 with rewards -224.57636171243462 with 355 steps, done\n",
      "Run episode 652 with rewards -192.37817087607098 with 230 steps, done\n",
      "Run episode 653 with rewards 227.4877633382821 with 414 steps, done\n",
      "Run episode 654 with rewards 213.77894241668704 with 447 steps, done\n",
      "Run episode 655 with rewards -0.30724824515455396 with 274 steps, done\n",
      "Run episode 656 with rewards -70.41443200519892 with 238 steps, done\n",
      "Run episode 657 with rewards -149.8417849875255 with 254 steps, done\n",
      "Run episode 658 with rewards -6.695361825480504 with 387 steps, done\n",
      "Run episode 659 with rewards 255.10806119580036 with 364 steps, done\n",
      "Run episode 660 with rewards -62.433831602512385 with 232 steps, done\n",
      "Run episode 661 with rewards -54.31619607539356 with 230 steps, done\n",
      "Run episode 662 with rewards -13.066497483710762 with 229 steps, done\n",
      "Run episode 663 with rewards 194.20962547042876 with 467 steps, done\n",
      "Run episode 664 with rewards 238.06700438525826 with 531 steps, done\n",
      "Run episode 665 with rewards 191.02654297457343 with 378 steps, done\n",
      "Run episode 666 with rewards 222.61646220755412 with 419 steps, done\n",
      "Run episode 667 with rewards -241.4104860860518 with 286 steps, done\n",
      "Run episode 668 with rewards 2.180882122599357 with 234 steps, done\n",
      "Run episode 669 with rewards 229.96566185028541 with 437 steps, done\n",
      "Run episode 670 with rewards 219.54709536521932 with 458 steps, done\n",
      "Run episode 671 with rewards -184.97067913062054 with 234 steps, done\n",
      "Run episode 672 with rewards 198.60082498937086 with 392 steps, done\n",
      "Run episode 673 with rewards -248.29777110940586 with 346 steps, done\n",
      "Run episode 674 with rewards -195.02043100663877 with 231 steps, done\n",
      "Run episode 675 with rewards -48.63105862606295 with 279 steps, done\n",
      "Run episode 676 with rewards -172.45187368223884 with 281 steps, done\n",
      "Run episode 677 with rewards 220.88085611706313 with 467 steps, done\n",
      "Run episode 678 with rewards -37.395237935411615 with 266 steps, done\n",
      "Run episode 679 with rewards 6.335606373962108 with 237 steps, done\n",
      "Run episode 680 with rewards -35.979370320076725 with 206 steps, done\n",
      "Run episode 681 with rewards -15.568874388054496 with 227 steps, done\n",
      "Run episode 682 with rewards 228.06655816223196 with 470 steps, done\n",
      "Run episode 683 with rewards 220.94704690832657 with 455 steps, done\n",
      "Run episode 684 with rewards -79.03821505149844 with 320 steps, done\n",
      "Run episode 685 with rewards 19.15372095835363 with 272 steps, done\n",
      "Run episode 686 with rewards 195.5554612744551 with 526 steps, done\n",
      "Run episode 687 with rewards -181.42960250776528 with 260 steps, done\n",
      "Run episode 688 with rewards 176.92132207601992 with 700 steps, done\n",
      "Run episode 689 with rewards -164.78368339240518 with 206 steps, done\n",
      "Run episode 690 with rewards -206.9610488344577 with 314 steps, done\n",
      "Run episode 691 with rewards -33.30056137899345 with 266 steps, done\n",
      "Run episode 692 with rewards -196.05455990945077 with 249 steps, done\n",
      "Run episode 693 with rewards -174.8442089423386 with 240 steps, done\n",
      "Run episode 694 with rewards -44.383149792351276 with 282 steps, done\n",
      "Run episode 695 with rewards -179.7186312401124 with 363 steps, done\n",
      "Run episode 696 with rewards -39.826091058600895 with 244 steps, done\n",
      "Run episode 697 with rewards -30.702688320173436 with 234 steps, done\n",
      "Run episode 698 with rewards 214.56819080556016 with 571 steps, done\n",
      "Run episode 699 with rewards -175.4053907179237 with 230 steps, done\n",
      "Run episode 700 with rewards -226.97498608924818 with 286 steps, done\n",
      "Run episode 701 with rewards -3.4754032541730595 with 238 steps, done\n",
      "Run episode 702 with rewards -197.6070973171376 with 254 steps, done\n",
      "Run episode 703 with rewards -191.09667976487606 with 288 steps, done\n",
      "Run episode 704 with rewards -32.43538701087452 with 242 steps, done\n",
      "Run episode 705 with rewards -227.3696855929551 with 318 steps, done\n",
      "Run episode 706 with rewards -30.698161082394506 with 284 steps, done\n",
      "Run episode 707 with rewards -49.809543787728565 with 221 steps, done\n",
      "Run episode 708 with rewards 228.53565720915063 with 467 steps, done\n",
      "Run episode 709 with rewards 202.2193328130009 with 536 steps, done\n",
      "Run episode 710 with rewards -10.8532598270193 with 205 steps, done\n",
      "Run episode 711 with rewards 231.20480564619368 with 340 steps, done\n",
      "Run episode 712 with rewards -245.91615274515343 with 373 steps, done\n",
      "Run episode 713 with rewards 3.6257525770888606 with 270 steps, done\n",
      "Run episode 714 with rewards -192.18320470727627 with 272 steps, done\n",
      "Run episode 715 with rewards -67.47710185972853 with 270 steps, done\n",
      "Run episode 716 with rewards -76.9654548845243 with 245 steps, done\n",
      "Run episode 717 with rewards -224.5438419545544 with 269 steps, done\n",
      "Run episode 718 with rewards -10.613761264146731 with 259 steps, done\n",
      "Run episode 719 with rewards 221.61248378452729 with 616 steps, done\n",
      "Run episode 720 with rewards -43.68885106609091 with 331 steps, done\n",
      "Run episode 721 with rewards -249.46564900439682 with 400 steps, done\n",
      "Run episode 722 with rewards -24.0893210403476 with 255 steps, done\n",
      "Run episode 723 with rewards 264.88300981471997 with 390 steps, done\n",
      "Run episode 724 with rewards -18.790613677446828 with 224 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 725 with rewards 172.44123879730031 with 785 steps, done\n",
      "Run episode 726 with rewards -26.922868708105668 with 190 steps, done\n",
      "Run episode 727 with rewards -147.86345375399821 with 288 steps, done\n",
      "Run episode 728 with rewards 259.1021906359449 with 328 steps, done\n",
      "Run episode 729 with rewards -213.17003930817543 with 215 steps, done\n",
      "Run episode 730 with rewards -57.18403018439807 with 372 steps, done\n",
      "Run episode 731 with rewards -202.55730472690647 with 277 steps, done\n",
      "Run episode 732 with rewards 228.45101483626357 with 387 steps, done\n",
      "Run episode 733 with rewards -200.10820555177668 with 312 steps, done\n",
      "Run episode 734 with rewards 206.23872366312202 with 378 steps, done\n",
      "Run episode 735 with rewards -5.871011426676333 with 250 steps, done\n",
      "Run episode 736 with rewards -240.05775229227888 with 373 steps, done\n",
      "Run episode 737 with rewards -204.3905082800331 with 301 steps, done\n",
      "Run episode 738 with rewards 250.04181091160197 with 426 steps, done\n",
      "Run episode 739 with rewards -225.1695121900506 with 311 steps, done\n",
      "Run episode 740 with rewards -63.812011547874505 with 273 steps, done\n",
      "Run episode 741 with rewards 37.62967329889614 with 242 steps, done\n",
      "Run episode 742 with rewards -188.79558160196908 with 245 steps, done\n",
      "Run episode 743 with rewards -229.50155613278548 with 370 steps, done\n",
      "Run episode 744 with rewards -248.1732695689629 with 348 steps, done\n",
      "Run episode 745 with rewards 34.11991572293823 with 273 steps, done\n",
      "Run episode 746 with rewards -15.50843956377436 with 181 steps, done\n",
      "Run episode 747 with rewards -33.32989533381365 with 291 steps, done\n",
      "Run episode 748 with rewards -34.86801399280047 with 244 steps, done\n",
      "Run episode 749 with rewards 238.64573386461493 with 367 steps, done\n",
      "Run episode 750 with rewards -2.2358160998651186 with 178 steps, done\n",
      "Run episode 751 with rewards -25.019960381111616 with 181 steps, done\n",
      "Run episode 752 with rewards -203.86860214045092 with 294 steps, done\n",
      "Run episode 753 with rewards 231.01555845865747 with 416 steps, done\n",
      "Run episode 754 with rewards -40.26239103444354 with 297 steps, done\n",
      "Run episode 755 with rewards 227.91741027201397 with 351 steps, done\n",
      "Run episode 756 with rewards -43.410695516252304 with 162 steps, done\n",
      "Run episode 757 with rewards 254.77019578544127 with 310 steps, done\n",
      "Run episode 758 with rewards -206.6779202102382 with 220 steps, done\n",
      "Run episode 759 with rewards -226.88001876786967 with 335 steps, done\n",
      "Run episode 760 with rewards -180.45576753511222 with 235 steps, done\n",
      "Run episode 761 with rewards -185.87418272804217 with 246 steps, done\n",
      "Run episode 762 with rewards -5.936380210635107 with 245 steps, done\n",
      "Run episode 763 with rewards -235.99292202319856 with 303 steps, done\n",
      "Run episode 764 with rewards -25.02700274326466 with 248 steps, done\n",
      "Run episode 765 with rewards -202.68199902256356 with 237 steps, done\n",
      "Run episode 766 with rewards -12.371624441953372 with 225 steps, done\n",
      "Run episode 767 with rewards 238.3419063757041 with 357 steps, done\n",
      "Run episode 768 with rewards 224.68092083282193 with 472 steps, done\n",
      "Run episode 769 with rewards -244.4837324115314 with 310 steps, done\n",
      "Run episode 770 with rewards 217.47367106890437 with 382 steps, done\n",
      "Run episode 771 with rewards -136.7623139343912 with 228 steps, done\n",
      "Run episode 772 with rewards -232.24082671919675 with 409 steps, done\n",
      "Run episode 773 with rewards 149.88444837641896 with 575 steps, done\n",
      "Run episode 774 with rewards -42.98761429788023 with 338 steps, done\n",
      "Run episode 775 with rewards -41.13976554248894 with 241 steps, done\n",
      "Run episode 776 with rewards 5.754914191178301 with 248 steps, done\n",
      "Run episode 777 with rewards 246.79805751635698 with 372 steps, done\n",
      "Run episode 778 with rewards -227.3768365045839 with 246 steps, done\n",
      "Run episode 779 with rewards 246.59341380113182 with 371 steps, done\n",
      "Run episode 780 with rewards 192.64520974309843 with 661 steps, done\n",
      "Run episode 781 with rewards -228.91678499709548 with 229 steps, done\n",
      "Run episode 782 with rewards 253.9958446195419 with 369 steps, done\n",
      "Run episode 783 with rewards -177.45836362127127 with 279 steps, done\n",
      "Run episode 784 with rewards -46.9154364490597 with 297 steps, done\n",
      "Run episode 785 with rewards -231.25280440392245 with 236 steps, done\n",
      "Run episode 786 with rewards -21.567747213092034 with 229 steps, done\n",
      "Run episode 787 with rewards 193.3310166515304 with 459 steps, done\n",
      "Run episode 788 with rewards -19.025520192826022 with 189 steps, done\n",
      "Run episode 789 with rewards 163.52445238152353 with 475 steps, done\n",
      "Run episode 790 with rewards -24.72791487489721 with 237 steps, done\n",
      "Run episode 791 with rewards -8.393087399904502 with 279 steps, done\n",
      "Run episode 792 with rewards 223.86855886622993 with 377 steps, done\n",
      "Run episode 793 with rewards -45.76297316979431 with 206 steps, done\n",
      "Run episode 794 with rewards -1.3221821726432097 with 233 steps, done\n",
      "Run episode 795 with rewards 172.4009035218496 with 386 steps, done\n",
      "Run episode 796 with rewards -196.46073019667958 with 268 steps, done\n",
      "Run episode 797 with rewards -16.73455070473466 with 275 steps, done\n",
      "Run episode 798 with rewards 259.6658729391149 with 350 steps, done\n",
      "Run episode 799 with rewards 273.66057957087855 with 322 steps, done\n",
      "Run episode 800 with rewards 290.3155392558566 with 334 steps, done\n",
      "Run episode 801 with rewards -42.48712121804752 with 236 steps, done\n",
      "Run episode 802 with rewards 243.6664138381372 with 421 steps, done\n"
     ]
    }
   ],
   "source": [
    "opt1 = torch.optim.AdamW(value_func.parameters(), lr=0.0005)\n",
    "opt2 = torch.optim.AdamW(actor_func.parameters(), lr=0.0003)\n",
    "\n",
    "def pick_sample(s):\n",
    "    with torch.no_grad():\n",
    "        #   --> size : (1, 4)\n",
    "        s_batch = np.expand_dims(s, axis=0)\n",
    "        s_batch = torch.tensor(s_batch, dtype=torch.float).to(device)\n",
    "        # Get logits from state\n",
    "        #   --> size : (1, 2)\n",
    "        logits = actor_func(s_batch)\n",
    "        #   --> size : (2)\n",
    "        logits = logits.squeeze(dim=0)\n",
    "        # From logits to probabilities\n",
    "        probs = F.softmax(logits, dim=-1)\n",
    "        # Pick up action's sample\n",
    "#         print(probs, end=', ')\n",
    "        a = torch.multinomial(probs, num_samples=1)\n",
    "        # Return\n",
    "        return a.tolist()[0]\n",
    "reward_records = []\n",
    "for i in range(nn_actor_train_iterations):\n",
    "    #\n",
    "    # Run episode till done\n",
    "    #\n",
    "    done = False\n",
    "    states_list = []\n",
    "    actions_list = []\n",
    "    rewards_list = []\n",
    "    s, _ = env.reset(seed=np.random.randint(0, 1e6))\n",
    "    old_s = s\n",
    "#     s=one_hot_state(s)\n",
    "    num_steps=0\n",
    "    total_reward = 0\n",
    "    while not done:\n",
    "        states_list.append(s)\n",
    "        a = pick_sample(s)\n",
    "        s0, r, term, trunc, _ = env.step(a)\n",
    "#         if s0==old_s:\n",
    "#             r=-10\n",
    "        old_s = s0\n",
    "#         s=one_hot_state(s0)\n",
    "#         ss = position_to_index(s0)\n",
    "        s=s0\n",
    "        ss = s0\n",
    "        done = term or trunc\n",
    "        actions_list.append(a)\n",
    "        rewards_list.append(r)\n",
    "        total_reward += r\n",
    "        num_steps+=1\n",
    "        # if (num_steps+1) % 100 == 0:\n",
    "        #     print(num_steps, end=', ')\n",
    "#         print(ss, end='\\r')\n",
    "#         print(i, s, num_steps, end='\\r')\n",
    "        #\n",
    "        # Get cumulative rewards\n",
    "        #\n",
    "        # print()\n",
    "    if done:\n",
    "        if not term: \n",
    "            print(\"Run episode {} with rewards {} with {} steps\".format(i, total_reward, num_steps))#, end=\"\\r\")\n",
    "    #         continue\n",
    "        else:\n",
    "            print(\"Run episode {} with rewards {} with {} steps, done\".format(i, total_reward, num_steps))#, end=\"\\r\")\n",
    "    if (num_steps+1)%1000==0 or term: \n",
    "        cum_rewards = np.zeros_like(rewards_list)\n",
    "        reward_len = len(rewards_list)\n",
    "        states = torch.tensor(np.array(states_list), dtype=torch.float).to(device)\n",
    "        value_s = value_func(states)\n",
    "        states_next = torch.tensor(np.array(states_list[1:]+[s]), dtype=torch.float).to(device)\n",
    "        value_next_s = value_func(states_next)\n",
    "        if term:\n",
    "            value_next_s[-1]=0.0\n",
    "        for j in reversed(range(reward_len)):\n",
    "            cum_rewards[j] = rewards_list[j] + (value_next_s[j]*gamma if j+1 < reward_len else 0)\n",
    "    #     cum_rewards = (cum_rewards-cum_rewards.mean())/(cum_rewards.std()+1e-6)\n",
    "        #\n",
    "        # Train (optimize parameters)\n",
    "        #\n",
    "    #     print(states_list)\n",
    "        # Optimize value loss (Critic)\n",
    "        opt1.zero_grad()\n",
    "        \n",
    "        cum_rewards = torch.tensor(cum_rewards, dtype=torch.float).to(device)\n",
    "        values = value_func(states)\n",
    "        values = values.squeeze(dim=1)\n",
    "        vf_loss = F.mse_loss(\n",
    "            values,\n",
    "            cum_rewards,\n",
    "            reduction=\"none\")\n",
    "        vf_loss.sum().backward()\n",
    "        opt1.step()\n",
    "\n",
    "        # Todo 2; RULE BASED UPDATES\n",
    "        with torch.no_grad():\n",
    "            values = value_func(states).squeeze(dim=1)\n",
    "        opt2.zero_grad()\n",
    "        actions = torch.tensor(actions_list, dtype=torch.int64).to(device)\n",
    "        advantages = cum_rewards - values\n",
    "    #     print(advantages)\n",
    "        logits = actor_func(states)\n",
    "        log_probs = -F.cross_entropy(logits, actions, reduction=\"none\")\n",
    "        pi_loss = -log_probs * advantages\n",
    "        pi_loss.sum().backward()\n",
    "        opt2.step()\n",
    "        states_list = []\n",
    "        actions_list = []\n",
    "        rewards_list = []\n",
    "    # Output total rewards in episode (max 500)\n",
    "    \n",
    "    reward_records.append(total_reward)\n",
    "    if np.average(reward_records[-5:])>200:\n",
    "        break\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "id": "7d028b71",
   "metadata": {},
   "outputs": [],
   "source": [
    "# 1/0\n",
    "import copy\n",
    "actor = ActorRule()\n",
    "critic = copy.deepcopy(value_func)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "id": "73589768",
   "metadata": {},
   "outputs": [],
   "source": [
    "def softmax(logits):\n",
    "    exp_logits = np.exp(logits)\n",
    "    sum_logits = np.sum(exp_logits)\n",
    "    return (exp_logits / sum_logits).reshape([-1])\n",
    "\n",
    "def pick_sample(s):\n",
    "    with torch.no_grad():\n",
    "        s_batch = np.expand_dims(s, axis=0)\n",
    "        logits = actor(pd.DataFrame(s_batch, columns=column_names))\n",
    "        probs = softmax(logits)\n",
    "        a = torch.multinomial(torch.tensor(probs), num_samples=1)\n",
    "        return a.tolist()[0]\n",
    "\n",
    "\n",
    "def train():\n",
    "    reward_records = []\n",
    "    best_rewards = -10000000000\n",
    "    # best_model = None\n",
    "    for i in range(rule_actor_train_iterations):\n",
    "        done = False\n",
    "        states_list_one = []\n",
    "        states_list = []\n",
    "        actions_list = []\n",
    "        rewards_list = []\n",
    "        s0, _ = env.reset(seed=np.random.randint(0, 1e6))\n",
    "        old_s = s0\n",
    "        s=s0 #position_to_index(s0)\n",
    "        sh = s0 #one_hot_state(s0)\n",
    "#         print('start',s)\n",
    "        num_steps=0\n",
    "        total_reward = 0\n",
    "        while not done:\n",
    "            states_list.append(s)\n",
    "            states_list_one.append(sh)\n",
    "            a = pick_sample(s)\n",
    "            s0, r, term, trunc, _ = env.step(a)\n",
    "#             if s0==old_s:\n",
    "#                 r=-10\n",
    "            old_s=s0\n",
    "            s= s0 #position_to_index(s0)\n",
    "#             print(s, end='\\r')\n",
    "            sh = s0 # one_hot_state(s0)\n",
    "            done = term or trunc\n",
    "            actions_list.append(a)\n",
    "            rewards_list.append(r)\n",
    "            total_reward += r\n",
    "            num_steps+=1\n",
    "#         print('============', i, '===========')\n",
    "#         print(len(actions), 'actions', actions)\n",
    "        acts=np.array(actions_list)\n",
    "#         if not((num_steps+1)%250==0 or done or num_steps+1>=1000):\n",
    "#             continue\n",
    "#         if term or num_steps+1>=1000:\n",
    "        if term:\n",
    "            print(\"Run episode {} with rewards {} with {} steps, done\".format(i, total_reward, num_steps))        \n",
    "        else:\n",
    "            print(\"Run episode {} with rewards {} with {} steps\".format(i, total_reward, num_steps))  \n",
    "#         if not (num_steps+1)%250==0:\n",
    "\n",
    "        cum_rewards = np.zeros_like(rewards_list)\n",
    "        reward_len = len(rewards_list)\n",
    "        states_oh = torch.tensor(np.array(states_list_one), dtype=torch.float).to(device)\n",
    "        value_s = critic(states_oh)\n",
    "        states_oh_next = torch.tensor(np.array(states_list_one[1:]+[sh]), dtype=torch.float).to(device)\n",
    "        value_next_s = critic(states_oh_next)\n",
    "#             print(reward_len, end=', ')\n",
    "        if term: \n",
    "            value_next_s[-1]=0.0\n",
    "        for j in reversed(range(reward_len)):\n",
    "            cum_rewards[j] = rewards_list[j] + (value_next_s[j + 1] * gamma if j + 1 < reward_len else 0)\n",
    "#             cum_rewards = (cum_rewards-cum_rewards.mean())/(cum_rewards.std()+1e-6)\n",
    "        #\n",
    "        # Train (optimize parameters)\n",
    "        #\n",
    "        # Optimize value loss (Critic)\n",
    "        critic_optimizer.zero_grad()\n",
    "        cum_rewards = torch.tensor(cum_rewards, dtype=torch.float).to(device)\n",
    "        values = critic(states_oh)\n",
    "        values = values.squeeze(dim=1)\n",
    "#             print(values.shape)\n",
    "        vf_loss = F.mse_loss(\n",
    "            values,\n",
    "            cum_rewards,\n",
    "            reduction=\"none\")\n",
    "        vf_loss.sum().backward()\n",
    "        critic_optimizer.step()\n",
    "\n",
    "        reward_records.append(total_reward)\n",
    "#                                                                            sum(rewards)))  # , end=\"\\r\")\n",
    "        with torch.no_grad():\n",
    "            values = critic(states_oh).squeeze(dim=1)\n",
    "#         states = torch.tensor(np.array(states_list), dtype=torch.float).to(device)\n",
    "        actions = torch.tensor(actions_list, dtype=torch.int64).to(device)\n",
    "        advantages = cum_rewards - values\n",
    "        states_array = np.array(states_list)\n",
    "        x = pd.DataFrame(states_array, columns=column_names)\n",
    "        y = pd.Series(actions.cpu().detach().numpy())\n",
    "#         advantages = (advantages-advantages.mean())/advantages.std()\n",
    "        adv = pd.Series(advantages.cpu().detach().numpy())\n",
    "        outputs = actor(x).T\n",
    "        # print('adv', advantages.cpu().detach().numpy())\n",
    "        # print('outputs', outputs.tolist())\n",
    "        for j in range(len(actor.model)):\n",
    "            m = actor.model[j]\n",
    "            masks = np.ones_like(outputs, dtype=bool)\n",
    "            masks[:, j] = False\n",
    "            other_values = outputs[masks].reshape(-1, outputs.shape[1] - 1)\n",
    "\n",
    "            if len(m.rules_) == 0:\n",
    "                m.fit(x, y, adv, other_values, j)\n",
    "            else:\n",
    "                for _ in range(1):\n",
    "                    update_rules(m, x, y, adv, other_values, j)\n",
    "        states_list = []\n",
    "        actions_list = []\n",
    "        states_list_one = []\n",
    "        rewards_list = []\n",
    "#         if i >= 0:# and not np.all(acts==acts[0]):\n",
    "        if total_reward >= best_rewards:\n",
    "            best_rewards = total_reward\n",
    "            for rr in range(actor.action_space):\n",
    "                rules = []\n",
    "                for n in range(len(actor.model[rr].rules_)):\n",
    "                    rule = actor.model[rr].rules_[n]\n",
    "                    rules.append(Rule(q=rule.q, y=rule.y))\n",
    "                actor.best_model[rr].rules_ = AdditiveRuleEnsemble(rules)\n",
    "            print('best')\n",
    "        if np.average(reward_records[-5:]) > 200:\n",
    "            break\n",
    "        #     else:\n",
    "        #         for rr in range(actor.action_space):\n",
    "        #             rules = []\n",
    "        #             for n in range(len(actor.best_model[rr].rules_)):\n",
    "        #                 rule = actor.best_model[rr].rules_[n]\n",
    "        #                 rules.append(Rule(q=rule.q, y=rule.y))\n",
    "        #             actor.model[rr].rules_ = AdditiveRuleEnsemble(rules)\n",
    "        #         print('')\n",
    "\n",
    "        #\n",
    "        # Todo 2; RULE BASED UPDATES\n",
    "        \n",
    "#         for i in range(4):\n",
    "#             print(\"--------------\\n{}\".format(actor.model[i].rules_))\n",
    "        # print(\n",
    "        #     \"{}\\n--------------\\n{}\\nRun episode {} with rewards {}\".format(actor.model[0].rules_,\n",
    "        #                                                                     actor.model[1].rules_,\n",
    "        #                                                                     i,\n",
    "        #                                                                     sum(rewards)))  # , end=\"\\r\")\n",
    "        \n",
    "    print(\"\\nDone\")\n",
    "    env.close()\n",
    "    return reward_records"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "id": "b411aa5d",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Simulation Progress [Episode 201]: 100%|█| 100/100 [00:02<00:00, 34.16%/s, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 202: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 202 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 0 with rewards -2447119.721574934 with 1440 steps00, 87.41%/s, 100% \n",
      "bestlation Progress [Episode 202]: 100%|█| 100/100 [00:19<00:00, 87.41%/s, 100% \n",
      "Simulation Progress [Episode 202]: 100%|█| 100/100 [11:19<00:00,  6.79s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 203: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 203 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 1 with rewards -1909169.1312731344 with 1440 steps0,  1.31s/%, 100% \n",
      "best\n",
      "Simulation Progress [Episode 203]: 100%|█| 100/100 [02:52<00:00,  1.72s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 204: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 204 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 2 with rewards -1224568.667720431 with 1440 steps00,  1.32s/%, 100% \n",
      "best\n",
      "Simulation Progress [Episode 204]: 100%|█| 100/100 [02:51<00:00,  1.72s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 205: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 205 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 3 with rewards -1916957.3455820982 with 1440 steps0,  1.27s/%, 100% \n",
      "Simulation Progress [Episode 205]: 100%|█| 100/100 [02:48<00:00,  1.68s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 206: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 206 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 4 with rewards -1358758.0020844222 with 1440 steps0,  1.27s/%, 100% \n",
      "Simulation Progress [Episode 206]: 100%|█| 100/100 [02:48<00:00,  1.69s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 207: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 207 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 5 with rewards -1973293.1505527168 with 1440 steps0,  1.27s/%, 100% \n",
      "Simulation Progress [Episode 207]: 100%|█| 100/100 [02:47<00:00,  1.68s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 208: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 208 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 6 with rewards -1842209.147779301 with 1440 steps00,  1.29s/%, 100% \n",
      "Simulation Progress [Episode 208]: 100%|█| 100/100 [02:50<00:00,  1.70s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 209: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 209 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 7 with rewards -3021548.3761594957 with 1440 steps0,  1.28s/%, 100% \n",
      "Simulation Progress [Episode 209]: 100%|█| 100/100 [02:50<00:00,  1.70s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 210: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 210 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 8 with rewards -1707898.6547012427 with 1440 steps0,  1.29s/%, 100% \n",
      "Simulation Progress [Episode 210]: 100%|█| 100/100 [02:49<00:00,  1.70s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 211: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 211 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 9 with rewards -2892697.148155452 with 1440 steps00,  1.27s/%, 100% \n",
      "Simulation Progress [Episode 211]: 100%|█| 100/100 [02:48<00:00,  1.69s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 212: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 212 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 10 with rewards -1810145.3635994121 with 1440 steps,  1.26s/%, 100% \n",
      "Simulation Progress [Episode 212]: 100%|█| 100/100 [02:46<00:00,  1.67s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 213: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 213 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 11 with rewards -2145893.2239632015 with 1440 steps,  1.35s/%, 100% \n",
      "Simulation Progress [Episode 213]: 100%|█| 100/100 [02:59<00:00,  1.79s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 214: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 214 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 12 with rewards -1632755.834565517 with 1440 steps0,  1.37s/%, 100% \n",
      "Simulation Progress [Episode 214]: 100%|█| 100/100 [03:01<00:00,  1.82s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 215: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 215 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 13 with rewards -1501277.0064945838 with 1440 steps,  1.24s/%, 100% \n",
      "Simulation Progress [Episode 215]: 100%|█| 100/100 [02:45<00:00,  1.65s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 216: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 216 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 14 with rewards -1648877.190116013 with 1440 steps0,  1.23s/%, 100% \n",
      "Simulation Progress [Episode 216]: 100%|█| 100/100 [02:44<00:00,  1.65s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 217: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 217 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 15 with rewards -2044660.5739301573 with 1440 steps,  1.24s/%, 100% \n",
      "Simulation Progress [Episode 217]: 100%|█| 100/100 [02:44<00:00,  1.65s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 218: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 218 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 16 with rewards -1558897.2370247657 with 1440 steps,  1.25s/%, 100% \n",
      "Simulation Progress [Episode 218]: 100%|█| 100/100 [02:44<00:00,  1.65s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 219: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 219 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 17 with rewards -1948766.9040755203 with 1440 steps,  1.24s/%, 100% \n",
      "Simulation Progress [Episode 219]: 100%|█| 100/100 [02:45<00:00,  1.66s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 220: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 220 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 18 with rewards -1430856.284730146 with 1440 steps0,  1.23s/%, 100% \n",
      "Simulation Progress [Episode 220]: 100%|█| 100/100 [02:45<00:00,  1.65s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 221: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 221 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 19 with rewards -1891964.5704747455 with 1440 steps,  1.24s/%, 100% \n",
      "Simulation Progress [Episode 221]: 100%|█| 100/100 [02:44<00:00,  1.64s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 222: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 222 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 20 with rewards -1532941.8352557274 with 1440 steps,  1.23s/%, 100% \n",
      "Simulation Progress [Episode 222]: 100%|█| 100/100 [02:44<00:00,  1.64s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 223: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 223 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 21 with rewards -2017990.825430776 with 1440 steps0,  1.21s/%, 100% \n",
      "Simulation Progress [Episode 223]: 100%|█| 100/100 [02:43<00:00,  1.63s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 224: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 224 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 22 with rewards -1498328.2480189735 with 1440 steps,  1.17s/%, 100% \n",
      "Simulation Progress [Episode 224]: 100%|█| 100/100 [02:39<00:00,  1.59s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 225: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 225 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 23 with rewards -2241196.1045821235 with 1440 steps,  1.15s/%, 100% \n",
      "Simulation Progress [Episode 225]: 100%|█| 100/100 [02:35<00:00,  1.56s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 226: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 226 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 24 with rewards -1589268.8214191403 with 1440 steps,  1.15s/%, 100% \n",
      "Simulation Progress [Episode 226]: 100%|█| 100/100 [02:35<00:00,  1.55s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 227: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 227 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 25 with rewards -1918123.864764696 with 1440 steps0,  1.15s/%, 100% \n",
      "Simulation Progress [Episode 227]: 100%|█| 100/100 [02:35<00:00,  1.55s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 228: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 228 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 26 with rewards -1838374.1204716263 with 1440 steps,  1.14s/%, 100% \n",
      "Simulation Progress [Episode 228]: 100%|█| 100/100 [02:35<00:00,  1.55s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 229: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 229 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 27 with rewards -1924696.2168723291 with 1440 steps,  1.15s/%, 100% \n",
      "Simulation Progress [Episode 229]: 100%|█| 100/100 [02:35<00:00,  1.55s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 230: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 230 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 28 with rewards -1606578.9801534016 with 1440 steps,  1.16s/%, 100% \n",
      "Simulation Progress [Episode 230]: 100%|█| 100/100 [02:36<00:00,  1.57s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 231: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 231 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 29 with rewards -2052399.2638519893 with 1440 steps,  1.25s/%, 100% \n",
      "Simulation Progress [Episode 231]: 100%|█| 100/100 [02:49<00:00,  1.70s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 232: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 232 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 30 with rewards -1612280.8169074403 with 1440 steps,  1.25s/%, 100% \n",
      "Simulation Progress [Episode 232]: 100%|█| 100/100 [02:50<00:00,  1.70s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 233: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 233 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 31 with rewards -1931339.9906714868 with 1440 steps,  1.25s/%, 100% \n",
      "Simulation Progress [Episode 233]: 100%|█| 100/100 [02:50<00:00,  1.70s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 234: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 234 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 32 with rewards -1655784.5430307623 with 1440 steps,  1.27s/%, 100% \n",
      "Simulation Progress [Episode 234]: 100%|█| 100/100 [02:51<00:00,  1.72s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 235: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 235 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 33 with rewards -1961936.5102411276 with 1440 steps,  1.27s/%, 100% \n",
      "Simulation Progress [Episode 235]: 100%|█| 100/100 [02:52<00:00,  1.72s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 236: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 236 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 34 with rewards -1600199.7633640785 with 1440 steps,  1.30s/%, 100% \n",
      "Simulation Progress [Episode 236]: 100%|█| 100/100 [02:54<00:00,  1.75s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 237: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 237 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 35 with rewards -1901622.293818299 with 1440 steps0,  1.30s/%, 100% \n",
      "Simulation Progress [Episode 237]: 100%|█| 100/100 [02:54<00:00,  1.75s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 238: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 238 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 36 with rewards -2685761.20010585 with 1440 steps00,  1.30s/%, 100% \n",
      "Simulation Progress [Episode 238]: 100%|█| 100/100 [02:54<00:00,  1.74s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 239: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 239 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 37 with rewards -1976318.521800029 with 1440 steps0,  1.29s/%, 100% \n",
      "Simulation Progress [Episode 239]: 100%|█| 100/100 [02:53<00:00,  1.74s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 240: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 240 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 38 with rewards -1725856.9684125017 with 1440 steps,  1.30s/%, 100% \n",
      "Simulation Progress [Episode 240]: 100%|█| 100/100 [02:54<00:00,  1.75s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 241: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 241 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 39 with rewards -2280038.856791893 with 1440 steps0,  1.30s/%, 100% \n",
      "Simulation Progress [Episode 241]: 100%|█| 100/100 [02:54<00:00,  1.75s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 242: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 242 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 40 with rewards -1573664.6725527758 with 1440 steps,  1.30s/%, 100% \n",
      "Simulation Progress [Episode 242]: 100%|█| 100/100 [02:55<00:00,  1.76s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 243: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 243 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 41 with rewards -1990795.3180323585 with 1440 steps,  1.33s/%, 100% \n",
      "Simulation Progress [Episode 243]: 100%|█| 100/100 [02:56<00:00,  1.77s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 244: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 244 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 42 with rewards -1457989.6600046153 with 1440 steps,  1.31s/%, 100% \n",
      "Simulation Progress [Episode 244]: 100%|█| 100/100 [02:56<00:00,  1.76s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 245: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 245 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 43 with rewards -1912417.7014134282 with 1440 steps,  1.30s/%, 100% \n",
      "Simulation Progress [Episode 245]: 100%|█| 100/100 [02:55<00:00,  1.75s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 246: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 246 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 44 with rewards -1685350.0647269313 with 1440 steps,  1.30s/%, 100% \n",
      "Simulation Progress [Episode 246]: 100%|█| 100/100 [02:55<00:00,  1.75s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 247: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 247 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 45 with rewards -2163838.277827226 with 1440 steps0,  1.30s/%, 100% \n",
      "Simulation Progress [Episode 247]: 100%|█| 100/100 [02:54<00:00,  1.74s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 248: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 248 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 46 with rewards -1646846.1250367165 with 1440 steps,  1.30s/%, 100% \n",
      "Simulation Progress [Episode 248]: 100%|█| 100/100 [02:55<00:00,  1.75s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 249: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 249 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 47 with rewards -2033865.5762567883 with 1440 steps,  1.31s/%, 100% \n",
      "Simulation Progress [Episode 249]: 100%|█| 100/100 [02:55<00:00,  1.76s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 250: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 250 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 48 with rewards -2025161.8874596087 with 1440 steps,  1.30s/%, 100% \n",
      "Simulation Progress [Episode 250]: 100%|█| 100/100 [02:54<00:00,  1.74s/%, 100% \n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 251: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 251 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n",
      "Run episode 49 with rewards -1634641.7587382148 with 1440 steps,  1.22s/%, 100% \n",
      "\n",
      "Done\n",
      "Simulation Progress [Episode 251]: 100%|█| 100/100 [02:46<00:00,  1.66s/%, 100% \n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Environment closed. [demo-v1]\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 242 with rewards -704.6498548031452 with 73 steps, done\n",
      "Run episode 243 with rewards -673.6535944495264 with 159 steps, done\n",
      "Run episode 244 with rewards -127.59144526898623 with 61 steps, done\n",
      "Run episode 245 with rewards -628.3553781722525 with 69 steps, done\n",
      "Run episode 246 with rewards -495.5276226002726 with 78 steps, done\n",
      "Run episode 247 with rewards -924.3431592753565 with 83 steps, done\n",
      "Run episode 248 with rewards -503.89582873309314 with 92 steps, done\n",
      "Run episode 249 with rewards -258.78173981880866 with 75 steps, done\n",
      "Run episode 250 with rewards -802.1072673751358 with 76 steps, done\n",
      "Run episode 251 with rewards -272.92544098768315 with 94 steps, done\n",
      "Run episode 252 with rewards -527.1391083329909 with 63 steps, done\n",
      "Run episode 253 with rewards -202.6219810320853 with 81 steps, done\n",
      "Run episode 254 with rewards -677.5815972915271 with 78 steps, done\n",
      "Run episode 255 with rewards -147.82618798829122 with 76 steps, done\n",
      "Run episode 256 with rewards -656.6679332498876 with 112 steps, done\n",
      "Run episode 257 with rewards -118.61189769325154 with 92 steps, done\n",
      "Run episode 258 with rewards -951.7963514159732 with 120 steps, done\n",
      "Run episode 259 with rewards -387.6517839010388 with 85 steps, done\n",
      "Run episode 260 with rewards -845.8451143700247 with 128 steps, done\n",
      "Run episode 261 with rewards -671.0302829672293 with 78 steps, done\n",
      "Run episode 262 with rewards -231.73052485706933 with 63 steps, done\n",
      "Run episode 263 with rewards -510.97132925029206 with 142 steps, done\n",
      "Run episode 264 with rewards -392.8530411947383 with 47 steps, done\n",
      "Run episode 265 with rewards -464.2082618678245 with 93 steps, done\n",
      "Run episode 266 with rewards -173.65403799138232 with 53 steps, done\n",
      "Run episode 267 with rewards -618.9685649044412 with 108 steps, done\n",
      "Run episode 268 with rewards -762.9568331207629 with 105 steps, done\n",
      "Run episode 269 with rewards -139.78287251777533 with 57 steps, done\n",
      "Run episode 270 with rewards -1328.5955434773325 with 176 steps, done\n",
      "Run episode 271 with rewards -122.82032372258097 with 92 steps, done\n",
      "Run episode 272 with rewards -697.395283633233 with 143 steps, done\n",
      "Run episode 273 with rewards -116.55131488990354 with 83 steps, done\n",
      "Run episode 274 with rewards -238.51665740746364 with 202 steps, done\n",
      "Run episode 275 with rewards -161.68274348690682 with 50 steps, done\n",
      "Run episode 276 with rewards -551.2838746767313 with 59 steps, done\n",
      "Run episode 277 with rewards -200.6215422937286 with 129 steps, done\n",
      "Run episode 278 with rewards -710.316302169485 with 109 steps, done\n",
      "Run episode 279 with rewards -720.4993298390816 with 89 steps, done\n",
      "Run episode 280 with rewards -1214.8474551721922 with 157 steps, done\n",
      "Run episode 281 with rewards -780.9442731554161 with 76 steps, done\n",
      "Run episode 282 with rewards -553.2271459632425 with 82 steps, done\n",
      "Run episode 283 with rewards -163.44433177838886 with 57 steps, done\n",
      "Run episode 284 with rewards -691.4373433010503 with 87 steps, done\n",
      "Run episode 285 with rewards -97.97824598969787 with 75 steps, done\n",
      "Run episode 286 with rewards -607.439743836512 with 96 steps, done\n",
      "Run episode 287 with rewards -264.63073671299594 with 79 steps, done\n",
      "Run episode 288 with rewards -523.5453416660723 with 77 steps, done\n",
      "Run episode 289 with rewards -170.25054873586578 with 68 steps, done\n",
      "Run episode 290 with rewards -544.525718929973 with 83 steps, done\n",
      "Run episode 291 with rewards -658.8591008616054 with 88 steps, done\n",
      "Run episode 292 with rewards -130.0266330654886 with 65 steps, done\n",
      "Run episode 293 with rewards -388.84410043450646 with 102 steps, done\n",
      "Run episode 294 with rewards -110.48056893638613 with 53 steps, done\n",
      "Run episode 295 with rewards -343.5895471167844 with 83 steps, done\n",
      "Run episode 296 with rewards -623.076375593057 with 113 steps, done\n",
      "Run episode 297 with rewards -791.3605286792139 with 75 steps, done\n",
      "Run episode 298 with rewards -491.4904007211435 with 73 steps, done\n",
      "Run episode 299 with rewards -140.3286962989198 with 76 steps, done\n",
      "Run episode 300 with rewards -90.50685334299732 with 98 steps, done\n",
      "Run episode 301 with rewards -729.0548166214579 with 115 steps, done\n",
      "Run episode 302 with rewards -176.39304043464787 with 67 steps, done\n",
      "Run episode 303 with rewards -879.5556027964114 with 128 steps, done\n",
      "Run episode 304 with rewards -418.8823471866229 with 54 steps, done\n",
      "Run episode 305 with rewards -555.7775637942782 with 84 steps, done\n",
      "Run episode 306 with rewards -430.6419025855995 with 85 steps, done\n",
      "Run episode 307 with rewards -522.7841943954124 with 102 steps, done\n",
      "Run episode 308 with rewards -152.1043622026301 with 77 steps, done\n",
      "Run episode 309 with rewards -1148.670144740428 with 358 steps, done\n",
      "Run episode 310 with rewards -433.29023372037295 with 72 steps, done\n",
      "Run episode 311 with rewards -104.4440170193288 with 58 steps, done\n",
      "Run episode 312 with rewards -339.5769872115924 with 50 steps, done\n",
      "Run episode 313 with rewards -519.7071702969154 with 85 steps, done\n",
      "Run episode 314 with rewards -555.9142441492285 with 61 steps, done\n",
      "Run episode 315 with rewards -809.7282965072462 with 78 steps, done\n",
      "Run episode 316 with rewards -253.8740746038218 with 70 steps, done\n",
      "Run episode 317 with rewards -501.5217011011507 with 57 steps, done\n",
      "Run episode 318 with rewards -268.60114822347515 with 80 steps, done\n",
      "Run episode 319 with rewards -623.4081863398271 with 65 steps, done\n",
      "Run episode 320 with rewards -148.42953116642133 with 66 steps, done\n",
      "Run episode 321 with rewards -88.93188347516264 with 88 steps, done\n",
      "Run episode 322 with rewards -88.62668757928049 with 53 steps, done\n",
      "Run episode 323 with rewards -543.4910033687468 with 62 steps, done\n",
      "Run episode 324 with rewards -646.9607651227402 with 100 steps, done\n",
      "Run episode 325 with rewards -826.6927696726468 with 80 steps, done\n",
      "Run episode 326 with rewards -457.8196741772067 with 65 steps, done\n",
      "Run episode 327 with rewards -566.8725083570696 with 66 steps, done\n",
      "Run episode 328 with rewards -590.0181375875131 with 85 steps, done\n",
      "Run episode 329 with rewards -350.036020129992 with 50 steps, done\n",
      "Run episode 330 with rewards -284.28084928089197 with 106 steps, done\n",
      "Run episode 331 with rewards -710.5987157317113 with 130 steps, done\n",
      "Run episode 332 with rewards -497.1931986215829 with 67 steps, done\n",
      "Run episode 333 with rewards -55.366252406627545 with 72 steps, done\n",
      "Run episode 334 with rewards -574.5721617886097 with 74 steps, done\n",
      "Run episode 335 with rewards -126.27920144439638 with 68 steps, done\n",
      "Run episode 336 with rewards -530.6545020320789 with 72 steps, done\n",
      "Run episode 337 with rewards -110.80071445886843 with 81 steps, done\n",
      "Run episode 338 with rewards -712.036186807748 with 131 steps, done\n",
      "Run episode 339 with rewards -785.4197842436055 with 110 steps, done\n",
      "Run episode 340 with rewards -486.30305000112287 with 61 steps, done\n",
      "Run episode 341 with rewards -186.05709127100184 with 71 steps, done\n",
      "Run episode 342 with rewards -633.9069229023593 with 67 steps, done\n",
      "Run episode 343 with rewards -165.53601977768125 with 76 steps, done\n",
      "Run episode 344 with rewards -106.91285437156291 with 63 steps, done\n",
      "Run episode 345 with rewards -155.4075158902171 with 75 steps, done\n",
      "Run episode 346 with rewards -186.29929724561993 with 110 steps, done\n",
      "Run episode 347 with rewards -97.58770017739943 with 57 steps, done\n",
      "Run episode 348 with rewards -360.63224619200497 with 87 steps, done\n",
      "Run episode 349 with rewards -125.92823626555153 with 75 steps, done\n",
      "Run episode 350 with rewards -83.2501973842979 with 143 steps, done\n",
      "Run episode 351 with rewards -448.686975208777 with 82 steps, done\n",
      "Run episode 352 with rewards -564.1790666120928 with 85 steps, done\n",
      "Run episode 353 with rewards -124.11427324172465 with 75 steps, done\n",
      "Run episode 354 with rewards -141.7551703760679 with 73 steps, done\n",
      "Run episode 355 with rewards -83.4398588120923 with 66 steps, done\n",
      "Run episode 356 with rewards -112.72123932356791 with 56 steps, done\n",
      "Run episode 357 with rewards -101.93554297885605 with 139 steps, done\n",
      "Run episode 358 with rewards -272.4471148288965 with 104 steps, done\n",
      "Run episode 359 with rewards -303.79565911968393 with 105 steps, done\n",
      "Run episode 360 with rewards -226.59771570483753 with 76 steps, done\n",
      "Run episode 361 with rewards -532.7206627894088 with 56 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 362 with rewards -396.46484413560773 with 47 steps, done\n",
      "Run episode 363 with rewards -582.6944902380794 with 101 steps, done\n",
      "Run episode 364 with rewards -518.1246071919168 with 65 steps, done\n",
      "Run episode 365 with rewards 10.35136798463796 with 66 steps, done\n",
      "Run episode 366 with rewards -150.3999694001938 with 73 steps, done\n",
      "Run episode 367 with rewards -185.88968606032182 with 99 steps, done\n",
      "Run episode 368 with rewards -146.96504655150636 with 85 steps, done\n",
      "Run episode 369 with rewards -68.45123291311444 with 80 steps, done\n",
      "Run episode 370 with rewards -467.61107730781674 with 197 steps, done\n",
      "Run episode 371 with rewards -623.0568990433213 with 81 steps, done\n",
      "Run episode 372 with rewards -278.0336625026647 with 74 steps, done\n",
      "Run episode 373 with rewards -621.3479234315759 with 81 steps, done\n",
      "Run episode 374 with rewards -123.83295242202703 with 87 steps, done\n",
      "Run episode 375 with rewards -1170.1733310023558 with 163 steps, done\n",
      "Run episode 376 with rewards -136.83985112375854 with 52 steps, done\n",
      "Run episode 377 with rewards -204.6549780212738 with 120 steps, done\n",
      "Run episode 378 with rewards -110.280845330461 with 64 steps, done\n",
      "Run episode 379 with rewards -463.7332953799868 with 53 steps, done\n",
      "Run episode 380 with rewards -532.9630135243297 with 81 steps, done\n",
      "Run episode 381 with rewards -706.0459305122903 with 73 steps, done\n",
      "Run episode 382 with rewards -302.29329208616775 with 66 steps, done\n",
      "Run episode 383 with rewards -483.4462336440605 with 72 steps, done\n",
      "Run episode 384 with rewards -506.12501027969967 with 74 steps, done\n",
      "Run episode 385 with rewards -348.28602904452464 with 51 steps, done\n",
      "Run episode 386 with rewards -771.9218076439018 with 81 steps, done\n",
      "Run episode 387 with rewards -706.8850191173852 with 77 steps, done\n",
      "Run episode 388 with rewards -521.6461095025275 with 66 steps, done\n",
      "Run episode 389 with rewards -481.5976484076685 with 54 steps, done\n",
      "Run episode 390 with rewards -578.2513591649774 with 91 steps, done\n",
      "Run episode 391 with rewards -740.7335382651751 with 77 steps, done\n",
      "Run episode 392 with rewards -539.8319545730327 with 72 steps, done\n",
      "Run episode 393 with rewards -526.5110558439319 with 61 steps, done\n",
      "Run episode 394 with rewards -560.1640086635656 with 90 steps, done\n",
      "Run episode 395 with rewards -416.292186795172 with 56 steps, done\n",
      "Run episode 396 with rewards -141.00139653525537 with 60 steps, done\n",
      "Run episode 397 with rewards -256.0258050489475 with 78 steps, done\n",
      "Run episode 398 with rewards -414.23125513852096 with 82 steps, done\n",
      "Run episode 399 with rewards -142.70688630337355 with 54 steps, done\n",
      "Run episode 400 with rewards -443.40548884947736 with 133 steps, done\n",
      "Run episode 401 with rewards -158.3913099742667 with 74 steps, done\n",
      "Run episode 402 with rewards -406.02408920882834 with 90 steps, done\n",
      "Run episode 403 with rewards -147.24233522247428 with 81 steps, done\n",
      "Run episode 404 with rewards -49.527488294766684 with 60 steps, done\n",
      "Run episode 405 with rewards -143.56523123813946 with 77 steps, done\n",
      "Run episode 406 with rewards -253.04943015644557 with 104 steps, done\n",
      "Run episode 407 with rewards -122.56076835311316 with 86 steps, done\n",
      "Run episode 408 with rewards -175.22759136507958 with 76 steps, done\n",
      "Run episode 409 with rewards -307.36216061947226 with 139 steps, done\n",
      "Run episode 410 with rewards -31.29178832334543 with 90 steps, done\n",
      "Run episode 411 with rewards -748.7253922388923 with 119 steps, done\n",
      "Run episode 412 with rewards -102.67921176726591 with 85 steps, done\n",
      "Run episode 413 with rewards -6456.823208070876 with 511 steps, done\n",
      "Run episode 414 with rewards -123.59756474688146 with 60 steps, done\n",
      "Run episode 415 with rewards -601.9702254170137 with 117 steps, done\n",
      "Run episode 416 with rewards -156.22102137641434 with 71 steps, done\n",
      "Run episode 417 with rewards -529.3147628500748 with 105 steps, done\n",
      "Run episode 418 with rewards -146.27069619612087 with 77 steps, done\n",
      "Run episode 419 with rewards -390.87888892358865 with 79 steps, done\n",
      "Run episode 420 with rewards -98.71684516704029 with 99 steps, done\n",
      "Run episode 421 with rewards -911.4801674822085 with 133 steps, done\n",
      "Run episode 422 with rewards -278.50726008704817 with 83 steps, done\n",
      "Run episode 423 with rewards -703.0548053381766 with 99 steps, done\n",
      "Run episode 424 with rewards -140.64111761235327 with 53 steps, done\n",
      "Run episode 425 with rewards -727.5945169622628 with 93 steps, done\n",
      "Run episode 426 with rewards -112.75006480494291 with 61 steps, done\n",
      "Run episode 427 with rewards -584.418886987092 with 103 steps, done\n",
      "Run episode 428 with rewards -117.45082088251822 with 53 steps, done\n",
      "Run episode 429 with rewards -1814.5634917379195 with 243 steps, done\n",
      "Run episode 430 with rewards -193.08799609342142 with 80 steps, done\n",
      "Run episode 431 with rewards -539.4374094561961 with 103 steps, done\n",
      "Run episode 432 with rewards -596.7793299261104 with 73 steps, done\n",
      "Run episode 433 with rewards -400.20766899552774 with 66 steps, done\n",
      "Run episode 434 with rewards -1039.8410624082817 with 112 steps, done\n",
      "Run episode 435 with rewards -405.18893380503687 with 77 steps, done\n",
      "Run episode 436 with rewards -860.7953226521994 with 80 steps, done\n",
      "Run episode 437 with rewards -536.3987068378405 with 78 steps, done\n",
      "Run episode 438 with rewards -446.1093427018557 with 52 steps, done\n",
      "Run episode 439 with rewards -235.8368630192767 with 118 steps, done\n",
      "Run episode 440 with rewards -853.8459856119299 with 87 steps, done\n",
      "Run episode 441 with rewards -207.25038797166147 with 89 steps, done\n",
      "Run episode 442 with rewards -552.554317766888 with 72 steps, done\n",
      "Run episode 443 with rewards -153.55090494622397 with 75 steps, done\n",
      "Run episode 444 with rewards -375.55860105415974 with 50 steps, done\n",
      "Run episode 445 with rewards -1477.6828563558486 with 185 steps, done\n",
      "Run episode 446 with rewards -169.0550357523526 with 69 steps, done\n",
      "Run episode 447 with rewards -630.5785699033604 with 92 steps, done\n",
      "Run episode 448 with rewards -193.7706338988341 with 56 steps, done\n",
      "Run episode 449 with rewards -725.1677564671231 with 137 steps, done\n",
      "Run episode 450 with rewards -433.67772040955043 with 60 steps, done\n",
      "Run episode 451 with rewards -317.81919009131127 with 80 steps, done\n",
      "Run episode 452 with rewards -476.5888891460287 with 62 steps, done\n",
      "Run episode 453 with rewards -483.19026140498676 with 62 steps, done\n",
      "Run episode 454 with rewards -270.41095847407826 with 72 steps, done\n",
      "Run episode 455 with rewards -513.2661403095874 with 66 steps, done\n",
      "Run episode 456 with rewards -108.89280923178967 with 75 steps, done\n",
      "Run episode 457 with rewards -504.69996508414977 with 67 steps, done\n",
      "Run episode 458 with rewards -176.17630104151232 with 83 steps, done\n",
      "Run episode 459 with rewards -805.6015789208595 with 83 steps, done\n",
      "Run episode 460 with rewards -525.2546243190095 with 78 steps, done\n",
      "Run episode 461 with rewards -469.5920574227407 with 62 steps, done\n",
      "Run episode 462 with rewards -599.2503688298158 with 95 steps, done\n",
      "Run episode 463 with rewards -357.4645181372907 with 90 steps, done\n",
      "Run episode 464 with rewards -395.8579237177501 with 109 steps, done\n",
      "Run episode 465 with rewards -380.7321155697987 with 55 steps, done\n",
      "Run episode 466 with rewards -274.23065888513304 with 83 steps, done\n",
      "Run episode 467 with rewards -488.63848985315497 with 57 steps, done\n",
      "Run episode 468 with rewards -482.1701571621876 with 73 steps, done\n",
      "Run episode 469 with rewards -717.0750227808193 with 78 steps, done\n",
      "Run episode 470 with rewards -444.00206682801036 with 76 steps, done\n",
      "Run episode 471 with rewards -524.1950989607783 with 67 steps, done\n",
      "Run episode 472 with rewards -475.6653022930659 with 67 steps, done\n",
      "Run episode 473 with rewards -504.9784501375406 with 71 steps, done\n",
      "Run episode 474 with rewards -368.1467280897998 with 54 steps, done\n",
      "Run episode 475 with rewards -507.71305148447414 with 81 steps, done\n",
      "Run episode 476 with rewards -283.1847864469454 with 107 steps, done\n",
      "Run episode 477 with rewards -229.0527338652101 with 64 steps, done\n",
      "Run episode 478 with rewards -371.4495658438018 with 90 steps, done\n",
      "Run episode 479 with rewards -77.66893360980795 with 55 steps, done\n",
      "Run episode 480 with rewards -569.2018483435205 with 63 steps, done\n",
      "Run episode 481 with rewards -429.96984342249027 with 111 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 482 with rewards -394.7829688852658 with 59 steps, done\n",
      "Run episode 483 with rewards -790.0243409156483 with 197 steps, done\n",
      "Run episode 484 with rewards -104.61146017508386 with 91 steps, done\n",
      "Run episode 485 with rewards -94.98208509372378 with 110 steps, done\n",
      "Run episode 486 with rewards -204.66004393385776 with 74 steps, done\n",
      "Run episode 487 with rewards -87.71100966836885 with 81 steps, done\n",
      "Run episode 488 with rewards -637.2459149141263 with 113 steps, done\n",
      "Run episode 489 with rewards -487.7042073486832 with 56 steps, done\n",
      "Run episode 490 with rewards -373.07796792955105 with 105 steps, done\n",
      "Run episode 491 with rewards -176.90825638695827 with 92 steps, done\n",
      "Run episode 492 with rewards -530.4859511924419 with 66 steps, done\n",
      "Run episode 493 with rewards -527.8946294383223 with 58 steps, done\n",
      "Run episode 494 with rewards -632.8712948388516 with 81 steps, done\n",
      "Run episode 495 with rewards -257.53411433773647 with 76 steps, done\n",
      "Run episode 496 with rewards -747.1023541100465 with 101 steps, done\n",
      "Run episode 497 with rewards -727.4414037118155 with 73 steps, done\n",
      "Run episode 498 with rewards -474.3313302223061 with 100 steps, done\n",
      "Run episode 499 with rewards -764.9950724663274 with 75 steps, done\n",
      "Run episode 500 with rewards -384.7298385152653 with 95 steps, done\n",
      "Run episode 501 with rewards -566.5342204390943 with 76 steps, done\n",
      "Run episode 502 with rewards -244.04887057911708 with 84 steps, done\n",
      "Run episode 503 with rewards -554.7726181935344 with 79 steps, done\n",
      "Run episode 504 with rewards -197.1653301738778 with 82 steps, done\n",
      "Run episode 505 with rewards -634.5510172267434 with 86 steps, done\n",
      "Run episode 506 with rewards -423.1698594790831 with 51 steps, done\n",
      "Run episode 507 with rewards -706.4264054585964 with 85 steps, done\n",
      "Run episode 508 with rewards -757.3604936885381 with 84 steps, done\n",
      "Run episode 509 with rewards -628.988141222292 with 105 steps, done\n",
      "Run episode 510 with rewards -450.1983165716281 with 72 steps, done\n",
      "Run episode 511 with rewards -291.27031842286925 with 91 steps, done\n",
      "Run episode 512 with rewards -378.7808762593024 with 56 steps, done\n",
      "Run episode 513 with rewards -630.2104307324553 with 107 steps, done\n",
      "Run episode 514 with rewards -785.5481549799131 with 86 steps, done\n",
      "Run episode 515 with rewards -623.416175123133 with 113 steps, done\n",
      "Run episode 516 with rewards -398.28312657279594 with 56 steps, done\n",
      "Run episode 517 with rewards -509.7308364252441 with 96 steps, done\n",
      "Run episode 518 with rewards -139.148207958162 with 56 steps, done\n",
      "Run episode 519 with rewards -372.2307548190058 with 87 steps, done\n",
      "Run episode 520 with rewards -190.41637827935514 with 74 steps, done\n",
      "Run episode 521 with rewards -483.75581470828087 with 70 steps, done\n",
      "Run episode 522 with rewards -253.35616379130474 with 70 steps, done\n",
      "Run episode 523 with rewards -590.8745995413985 with 96 steps, done\n",
      "Run episode 524 with rewards -135.71743142765925 with 51 steps, done\n",
      "Run episode 525 with rewards -371.02097550928136 with 78 steps, done\n",
      "Run episode 526 with rewards -100.69184273180548 with 54 steps, done\n",
      "Run episode 527 with rewards -690.2606891381309 with 110 steps, done\n",
      "Run episode 528 with rewards -203.05317105114045 with 85 steps, done\n",
      "Run episode 529 with rewards -1043.106827364291 with 169 steps, done\n",
      "Run episode 530 with rewards -109.66445379877088 with 58 steps, done\n",
      "Run episode 531 with rewards -425.68781818888596 with 75 steps, done\n",
      "Run episode 532 with rewards -132.5374674460886 with 57 steps, done\n",
      "Run episode 533 with rewards -797.9698336458401 with 96 steps, done\n",
      "Run episode 534 with rewards -51.11259025231611 with 66 steps, done\n",
      "Run episode 535 with rewards -1051.1665684043664 with 138 steps, done\n",
      "Run episode 536 with rewards -120.36224811528564 with 87 steps, done\n",
      "Run episode 537 with rewards -227.52664564932365 with 81 steps, done\n",
      "Run episode 538 with rewards -225.38383926611453 with 116 steps, done\n",
      "Run episode 539 with rewards -471.26571584902126 with 71 steps, done\n",
      "Run episode 540 with rewards -815.1891151097577 with 82 steps, done\n",
      "Run episode 541 with rewards -477.3581207068428 with 62 steps, done\n",
      "Run episode 542 with rewards -376.7662273353539 with 52 steps, done\n",
      "Run episode 543 with rewards -462.57852350494574 with 59 steps, done\n",
      "Run episode 544 with rewards -68.9911249938066 with 84 steps, done\n",
      "Run episode 545 with rewards -520.759379482733 with 57 steps, done\n",
      "Run episode 546 with rewards -854.8398493587905 with 83 steps, done\n",
      "Run episode 547 with rewards -690.4162932473482 with 78 steps, done\n",
      "Run episode 548 with rewards -455.6921007316906 with 87 steps, done\n",
      "Run episode 549 with rewards -467.1156590753953 with 61 steps, done\n",
      "Run episode 550 with rewards -360.60204875745075 with 65 steps, done\n",
      "Run episode 551 with rewards -121.65095461672398 with 55 steps, done\n",
      "Run episode 552 with rewards -975.8328407877417 with 85 steps, done\n",
      "Run episode 553 with rewards -159.98733556927368 with 84 steps, done\n",
      "Run episode 554 with rewards -683.9452756910288 with 79 steps, done\n",
      "Run episode 555 with rewards -304.8209253663706 with 81 steps, done\n",
      "Run episode 556 with rewards -484.7279193297893 with 64 steps, done\n",
      "Run episode 557 with rewards -601.6736680862707 with 78 steps, done\n",
      "Run episode 558 with rewards -208.3346397803623 with 87 steps, done\n",
      "Run episode 559 with rewards -130.49394455534937 with 53 steps, done\n",
      "Run episode 560 with rewards -356.67453089047405 with 102 steps, done\n",
      "Run episode 561 with rewards -201.46391819983447 with 68 steps, done\n",
      "Run episode 562 with rewards -498.7847690772178 with 73 steps, done\n",
      "Run episode 563 with rewards -311.62938096353514 with 83 steps, done\n",
      "Run episode 564 with rewards -375.82545452310757 with 54 steps, done\n",
      "Run episode 565 with rewards -537.6644446166188 with 84 steps, done\n",
      "Run episode 566 with rewards -645.617802092681 with 82 steps, done\n",
      "Run episode 567 with rewards -428.94673909782114 with 77 steps, done\n",
      "Run episode 568 with rewards 14.772529651832372 with 75 steps, done\n",
      "Run episode 569 with rewards -131.94040589319357 with 58 steps, done\n",
      "Run episode 570 with rewards -233.6166932499659 with 127 steps, done\n",
      "Run episode 571 with rewards -177.02323927233294 with 85 steps, done\n",
      "Run episode 572 with rewards -163.4213808941129 with 59 steps, done\n",
      "Run episode 573 with rewards -130.5323815266327 with 90 steps, done\n",
      "Run episode 574 with rewards -632.9510488010607 with 72 steps, done\n",
      "Run episode 575 with rewards -456.49796127959894 with 63 steps, done\n",
      "Run episode 576 with rewards -439.2717450788253 with 57 steps, done\n",
      "Run episode 577 with rewards -401.9933692550842 with 103 steps, done\n",
      "Run episode 578 with rewards -1197.6692036054806 with 188 steps, done\n",
      "Run episode 579 with rewards -1101.3012984405984 with 159 steps, done\n",
      "Run episode 580 with rewards -98.49171561293585 with 58 steps, done\n",
      "Run episode 581 with rewards -1028.802980626379 with 182 steps, done\n",
      "Run episode 582 with rewards -143.8847248158358 with 52 steps, done\n",
      "Run episode 583 with rewards -788.5578633489107 with 147 steps, done\n",
      "Run episode 584 with rewards -169.3092182078043 with 68 steps, done\n",
      "Run episode 585 with rewards -508.0449925447333 with 76 steps, done\n",
      "Run episode 586 with rewards -200.28138045296356 with 86 steps, done\n",
      "Run episode 587 with rewards -433.63246120065554 with 78 steps, done\n",
      "Run episode 588 with rewards -212.93208525446147 with 82 steps, done\n",
      "Run episode 589 with rewards -524.717272674046 with 89 steps, done\n",
      "Run episode 590 with rewards -152.46924935546653 with 61 steps, done\n",
      "Run episode 591 with rewards -608.8699444791907 with 121 steps, done\n",
      "Run episode 592 with rewards -166.49488340930787 with 74 steps, done\n",
      "Run episode 593 with rewards -623.2306321355024 with 195 steps, done\n",
      "Run episode 594 with rewards -137.24123398058646 with 68 steps, done\n",
      "Run episode 595 with rewards -211.97979325388184 with 95 steps, done\n",
      "Run episode 596 with rewards -280.3221609149858 with 65 steps, done\n",
      "Run episode 597 with rewards -516.4863144061317 with 69 steps, done\n",
      "Run episode 598 with rewards -482.8686266797856 with 88 steps, done\n",
      "Run episode 599 with rewards -136.4503740906265 with 56 steps, done\n",
      "Run episode 600 with rewards -519.0267250186516 with 81 steps, done\n",
      "Run episode 601 with rewards -153.4068766423386 with 50 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 602 with rewards -695.2000671651831 with 90 steps, done\n",
      "Run episode 603 with rewards -196.1447293145871 with 84 steps, done\n",
      "Run episode 604 with rewards -535.4157109485172 with 84 steps, done\n",
      "Run episode 605 with rewards -188.82440316049255 with 72 steps, done\n",
      "Run episode 606 with rewards -536.1747597830032 with 88 steps, done\n",
      "Run episode 607 with rewards -185.42380037721972 with 71 steps, done\n",
      "Run episode 608 with rewards -735.475360960094 with 138 steps, done\n",
      "Run episode 609 with rewards -141.55562289958334 with 56 steps, done\n",
      "Run episode 610 with rewards -468.63091236704867 with 57 steps, done\n",
      "Run episode 611 with rewards -491.88016035395447 with 112 steps, done\n",
      "Run episode 612 with rewards -692.5027868392554 with 78 steps, done\n",
      "Run episode 613 with rewards -617.3777476118229 with 93 steps, done\n",
      "Run episode 614 with rewards -392.8069746678686 with 55 steps, done\n",
      "Run episode 615 with rewards -636.3005717605253 with 95 steps, done\n",
      "Run episode 616 with rewards -692.1411914222128 with 76 steps, done\n",
      "Run episode 617 with rewards -409.2185081068448 with 64 steps, done\n",
      "Run episode 618 with rewards -436.33944861003846 with 58 steps, done\n",
      "Run episode 619 with rewards -685.8625340407442 with 104 steps, done\n",
      "Run episode 620 with rewards -112.71369469437346 with 88 steps, done\n",
      "Run episode 621 with rewards -65.79516572014195 with 85 steps, done\n",
      "Run episode 622 with rewards -540.4507485592769 with 86 steps, done\n",
      "Run episode 623 with rewards -126.33541806706103 with 62 steps, done\n",
      "Run episode 624 with rewards -806.4607343516873 with 96 steps, done\n",
      "Run episode 625 with rewards -511.27299325601314 with 94 steps, done\n",
      "Run episode 626 with rewards -188.9500378786823 with 127 steps, done\n",
      "Run episode 627 with rewards -148.98020169073146 with 88 steps, done\n",
      "Run episode 628 with rewards -110.3800141560425 with 117 steps, done\n",
      "Run episode 629 with rewards -160.03281422336983 with 58 steps, done\n",
      "Run episode 630 with rewards -429.57335958936517 with 97 steps, done\n",
      "Run episode 631 with rewards -399.5857152168942 with 57 steps, done\n",
      "Run episode 632 with rewards -661.4627506956073 with 76 steps, done\n",
      "Run episode 633 with rewards -477.41167565165944 with 56 steps, done\n",
      "Run episode 634 with rewards -481.5244007818919 with 76 steps, done\n",
      "Run episode 635 with rewards -440.0509384014417 with 59 steps, done\n",
      "Run episode 636 with rewards -571.8092251571825 with 102 steps, done\n",
      "Run episode 637 with rewards -469.90322485336344 with 56 steps, done\n",
      "Run episode 638 with rewards -581.341212073032 with 105 steps, done\n",
      "Run episode 639 with rewards -281.2648323282416 with 86 steps, done\n",
      "Run episode 640 with rewards -610.7185974855217 with 109 steps, done\n",
      "Run episode 641 with rewards -140.15935972723193 with 59 steps, done\n",
      "Run episode 642 with rewards -459.03446694153473 with 73 steps, done\n",
      "Run episode 643 with rewards -117.08264903456936 with 82 steps, done\n",
      "Run episode 644 with rewards -515.0846953663989 with 90 steps, done\n",
      "Run episode 645 with rewards -380.06807141250476 with 52 steps, done\n",
      "Run episode 646 with rewards -510.99195903185745 with 106 steps, done\n",
      "Run episode 647 with rewards -455.05908094539024 with 59 steps, done\n",
      "Run episode 648 with rewards -585.4981992202145 with 81 steps, done\n",
      "Run episode 649 with rewards -205.28565902089144 with 62 steps, done\n",
      "Run episode 650 with rewards -611.2430556354429 with 117 steps, done\n",
      "Run episode 651 with rewards -455.1511640365037 with 67 steps, done\n",
      "Run episode 652 with rewards 9.56119589183065 with 85 steps, done\n",
      "Run episode 653 with rewards -592.6236863424162 with 63 steps, done\n",
      "Run episode 654 with rewards -109.91130375197042 with 61 steps, done\n",
      "Run episode 655 with rewards -703.96379541477 with 76 steps, done\n",
      "Run episode 656 with rewards -216.59060619507358 with 58 steps, done\n",
      "Run episode 657 with rewards -743.8211576287734 with 129 steps, done\n",
      "Run episode 658 with rewards -244.75043588530693 with 85 steps, done\n",
      "Run episode 659 with rewards -800.6377975873575 with 127 steps, done\n",
      "Run episode 660 with rewards -736.4623875944263 with 79 steps, done\n",
      "Run episode 661 with rewards -561.9840313556415 with 79 steps, done\n",
      "Run episode 662 with rewards -167.88497709428157 with 65 steps, done\n",
      "Run episode 663 with rewards -963.2922712533358 with 123 steps, done\n",
      "Run episode 664 with rewards -129.89551541870694 with 62 steps, done\n",
      "Run episode 665 with rewards -637.7830638897005 with 75 steps, done\n",
      "Run episode 666 with rewards -150.41204970405863 with 61 steps, done\n",
      "Run episode 667 with rewards -416.3848925740013 with 76 steps, done\n",
      "Run episode 668 with rewards -128.51406248589535 with 62 steps, done\n",
      "Run episode 669 with rewards -990.4754379979478 with 134 steps, done\n",
      "Run episode 670 with rewards -124.16933607230501 with 55 steps, done\n",
      "Run episode 671 with rewards -636.1041672486928 with 95 steps, done\n",
      "Run episode 672 with rewards -216.4459042179244 with 82 steps, done\n",
      "Run episode 673 with rewards -993.9703426829022 with 124 steps, done\n",
      "Run episode 674 with rewards -638.9671545544941 with 73 steps, done\n",
      "Run episode 675 with rewards -577.0644658194592 with 78 steps, done\n",
      "Run episode 676 with rewards -151.83300372476862 with 71 steps, done\n",
      "Run episode 677 with rewards -548.5104758046795 with 89 steps, done\n",
      "Run episode 678 with rewards -119.50258700388869 with 58 steps, done\n",
      "Run episode 679 with rewards -146.70333299468112 with 74 steps, done\n",
      "Run episode 680 with rewards -566.995150758612 with 74 steps, done\n",
      "Run episode 681 with rewards -369.1804200727523 with 55 steps, done\n",
      "Run episode 682 with rewards -853.0901762107687 with 78 steps, done\n",
      "Run episode 683 with rewards -325.7449769234441 with 92 steps, done\n",
      "Run episode 684 with rewards -603.9474378323015 with 98 steps, done\n",
      "Run episode 685 with rewards -356.58334631538526 with 101 steps, done\n",
      "Run episode 686 with rewards -668.8021092334409 with 106 steps, done\n",
      "Run episode 687 with rewards -386.7043965198172 with 73 steps, done\n",
      "Run episode 688 with rewards -819.3219976641749 with 114 steps, done\n",
      "Run episode 689 with rewards -123.71311873297776 with 68 steps, done\n",
      "Run episode 690 with rewards -441.2789361719204 with 78 steps, done\n",
      "Run episode 691 with rewards -127.43604100389258 with 67 steps, done\n",
      "Run episode 692 with rewards -473.59316423288107 with 91 steps, done\n",
      "Run episode 693 with rewards -134.23053460959295 with 54 steps, done\n",
      "Run episode 694 with rewards -633.0090240750361 with 76 steps, done\n",
      "Run episode 695 with rewards -141.41816062672544 with 74 steps, done\n",
      "Run episode 696 with rewards -1073.7533142855268 with 88 steps, done\n",
      "Run episode 697 with rewards -472.7382894813613 with 93 steps, done\n",
      "Run episode 698 with rewards -499.76846442270124 with 66 steps, done\n",
      "Run episode 699 with rewards -2288.4688855997874 with 291 steps, done\n",
      "Run episode 700 with rewards -336.5013568470848 with 78 steps, done\n",
      "Run episode 701 with rewards -2460.0476303085143 with 257 steps, done\n",
      "Run episode 702 with rewards -330.2702392827353 with 78 steps, done\n",
      "Run episode 703 with rewards -1216.1103608738545 with 184 steps, done\n",
      "Run episode 704 with rewards -387.5057632287115 with 79 steps, done\n",
      "Run episode 705 with rewards -937.2925533484008 with 139 steps, done\n",
      "Run episode 706 with rewards -136.2196885230475 with 79 steps, done\n",
      "Run episode 707 with rewards -1658.9050435877425 with 190 steps, done\n",
      "Run episode 708 with rewards -106.5441129787587 with 53 steps, done\n",
      "Run episode 709 with rewards -864.3915687825815 with 130 steps, done\n",
      "Run episode 710 with rewards -148.480741901979 with 89 steps, done\n",
      "Run episode 711 with rewards -413.0881907380885 with 75 steps, done\n",
      "Run episode 712 with rewards -262.44920327210326 with 70 steps, done\n",
      "Run episode 713 with rewards -675.7930673006688 with 77 steps, done\n",
      "Run episode 714 with rewards -231.0884049607538 with 59 steps, done\n",
      "Run episode 715 with rewards -132.8129212522281 with 53 steps, done\n",
      "Run episode 716 with rewards -413.6414727187554 with 51 steps, done\n",
      "Run episode 717 with rewards -341.4040364148998 with 75 steps, done\n",
      "Run episode 718 with rewards -771.7253817254295 with 81 steps, done\n",
      "Run episode 719 with rewards -20.9157098574197 with 74 steps, done\n",
      "Run episode 720 with rewards -376.1041808263914 with 47 steps, done\n",
      "Run episode 721 with rewards -136.87267367593668 with 89 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 722 with rewards -463.5300037517736 with 58 steps, done\n",
      "Run episode 723 with rewards -525.7166490890288 with 120 steps, done\n",
      "Run episode 724 with rewards -570.5467919486616 with 62 steps, done\n",
      "Run episode 725 with rewards -1477.9694822887502 with 212 steps, done\n",
      "Run episode 726 with rewards -169.968867326637 with 66 steps, done\n",
      "Run episode 727 with rewards -602.5806197037082 with 88 steps, done\n",
      "Run episode 728 with rewards -140.96809014376197 with 83 steps, done\n",
      "Run episode 729 with rewards -731.3675226532807 with 116 steps, done\n",
      "Run episode 730 with rewards -155.90399171237314 with 81 steps, done\n",
      "Run episode 731 with rewards -5.628294884086529 with 97 steps, done\n",
      "Run episode 732 with rewards -1716.7784914417632 with 223 steps, done\n",
      "Run episode 733 with rewards -853.0238126042299 with 83 steps, done\n",
      "Run episode 734 with rewards -482.3705111835198 with 60 steps, done\n",
      "Run episode 735 with rewards -586.3841617905578 with 89 steps, done\n",
      "Run episode 736 with rewards -542.9819418948537 with 64 steps, done\n",
      "Run episode 737 with rewards -539.170621702851 with 81 steps, done\n",
      "Run episode 738 with rewards -570.12403654634 with 62 steps, done\n",
      "Run episode 739 with rewards -353.26177098874564 with 83 steps, done\n",
      "Run episode 740 with rewards -443.25122965198045 with 77 steps, done\n",
      "Run episode 741 with rewards -428.0824638199142 with 78 steps, done\n",
      "Run episode 742 with rewards -480.03864544554 with 55 steps, done\n",
      "Run episode 743 with rewards -570.6050046994942 with 79 steps, done\n",
      "Run episode 744 with rewards -148.71824627736783 with 65 steps, done\n",
      "Run episode 745 with rewards -1875.5418845877462 with 223 steps, done\n",
      "Run episode 746 with rewards -144.21985710429718 with 83 steps, done\n",
      "Run episode 747 with rewards -432.19958767856 with 78 steps, done\n",
      "Run episode 748 with rewards -178.29465892069584 with 73 steps, done\n",
      "Run episode 749 with rewards -920.6304280518074 with 150 steps, done\n",
      "Run episode 750 with rewards -566.7223257184935 with 62 steps, done\n",
      "Run episode 751 with rewards -477.1975367706471 with 61 steps, done\n",
      "Run episode 752 with rewards -343.88660083548825 with 90 steps, done\n",
      "Run episode 753 with rewards -634.3296805508323 with 104 steps, done\n",
      "Run episode 754 with rewards -168.6038014328927 with 67 steps, done\n",
      "Run episode 755 with rewards -80.04663975452462 with 83 steps, done\n",
      "Run episode 756 with rewards -169.4840285948066 with 102 steps, done\n",
      "Run episode 757 with rewards -686.6755740859701 with 79 steps, done\n",
      "Run episode 758 with rewards -547.3872776397257 with 145 steps, done\n",
      "Run episode 759 with rewards -447.31931562307955 with 55 steps, done\n",
      "Run episode 760 with rewards -1577.2356561403687 with 231 steps, done\n",
      "Run episode 761 with rewards -642.751698981043 with 67 steps, done\n",
      "Run episode 762 with rewards -1243.9669471489042 with 163 steps, done\n",
      "Run episode 763 with rewards -163.17866877366006 with 79 steps, done\n",
      "Run episode 764 with rewards -468.564325762347 with 79 steps, done\n",
      "Run episode 765 with rewards -201.62986761806556 with 86 steps, done\n",
      "Run episode 766 with rewards -658.0144965873616 with 111 steps, done\n",
      "Run episode 767 with rewards -387.7389541021909 with 63 steps, done\n",
      "Run episode 768 with rewards -158.17547644205268 with 55 steps, done\n",
      "Run episode 769 with rewards -144.10049019636938 with 61 steps, done\n",
      "Run episode 770 with rewards -150.90744269757084 with 74 steps, done\n",
      "Run episode 771 with rewards -398.1996964292261 with 107 steps, done\n",
      "Run episode 772 with rewards -94.22636791740354 with 85 steps, done\n",
      "Run episode 773 with rewards -77.206331698752 with 62 steps, done\n",
      "Run episode 774 with rewards -248.14354176074715 with 140 steps, done\n",
      "Run episode 775 with rewards -755.1299648920375 with 85 steps, done\n",
      "Run episode 776 with rewards -952.8847568468603 with 144 steps, done\n",
      "Run episode 777 with rewards -558.7821318566043 with 63 steps, done\n",
      "Run episode 778 with rewards -580.7602094566965 with 81 steps, done\n",
      "Run episode 779 with rewards -110.26171752779136 with 56 steps, done\n",
      "Run episode 780 with rewards -5333.272310754525 with 437 steps, done\n",
      "Run episode 781 with rewards -102.49882867132654 with 58 steps, done\n",
      "Run episode 782 with rewards -528.9822256535065 with 79 steps, done\n",
      "Run episode 783 with rewards -242.2946500550245 with 79 steps, done\n",
      "Run episode 784 with rewards -1218.7051985386902 with 192 steps, done\n",
      "Run episode 785 with rewards -343.1012307769539 with 54 steps, done\n",
      "Run episode 786 with rewards -9.12241166792451 with 102 steps, done\n",
      "Run episode 787 with rewards -507.61019496854396 with 59 steps, done\n",
      "Run episode 788 with rewards -384.9589545613588 with 115 steps, done\n",
      "Run episode 789 with rewards -432.3017859598601 with 57 steps, done\n",
      "Run episode 790 with rewards -451.9734347923025 with 80 steps, done\n",
      "Run episode 791 with rewards -499.2501039296028 with 63 steps, done\n",
      "Run episode 792 with rewards -528.1978255030504 with 88 steps, done\n",
      "Run episode 793 with rewards -137.60549579670862 with 56 steps, done\n",
      "Run episode 794 with rewards -891.0476557082528 with 136 steps, done\n",
      "Run episode 795 with rewards -402.67275085383403 with 56 steps, done\n",
      "Run episode 796 with rewards -523.8804804240145 with 84 steps, done\n",
      "Run episode 797 with rewards -409.31564574833584 with 56 steps, done\n",
      "Run episode 798 with rewards -618.5198991107261 with 75 steps, done\n",
      "Run episode 799 with rewards -135.04642832508577 with 78 steps, done\n",
      "Run episode 800 with rewards -726.6106621708042 with 97 steps, done\n",
      "Run episode 801 with rewards -318.034508804758 with 85 steps, done\n",
      "Run episode 802 with rewards -519.7586287868958 with 79 steps, done\n",
      "Run episode 803 with rewards -145.80652823108096 with 53 steps, done\n",
      "Run episode 804 with rewards -603.4428318162629 with 79 steps, done\n",
      "Run episode 805 with rewards -211.61960567149637 with 69 steps, done\n",
      "Run episode 806 with rewards -522.4034171871654 with 101 steps, done\n",
      "Run episode 807 with rewards -665.2848350810781 with 86 steps, done\n",
      "Run episode 808 with rewards -394.74309606251643 with 52 steps, done\n",
      "Run episode 809 with rewards -781.7842706908077 with 128 steps, done\n",
      "Run episode 810 with rewards -131.2495355413974 with 80 steps, done\n",
      "Run episode 811 with rewards -2077.602796807363 with 285 steps, done\n",
      "Run episode 812 with rewards -132.8072714905722 with 75 steps, done\n",
      "Run episode 813 with rewards -465.945336679633 with 86 steps, done\n",
      "Run episode 814 with rewards -156.97186367359552 with 76 steps, done\n",
      "Run episode 815 with rewards -723.2974804705107 with 99 steps, done\n",
      "Run episode 816 with rewards -406.58816437825885 with 56 steps, done\n",
      "Run episode 817 with rewards -333.18939086420346 with 49 steps, done\n",
      "Run episode 818 with rewards -743.1195362593379 with 116 steps, done\n",
      "Run episode 819 with rewards -835.8346468482864 with 78 steps, done\n",
      "Run episode 820 with rewards -233.23106272026655 with 75 steps, done\n",
      "Run episode 821 with rewards -609.6790503718446 with 90 steps, done\n",
      "Run episode 822 with rewards -571.8118764124049 with 70 steps, done\n",
      "Run episode 823 with rewards -411.6667225814271 with 57 steps, done\n",
      "Run episode 824 with rewards -617.0776720464922 with 93 steps, done\n",
      "Run episode 825 with rewards -428.355881562989 with 55 steps, done\n",
      "Run episode 826 with rewards -89.46523130795852 with 68 steps, done\n",
      "Run episode 827 with rewards -740.3691452491757 with 104 steps, done\n",
      "Run episode 828 with rewards -32.454714662239425 with 94 steps, done\n",
      "Run episode 829 with rewards -694.9140025424855 with 104 steps, done\n",
      "Run episode 830 with rewards -687.092130152119 with 70 steps, done\n",
      "Run episode 831 with rewards -767.0152107215598 with 158 steps, done\n",
      "Run episode 832 with rewards -775.3352742488693 with 82 steps, done\n",
      "Run episode 833 with rewards -430.7504802800663 with 65 steps, done\n",
      "Run episode 834 with rewards -451.1416781983076 with 89 steps, done\n",
      "Run episode 835 with rewards -652.9417525149331 with 83 steps, done\n",
      "Run episode 836 with rewards -552.9048584760965 with 62 steps, done\n",
      "Run episode 837 with rewards -275.7242876577047 with 86 steps, done\n",
      "Run episode 838 with rewards -520.5536949772342 with 63 steps, done\n",
      "Run episode 839 with rewards -275.08870881096846 with 82 steps, done\n",
      "Run episode 840 with rewards -503.85962856861374 with 58 steps, done\n",
      "Run episode 841 with rewards -559.969079762988 with 76 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 842 with rewards -465.42757803051296 with 57 steps, done\n",
      "Run episode 843 with rewards -609.7321088568456 with 79 steps, done\n",
      "Run episode 844 with rewards -748.7790444561901 with 85 steps, done\n",
      "Run episode 845 with rewards -462.95320268879885 with 62 steps, done\n",
      "Run episode 846 with rewards -407.5306089691316 with 53 steps, done\n",
      "Run episode 847 with rewards -615.806574167445 with 92 steps, done\n",
      "Run episode 848 with rewards -451.5538911949379 with 60 steps, done\n",
      "Run episode 849 with rewards -523.0911976884368 with 97 steps, done\n",
      "Run episode 850 with rewards -2012.3502850172472 with 225 steps, done\n",
      "Run episode 851 with rewards -115.49741647966428 with 83 steps, done\n",
      "Run episode 852 with rewards -690.0068804516227 with 88 steps, done\n",
      "Run episode 853 with rewards -117.78427961237702 with 74 steps, done\n",
      "Run episode 854 with rewards -438.0771258522531 with 53 steps, done\n",
      "Run episode 855 with rewards -623.349718312904 with 84 steps, done\n",
      "Run episode 856 with rewards -215.16870833563868 with 68 steps, done\n",
      "Run episode 857 with rewards -1011.0363372318598 with 149 steps, done\n",
      "Run episode 858 with rewards -217.5309931914128 with 122 steps, done\n",
      "Run episode 859 with rewards -163.43426309745593 with 82 steps, done\n",
      "Run episode 860 with rewards -623.1786928382418 with 70 steps, done\n",
      "Run episode 861 with rewards -249.1655555457631 with 58 steps, done\n",
      "Run episode 862 with rewards -441.489455335523 with 61 steps, done\n",
      "Run episode 863 with rewards -214.94878817395116 with 98 steps, done\n",
      "Run episode 864 with rewards -456.92317518607905 with 88 steps, done\n",
      "Run episode 865 with rewards -139.80981391948285 with 60 steps, done\n",
      "Run episode 866 with rewards -342.1237334723919 with 62 steps, done\n",
      "Run episode 867 with rewards -495.3164257980482 with 57 steps, done\n",
      "Run episode 868 with rewards -397.7674613441054 with 63 steps, done\n",
      "Run episode 869 with rewards -902.8907005432338 with 83 steps, done\n",
      "Run episode 870 with rewards -201.80227444737017 with 74 steps, done\n",
      "Run episode 871 with rewards -340.48642293148 with 52 steps, done\n",
      "Run episode 872 with rewards -462.10331222017095 with 84 steps, done\n",
      "Run episode 873 with rewards -425.3085957130939 with 50 steps, done\n",
      "Run episode 874 with rewards -636.7116679112779 with 63 steps, done\n",
      "Run episode 875 with rewards -386.63906466316973 with 69 steps, done\n",
      "Run episode 876 with rewards -723.4259890077112 with 105 steps, done\n",
      "Run episode 877 with rewards -373.1121009795411 with 55 steps, done\n",
      "Run episode 878 with rewards -220.45878806836424 with 69 steps, done\n",
      "Run episode 879 with rewards -757.9627302131257 with 84 steps, done\n",
      "Run episode 880 with rewards -999.364614127944 with 178 steps, done\n",
      "Run episode 881 with rewards -133.95407477786063 with 62 steps, done\n",
      "Run episode 882 with rewards -504.873042663713 with 75 steps, done\n",
      "Run episode 883 with rewards -146.73921624987747 with 75 steps, done\n",
      "Run episode 884 with rewards -621.7000314234867 with 105 steps, done\n",
      "Run episode 885 with rewards -141.45677760819677 with 73 steps, done\n",
      "Run episode 886 with rewards -309.77721590097343 with 79 steps, done\n",
      "Run episode 887 with rewards -343.6361276373538 with 82 steps, done\n",
      "Run episode 888 with rewards -161.31293229113624 with 63 steps, done\n",
      "Run episode 889 with rewards -500.5621934729083 with 62 steps, done\n",
      "Run episode 890 with rewards -503.9991013966107 with 85 steps, done\n",
      "Run episode 891 with rewards -343.0250730039844 with 52 steps, done\n",
      "Run episode 892 with rewards -595.476771133568 with 64 steps, done\n",
      "Run episode 893 with rewards -592.0883608519542 with 70 steps, done\n",
      "Run episode 894 with rewards -703.1443049550298 with 82 steps, done\n",
      "Run episode 895 with rewards -254.4689166049413 with 96 steps, done\n",
      "Run episode 896 with rewards -189.06837008424344 with 87 steps, done\n",
      "Run episode 897 with rewards -542.7738478016856 with 65 steps, done\n",
      "Run episode 898 with rewards -433.3508246858563 with 79 steps, done\n",
      "Run episode 899 with rewards -336.1650475257737 with 78 steps, done\n",
      "Run episode 900 with rewards -615.0853910077324 with 63 steps, done\n",
      "Run episode 901 with rewards -163.04725180556176 with 88 steps, done\n",
      "Run episode 902 with rewards -822.6289831216337 with 139 steps, done\n",
      "Run episode 903 with rewards -116.82520386893154 with 77 steps, done\n",
      "Run episode 904 with rewards -640.6447650269708 with 85 steps, done\n",
      "Run episode 905 with rewards -945.0731286646358 with 85 steps, done\n",
      "Run episode 906 with rewards -581.4254306681593 with 99 steps, done\n",
      "Run episode 907 with rewards -765.1378620672222 with 88 steps, done\n",
      "Run episode 908 with rewards -620.9830102673978 with 75 steps, done\n",
      "Run episode 909 with rewards -159.3091219798378 with 78 steps, done\n",
      "Run episode 910 with rewards -380.36701567059026 with 96 steps, done\n",
      "Run episode 911 with rewards -552.209921936431 with 102 steps, done\n",
      "Run episode 912 with rewards -111.60454024723794 with 53 steps, done\n",
      "Run episode 913 with rewards -291.91010521899517 with 73 steps, done\n",
      "Run episode 914 with rewards -1059.8402560714853 with 178 steps, done\n",
      "Run episode 915 with rewards -523.9769804902191 with 71 steps, done\n",
      "Run episode 916 with rewards -2141.264950175145 with 247 steps, done\n",
      "Run episode 917 with rewards -733.2283994493686 with 73 steps, done\n",
      "Run episode 918 with rewards -631.5163638213274 with 78 steps, done\n",
      "Run episode 919 with rewards -162.77930534654718 with 57 steps, done\n",
      "Run episode 920 with rewards -593.4088382002419 with 74 steps, done\n",
      "Run episode 921 with rewards -203.48898565381177 with 66 steps, done\n",
      "Run episode 922 with rewards -1378.9725697495173 with 200 steps, done\n",
      "Run episode 923 with rewards -129.44917498675994 with 65 steps, done\n",
      "Run episode 924 with rewards -714.60602293362 with 192 steps, done\n",
      "Run episode 925 with rewards -214.92857768218315 with 88 steps, done\n",
      "Run episode 926 with rewards -294.8364549970118 with 75 steps, done\n",
      "Run episode 927 with rewards -609.3678927921743 with 63 steps, done\n",
      "Run episode 928 with rewards -589.837579378602 with 71 steps, done\n",
      "Run episode 929 with rewards -505.3980752148054 with 55 steps, done\n",
      "Run episode 930 with rewards -579.7478197499256 with 66 steps, done\n",
      "Run episode 931 with rewards -527.7607974707614 with 85 steps, done\n",
      "Run episode 932 with rewards -733.0041883575198 with 75 steps, done\n",
      "Run episode 933 with rewards -639.1514137216352 with 106 steps, done\n",
      "Run episode 934 with rewards -132.93332015696595 with 57 steps, done\n",
      "Run episode 935 with rewards -214.18951478907826 with 114 steps, done\n",
      "Run episode 936 with rewards -99.41206093530943 with 87 steps, done\n",
      "Run episode 937 with rewards -94.69660113249934 with 75 steps, done\n",
      "Run episode 938 with rewards -253.90820289384712 with 92 steps, done\n",
      "Run episode 939 with rewards -254.4359413247206 with 105 steps, done\n",
      "Run episode 940 with rewards -873.2389246826606 with 149 steps, done\n",
      "Run episode 941 with rewards -131.4017040993774 with 52 steps, done\n",
      "Run episode 942 with rewards -1072.8261416843752 with 170 steps, done\n",
      "Run episode 943 with rewards -703.8068068122061 with 70 steps, done\n",
      "Run episode 944 with rewards -470.41135682600753 with 73 steps, done\n",
      "Run episode 945 with rewards -624.2101320046745 with 66 steps, done\n",
      "Run episode 946 with rewards -699.0272184904147 with 104 steps, done\n",
      "Run episode 947 with rewards -522.0713783777377 with 66 steps, done\n",
      "Run episode 948 with rewards -839.0644482382643 with 114 steps, done\n",
      "Run episode 949 with rewards -576.7701049164947 with 62 steps, done\n",
      "Run episode 950 with rewards -386.67450109738974 with 67 steps, done\n",
      "Run episode 951 with rewards -489.45675781765505 with 54 steps, done\n",
      "Run episode 952 with rewards -1239.2706429291106 with 192 steps, done\n",
      "Run episode 953 with rewards -157.47254761067472 with 74 steps, done\n",
      "Run episode 954 with rewards -105.6645276688278 with 80 steps, done\n",
      "Run episode 955 with rewards -449.98669204310494 with 74 steps, done\n",
      "Run episode 956 with rewards -131.74330705688158 with 61 steps, done\n",
      "Run episode 957 with rewards -245.48236229389133 with 87 steps, done\n",
      "Run episode 958 with rewards -153.40250423361337 with 78 steps, done\n",
      "Run episode 959 with rewards -84.64742295478314 with 93 steps, done\n",
      "Run episode 960 with rewards -142.21900475995773 with 64 steps, done\n",
      "Run episode 961 with rewards -527.4862032570982 with 95 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 962 with rewards -144.39849232798554 with 58 steps, done\n",
      "Run episode 963 with rewards -570.4562595639335 with 68 steps, done\n",
      "Run episode 964 with rewards -594.4635614911316 with 96 steps, done\n",
      "Run episode 965 with rewards -720.2306615858496 with 74 steps, done\n",
      "Run episode 966 with rewards -409.7586486630376 with 110 steps, done\n",
      "Run episode 967 with rewards -829.4897999897324 with 80 steps, done\n",
      "Run episode 968 with rewards -579.9632805285248 with 85 steps, done\n",
      "Run episode 969 with rewards -488.9382848991255 with 73 steps, done\n",
      "Run episode 970 with rewards -284.6977407074739 with 79 steps, done\n",
      "Run episode 971 with rewards -599.030812819678 with 63 steps, done\n",
      "Run episode 972 with rewards -433.886165913954 with 59 steps, done\n",
      "Run episode 973 with rewards -348.79876232172853 with 62 steps, done\n",
      "Run episode 974 with rewards -528.9282768835492 with 62 steps, done\n",
      "Run episode 975 with rewards -264.70760831141115 with 78 steps, done\n",
      "Run episode 976 with rewards -1039.9125103306342 with 131 steps, done\n",
      "Run episode 977 with rewards -323.078837487372 with 53 steps, done\n",
      "Run episode 978 with rewards -632.7552790594715 with 69 steps, done\n",
      "Run episode 979 with rewards -522.3009141835348 with 58 steps, done\n",
      "Run episode 980 with rewards -884.8918866940312 with 109 steps, done\n",
      "Run episode 981 with rewards -138.07792806439696 with 56 steps, done\n",
      "Run episode 982 with rewards -609.4579126720203 with 116 steps, done\n",
      "Run episode 983 with rewards -23.44606065300316 with 75 steps, done\n",
      "Run episode 984 with rewards -789.8469223221032 with 110 steps, done\n",
      "Run episode 985 with rewards -657.7929062600269 with 69 steps, done\n",
      "Run episode 986 with rewards -718.4301368395699 with 114 steps, done\n",
      "Run episode 987 with rewards -143.88153976040053 with 76 steps, done\n",
      "Run episode 988 with rewards -114.09680510105032 with 85 steps, done\n",
      "Run episode 989 with rewards -117.32898127611614 with 56 steps, done\n",
      "Run episode 990 with rewards -412.21286752795345 with 52 steps, done\n",
      "Run episode 991 with rewards -447.50944899153075 with 109 steps, done\n",
      "Run episode 992 with rewards -122.66345340796656 with 55 steps, done\n",
      "Run episode 993 with rewards -995.0742011877967 with 184 steps, done\n",
      "Run episode 994 with rewards -177.81061804814465 with 72 steps, done\n",
      "Run episode 995 with rewards -500.3495218454035 with 83 steps, done\n",
      "Run episode 996 with rewards -190.7471935688532 with 74 steps, done\n",
      "Run episode 997 with rewards -497.6689901764888 with 90 steps, done\n",
      "Run episode 998 with rewards -806.0407803729711 with 110 steps, done\n",
      "Run episode 999 with rewards -128.99301876988866 with 72 steps, done\n",
      "Run episode 1000 with rewards -598.941487338951 with 132 steps, done\n",
      "Run episode 1001 with rewards -134.02999572957026 with 107 steps, done\n",
      "Run episode 1002 with rewards -533.6919675396038 with 56 steps, done\n",
      "Run episode 1003 with rewards -105.26287450821567 with 61 steps, done\n",
      "Run episode 1004 with rewards -378.37155551184014 with 53 steps, done\n",
      "Run episode 1005 with rewards -126.829713419533 with 114 steps, done\n",
      "Run episode 1006 with rewards -553.1606642200868 with 90 steps, done\n",
      "Run episode 1007 with rewards -169.4162635981635 with 68 steps, done\n",
      "Run episode 1008 with rewards -879.5125556844501 with 147 steps, done\n",
      "Run episode 1009 with rewards -98.1356684856646 with 82 steps, done\n",
      "Run episode 1010 with rewards -2210.919361170861 with 271 steps, done\n",
      "Run episode 1011 with rewards -108.54949298584185 with 68 steps, done\n",
      "Run episode 1012 with rewards -815.2664596195909 with 139 steps, done\n",
      "Run episode 1013 with rewards -200.09974194028854 with 75 steps, done\n",
      "Run episode 1014 with rewards -291.3337992160275 with 106 steps, done\n",
      "Run episode 1015 with rewards -420.1635446485046 with 51 steps, done\n",
      "Run episode 1016 with rewards -687.4864776073923 with 86 steps, done\n",
      "Run episode 1017 with rewards -248.49847037699473 with 62 steps, done\n",
      "Run episode 1018 with rewards -755.7365031830391 with 84 steps, done\n",
      "Run episode 1019 with rewards -448.48981819695655 with 77 steps, done\n",
      "Run episode 1020 with rewards -606.4268968121 with 71 steps, done\n",
      "Run episode 1021 with rewards -530.4139536090646 with 88 steps, done\n",
      "Run episode 1022 with rewards -774.7235014867655 with 77 steps, done\n",
      "Run episode 1023 with rewards -456.51515057860956 with 115 steps, done\n",
      "Run episode 1024 with rewards -136.78603972183066 with 66 steps, done\n",
      "Run episode 1025 with rewards -1101.573010293043 with 166 steps, done\n",
      "Run episode 1026 with rewards -151.107933703352 with 113 steps, done\n",
      "Run episode 1027 with rewards -506.32239186276803 with 65 steps, done\n",
      "Run episode 1028 with rewards -464.4311451284131 with 53 steps, done\n",
      "Run episode 1029 with rewards -514.2888207175329 with 89 steps, done\n",
      "Run episode 1030 with rewards -478.9848352766754 with 71 steps, done\n",
      "Run episode 1031 with rewards -449.34007670968253 with 84 steps, done\n",
      "Run episode 1032 with rewards -590.2239875149123 with 114 steps, done\n",
      "Run episode 1033 with rewards -407.0970136165917 with 69 steps, done\n",
      "Run episode 1034 with rewards -748.8254886313143 with 82 steps, done\n",
      "Run episode 1035 with rewards -6983.629554101514 with 492 steps, done\n",
      "Run episode 1036 with rewards -544.8641726211708 with 69 steps, done\n",
      "Run episode 1037 with rewards -397.2876992188772 with 71 steps, done\n",
      "Run episode 1038 with rewards -404.1549393035597 with 50 steps, done\n",
      "Run episode 1039 with rewards -360.3908066029105 with 65 steps, done\n",
      "Run episode 1040 with rewards -346.14015375865347 with 86 steps, done\n",
      "Run episode 1041 with rewards -469.02652209059664 with 78 steps, done\n",
      "Run episode 1042 with rewards -881.750299950348 with 80 steps, done\n",
      "Run episode 1043 with rewards -618.5973783317937 with 107 steps, done\n",
      "Run episode 1044 with rewards -526.8439902301116 with 84 steps, done\n",
      "Run episode 1045 with rewards -407.3331779417803 with 67 steps, done\n",
      "Run episode 1046 with rewards -815.2515214437022 with 78 steps, done\n",
      "Run episode 1047 with rewards -296.69793186625054 with 64 steps, done\n",
      "Run episode 1048 with rewards -546.1654452879836 with 68 steps, done\n",
      "Run episode 1049 with rewards -453.45796004612953 with 83 steps, done\n",
      "Run episode 1050 with rewards -413.3583744808353 with 55 steps, done\n",
      "Run episode 1051 with rewards -780.7548400944319 with 108 steps, done\n",
      "Run episode 1052 with rewards -378.05637064966527 with 49 steps, done\n",
      "Run episode 1053 with rewards -533.2777094560302 with 104 steps, done\n",
      "Run episode 1054 with rewards -100.11171024424753 with 61 steps, done\n",
      "Run episode 1055 with rewards -585.7308655849529 with 72 steps, done\n",
      "Run episode 1056 with rewards -146.64943157585247 with 64 steps, done\n",
      "Run episode 1057 with rewards -1129.0948732120075 with 150 steps, done\n",
      "Run episode 1058 with rewards -144.25544741878963 with 66 steps, done\n",
      "Run episode 1059 with rewards -507.10139943158134 with 68 steps, done\n",
      "Run episode 1060 with rewards -138.22394973915698 with 87 steps, done\n",
      "Run episode 1061 with rewards -564.2304941843825 with 65 steps, done\n",
      "Run episode 1062 with rewards -95.8427954852724 with 55 steps, done\n",
      "Run episode 1063 with rewards -566.341904921415 with 69 steps, done\n",
      "Run episode 1064 with rewards -259.6767340642335 with 58 steps, done\n",
      "Run episode 1065 with rewards -476.1215650516144 with 62 steps, done\n",
      "Run episode 1066 with rewards -437.05381252112977 with 81 steps, done\n",
      "Run episode 1067 with rewards -702.2934680503569 with 68 steps, done\n",
      "Run episode 1068 with rewards -583.1505213888096 with 70 steps, done\n",
      "Run episode 1069 with rewards -163.74927732819248 with 62 steps, done\n",
      "Run episode 1070 with rewards -757.4070642800505 with 93 steps, done\n",
      "Run episode 1071 with rewards -1575.2833651315082 with 216 steps, done\n",
      "Run episode 1072 with rewards -239.64717011404767 with 53 steps, done\n",
      "Run episode 1073 with rewards -813.2880437828792 with 112 steps, done\n",
      "Run episode 1074 with rewards -408.1336880596255 with 102 steps, done\n",
      "Run episode 1075 with rewards -153.48712536313215 with 60 steps, done\n",
      "Run episode 1076 with rewards -601.0912738690519 with 82 steps, done\n",
      "Run episode 1077 with rewards -1065.217866829391 with 130 steps, done\n",
      "Run episode 1078 with rewards -459.9836450000114 with 62 steps, done\n",
      "Run episode 1079 with rewards -339.1598627159925 with 53 steps, done\n",
      "Run episode 1080 with rewards -1043.087189839243 with 160 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 1081 with rewards -580.5856204301099 with 67 steps, done\n",
      "Run episode 1082 with rewards -618.2938211076452 with 81 steps, done\n",
      "Run episode 1083 with rewards -456.4015198441516 with 76 steps, done\n",
      "Run episode 1084 with rewards -772.9534759062647 with 83 steps, done\n",
      "Run episode 1085 with rewards -193.3866169972606 with 75 steps, done\n",
      "Run episode 1086 with rewards -355.2934917687338 with 51 steps, done\n",
      "Run episode 1087 with rewards -621.522872504287 with 101 steps, done\n",
      "Run episode 1088 with rewards -469.0842317285589 with 86 steps, done\n",
      "Run episode 1089 with rewards -1247.1304675034235 with 196 steps, done\n",
      "Run episode 1090 with rewards -112.12147807495131 with 88 steps, done\n",
      "Run episode 1091 with rewards -630.9825166754144 with 99 steps, done\n",
      "Run episode 1092 with rewards -258.81290340971725 with 86 steps, done\n",
      "Run episode 1093 with rewards -528.9457191683282 with 78 steps, done\n",
      "Run episode 1094 with rewards -335.7945480526273 with 49 steps, done\n",
      "Run episode 1095 with rewards -820.5674548675496 with 126 steps, done\n",
      "Run episode 1096 with rewards -214.09176092197558 with 65 steps, done\n",
      "Run episode 1097 with rewards -951.1384092624279 with 173 steps, done\n",
      "Run episode 1098 with rewards -176.05673915872305 with 73 steps, done\n",
      "Run episode 1099 with rewards -480.93967180107 with 76 steps, done\n",
      "Run episode 1100 with rewards -117.16481611379243 with 53 steps, done\n",
      "Run episode 1101 with rewards -268.50359232205966 with 54 steps, done\n",
      "Run episode 1102 with rewards -549.0149026614865 with 137 steps, done\n",
      "Run episode 1103 with rewards -634.2047745691303 with 68 steps, done\n",
      "Run episode 1104 with rewards -216.54215617675555 with 68 steps, done\n",
      "Run episode 1105 with rewards -727.4157648155536 with 150 steps, done\n",
      "Run episode 1106 with rewards -159.64837545573215 with 58 steps, done\n",
      "Run episode 1107 with rewards -129.31735979130417 with 206 steps, done\n",
      "Run episode 1108 with rewards -327.16002136304564 with 51 steps, done\n",
      "Run episode 1109 with rewards -522.883352561959 with 93 steps, done\n",
      "Run episode 1110 with rewards -445.91927325121196 with 70 steps, done\n",
      "Run episode 1111 with rewards -411.53920239296923 with 63 steps, done\n",
      "Run episode 1112 with rewards -455.1359969596688 with 283 steps, done\n",
      "Run episode 1113 with rewards -510.9617015294485 with 61 steps, done\n",
      "Run episode 1114 with rewards -309.49952768512463 with 148 steps, done\n",
      "Run episode 1115 with rewards -960.0120788035838 with 134 steps, done\n",
      "Run episode 1116 with rewards -256.4276514943798 with 75 steps, done\n",
      "Run episode 1117 with rewards -418.9835662302435 with 78 steps, done\n",
      "Run episode 1118 with rewards -121.8984272670477 with 64 steps, done\n",
      "Run episode 1119 with rewards -543.8245206821641 with 106 steps, done\n",
      "Run episode 1120 with rewards -94.8414591559388 with 86 steps, done\n",
      "Run episode 1121 with rewards -564.3676596107148 with 79 steps, done\n",
      "Run episode 1122 with rewards -609.2534834937682 with 68 steps, done\n",
      "Run episode 1123 with rewards -558.5035533224863 with 99 steps, done\n",
      "Run episode 1124 with rewards -420.5111405295155 with 50 steps, done\n",
      "Run episode 1125 with rewards -488.58645102071057 with 61 steps, done\n",
      "Run episode 1126 with rewards -569.8251533043417 with 99 steps, done\n",
      "Run episode 1127 with rewards -513.4133900139661 with 63 steps, done\n",
      "Run episode 1128 with rewards -137.60031144440214 with 68 steps, done\n",
      "Run episode 1129 with rewards -652.3330649198433 with 86 steps, done\n",
      "Run episode 1130 with rewards -523.5813508492497 with 85 steps, done\n",
      "Run episode 1131 with rewards -660.4288383561924 with 80 steps, done\n",
      "Run episode 1132 with rewards -586.2608138855342 with 78 steps, done\n",
      "Run episode 1133 with rewards -639.5527797879942 with 103 steps, done\n",
      "Run episode 1134 with rewards -578.5763960908953 with 65 steps, done\n",
      "Run episode 1135 with rewards -705.6369410679515 with 81 steps, done\n",
      "Run episode 1136 with rewards -516.4398725392705 with 56 steps, done\n",
      "Run episode 1137 with rewards -616.1594603878036 with 103 steps, done\n",
      "Run episode 1138 with rewards -150.05341416139785 with 82 steps, done\n",
      "Run episode 1139 with rewards -105.66761557995146 with 94 steps, done\n",
      "Run episode 1140 with rewards -497.4689647009349 with 102 steps, done\n",
      "Run episode 1141 with rewards -405.04939160249245 with 57 steps, done\n",
      "Run episode 1142 with rewards -203.28519539896462 with 79 steps, done\n",
      "Run episode 1143 with rewards -328.9560323974822 with 57 steps, done\n",
      "Run episode 1144 with rewards -395.51911397102344 with 64 steps, done\n",
      "Run episode 1145 with rewards -370.4903633471228 with 79 steps, done\n",
      "Run episode 1146 with rewards -324.5482255306001 with 85 steps, done\n",
      "Run episode 1147 with rewards -362.39143405214764 with 50 steps, done\n",
      "Run episode 1148 with rewards -508.7464825518664 with 73 steps, done\n",
      "Run episode 1149 with rewards -483.9803440945763 with 97 steps, done\n",
      "Run episode 1150 with rewards -728.473479390205 with 72 steps, done\n",
      "Run episode 1151 with rewards -692.4955003392349 with 94 steps, done\n",
      "Run episode 1152 with rewards -457.7543396164104 with 57 steps, done\n",
      "Run episode 1153 with rewards -510.6040581976204 with 87 steps, done\n",
      "Run episode 1154 with rewards -632.9273742180595 with 68 steps, done\n",
      "Run episode 1155 with rewards -483.7691550401355 with 82 steps, done\n",
      "Run episode 1156 with rewards -642.1034307280987 with 77 steps, done\n",
      "Run episode 1157 with rewards -253.21175524418913 with 74 steps, done\n",
      "Run episode 1158 with rewards -471.7485491783412 with 53 steps, done\n",
      "Run episode 1159 with rewards -424.5115140268685 with 52 steps, done\n",
      "Run episode 1160 with rewards -134.60874060468493 with 65 steps, done\n",
      "Run episode 1161 with rewards -403.78579017140305 with 56 steps, done\n",
      "Run episode 1162 with rewards -603.550789762832 with 123 steps, done\n",
      "Run episode 1163 with rewards -444.13606716690646 with 59 steps, done\n",
      "Run episode 1164 with rewards -348.44572257188594 with 50 steps, done\n",
      "Run episode 1165 with rewards -463.5291362870145 with 63 steps, done\n",
      "Run episode 1166 with rewards -708.4488232519533 with 80 steps, done\n",
      "Run episode 1167 with rewards -766.8665430437368 with 75 steps, done\n",
      "Run episode 1168 with rewards -845.517289016589 with 86 steps, done\n",
      "Run episode 1169 with rewards -494.70290036012165 with 94 steps, done\n",
      "Run episode 1170 with rewards -426.38658535103895 with 58 steps, done\n",
      "Run episode 1171 with rewards -228.2591944627413 with 63 steps, done\n",
      "Run episode 1172 with rewards -524.5162039846839 with 69 steps, done\n",
      "Run episode 1173 with rewards -430.3354318721112 with 51 steps, done\n",
      "Run episode 1174 with rewards -715.2502779614034 with 78 steps, done\n",
      "Run episode 1175 with rewards -503.31228345428644 with 65 steps, done\n",
      "Run episode 1176 with rewards -512.0619234497527 with 88 steps, done\n",
      "Run episode 1177 with rewards -761.2798274339802 with 79 steps, done\n",
      "Run episode 1178 with rewards -283.33042553427833 with 73 steps, done\n",
      "Run episode 1179 with rewards -1117.067220889581 with 90 steps, done\n",
      "Run episode 1180 with rewards -618.1938671682033 with 102 steps, done\n",
      "Run episode 1181 with rewards -421.31777106267305 with 52 steps, done\n",
      "Run episode 1182 with rewards -707.5388134455663 with 126 steps, done\n",
      "Run episode 1183 with rewards -532.5572611158791 with 60 steps, done\n",
      "Run episode 1184 with rewards -147.21549981542626 with 67 steps, done\n",
      "Run episode 1185 with rewards -195.8195624053954 with 93 steps, done\n",
      "Run episode 1186 with rewards -75.42847424859994 with 86 steps, done\n",
      "Run episode 1187 with rewards -178.36489955027696 with 87 steps, done\n",
      "Run episode 1188 with rewards -133.81544267876623 with 62 steps, done\n",
      "Run episode 1189 with rewards -348.0380936631597 with 74 steps, done\n",
      "Run episode 1190 with rewards -386.4501179835802 with 54 steps, done\n",
      "Run episode 1191 with rewards -372.4946056337696 with 107 steps, done\n",
      "Run episode 1192 with rewards -750.9428332377125 with 76 steps, done\n",
      "Run episode 1193 with rewards -612.5254201382135 with 91 steps, done\n",
      "Run episode 1194 with rewards -683.2151942516253 with 78 steps, done\n",
      "Run episode 1195 with rewards -117.36267689931688 with 56 steps, done\n",
      "Run episode 1196 with rewards -636.7714338536447 with 68 steps, done\n",
      "Run episode 1197 with rewards -313.89553280894404 with 83 steps, done\n",
      "Run episode 1198 with rewards -467.9570238404639 with 60 steps, done\n",
      "Run episode 1199 with rewards -612.9128099252018 with 88 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 1200 with rewards -897.3773109888108 with 87 steps, done\n",
      "Run episode 1201 with rewards -455.0496541304582 with 76 steps, done\n",
      "Run episode 1202 with rewards -391.54046455699194 with 54 steps, done\n",
      "Run episode 1203 with rewards -480.9349807066548 with 76 steps, done\n",
      "Run episode 1204 with rewards -779.5241503593714 with 87 steps, done\n",
      "Run episode 1205 with rewards -124.8631230272427 with 57 steps, done\n",
      "Run episode 1206 with rewards -637.8845622467687 with 70 steps, done\n",
      "Run episode 1207 with rewards -509.58604932714786 with 90 steps, done\n",
      "Run episode 1208 with rewards -623.6445563956335 with 72 steps, done\n",
      "Run episode 1209 with rewards 24.86674097544173 with 94 steps, done\n",
      "best\n",
      "Run episode 1210 with rewards -135.90378127938496 with 61 steps, done\n",
      "Run episode 1211 with rewards -191.95321150376898 with 103 steps, done\n",
      "Run episode 1212 with rewards -84.37525857420813 with 56 steps, done\n",
      "Run episode 1213 with rewards -618.4828548675403 with 75 steps, done\n",
      "Run episode 1214 with rewards -960.4550019480472 with 86 steps, done\n",
      "Run episode 1215 with rewards -642.1504951399938 with 74 steps, done\n",
      "Run episode 1216 with rewards -617.6081209658905 with 65 steps, done\n",
      "Run episode 1217 with rewards -525.9888167700374 with 77 steps, done\n",
      "Run episode 1218 with rewards -365.4936825044963 with 53 steps, done\n",
      "Run episode 1219 with rewards -302.0427834195791 with 142 steps, done\n",
      "Run episode 1220 with rewards -713.980035039705 with 85 steps, done\n",
      "Run episode 1221 with rewards -402.8495915299054 with 54 steps, done\n",
      "Run episode 1222 with rewards -810.5077328782456 with 77 steps, done\n",
      "Run episode 1223 with rewards -548.5211682197912 with 81 steps, done\n",
      "Run episode 1224 with rewards -463.80564547693996 with 54 steps, done\n",
      "Run episode 1225 with rewards -350.320322248916 with 63 steps, done\n",
      "Run episode 1226 with rewards -555.6168770968852 with 68 steps, done\n",
      "Run episode 1227 with rewards -468.3774880525817 with 74 steps, done\n",
      "Run episode 1228 with rewards -570.5764215470563 with 62 steps, done\n",
      "Run episode 1229 with rewards -370.1443355721503 with 80 steps, done\n",
      "Run episode 1230 with rewards -786.7408723940595 with 76 steps, done\n",
      "Run episode 1231 with rewards -148.5471660206263 with 83 steps, done\n",
      "Run episode 1232 with rewards -110.50339986384714 with 118 steps, done\n",
      "Run episode 1233 with rewards -156.65989428488328 with 65 steps, done\n",
      "Run episode 1234 with rewards -431.73398399578764 with 86 steps, done\n",
      "Run episode 1235 with rewards -137.8949005495712 with 69 steps, done\n",
      "Run episode 1236 with rewards -412.549867574834 with 86 steps, done\n",
      "Run episode 1237 with rewards -145.6768780136079 with 74 steps, done\n",
      "Run episode 1238 with rewards -329.7752303270019 with 113 steps, done\n",
      "Run episode 1239 with rewards -145.88064527582793 with 68 steps, done\n",
      "Run episode 1240 with rewards -93.52279917197478 with 71 steps, done\n",
      "Run episode 1241 with rewards -161.4442395424273 with 86 steps, done\n",
      "Run episode 1242 with rewards -383.73200422338607 with 122 steps, done\n",
      "Run episode 1243 with rewards -683.948448843687 with 77 steps, done\n",
      "Run episode 1244 with rewards -822.594790715026 with 150 steps, done\n",
      "Run episode 1245 with rewards -400.24551818480666 with 54 steps, done\n",
      "Run episode 1246 with rewards -81.37711926503471 with 85 steps, done\n",
      "Run episode 1247 with rewards -1390.1089771872316 with 208 steps, done\n",
      "Run episode 1248 with rewards -111.28009390284566 with 57 steps, done\n",
      "Run episode 1249 with rewards -438.3726793398007 with 81 steps, done\n",
      "Run episode 1250 with rewards -132.55863553677744 with 65 steps, done\n",
      "Run episode 1251 with rewards -596.994797940911 with 77 steps, done\n",
      "Run episode 1252 with rewards -139.73847871166964 with 69 steps, done\n",
      "Run episode 1253 with rewards -320.4259959773456 with 107 steps, done\n",
      "Run episode 1254 with rewards -485.8612784550464 with 165 steps, done\n",
      "Run episode 1255 with rewards -433.2556643721675 with 102 steps, done\n",
      "Run episode 1256 with rewards -157.26359309162598 with 76 steps, done\n",
      "Run episode 1257 with rewards -122.08614060895798 with 74 steps, done\n",
      "Run episode 1258 with rewards -120.9681096350499 with 74 steps, done\n",
      "Run episode 1259 with rewards -492.1972635595389 with 71 steps, done\n",
      "Run episode 1260 with rewards -313.11660266092986 with 80 steps, done\n",
      "Run episode 1261 with rewards -631.0546705439119 with 66 steps, done\n",
      "Run episode 1262 with rewards -586.6160806701148 with 98 steps, done\n",
      "Run episode 1263 with rewards -387.4122627774458 with 102 steps, done\n",
      "Run episode 1264 with rewards -214.61037008106146 with 83 steps, done\n",
      "Run episode 1265 with rewards -735.9921194978901 with 73 steps, done\n",
      "Run episode 1266 with rewards -461.72676423370956 with 113 steps, done\n",
      "Run episode 1267 with rewards -545.161958470738 with 58 steps, done\n",
      "Run episode 1268 with rewards -172.8759941402027 with 91 steps, done\n",
      "Run episode 1269 with rewards -130.14931061323932 with 54 steps, done\n",
      "Run episode 1270 with rewards -44.278360300126806 with 78 steps, done\n",
      "Run episode 1271 with rewards -386.3179890422784 with 149 steps, done\n",
      "Run episode 1272 with rewards -251.35403770573424 with 94 steps, done\n",
      "Run episode 1273 with rewards -179.15922538159464 with 73 steps, done\n",
      "Run episode 1274 with rewards -140.93380771868016 with 101 steps, done\n",
      "Run episode 1275 with rewards -34.62633702562974 with 91 steps, done\n",
      "Run episode 1276 with rewards -94.04788942954289 with 98 steps, done\n",
      "Run episode 1277 with rewards -1168.7942137232756 with 243 steps, done\n",
      "Run episode 1278 with rewards -473.8301010510132 with 78 steps, done\n",
      "Run episode 1279 with rewards -236.38313750854658 with 85 steps, done\n",
      "Run episode 1280 with rewards -791.6311516982698 with 124 steps, done\n",
      "Run episode 1281 with rewards -2.798954341385638 with 89 steps, done\n",
      "Run episode 1282 with rewards -1225.7747956196533 with 153 steps, done\n",
      "Run episode 1283 with rewards -388.4003914365214 with 52 steps, done\n",
      "Run episode 1284 with rewards -568.8177758614976 with 59 steps, done\n",
      "Run episode 1285 with rewards -362.3419731046434 with 135 steps, done\n",
      "Run episode 1286 with rewards -110.17334356154484 with 54 steps, done\n",
      "Run episode 1287 with rewards -1953.0458589779835 with 213 steps, done\n",
      "Run episode 1288 with rewards -197.81958242644617 with 86 steps, done\n",
      "Run episode 1289 with rewards -458.4286908799107 with 76 steps, done\n",
      "Run episode 1290 with rewards -136.03428691777884 with 96 steps, done\n",
      "Run episode 1291 with rewards -476.97838302136626 with 135 steps, done\n",
      "Run episode 1292 with rewards -570.6610945212055 with 61 steps, done\n",
      "Run episode 1293 with rewards -455.8001243753099 with 89 steps, done\n",
      "Run episode 1294 with rewards -387.1692752969939 with 80 steps, done\n",
      "Run episode 1295 with rewards -695.7914441625919 with 146 steps, done\n",
      "Run episode 1296 with rewards -377.86433596942675 with 153 steps, done\n",
      "Run episode 1297 with rewards -353.9435655418447 with 50 steps, done\n",
      "Run episode 1298 with rewards -691.2681885535362 with 79 steps, done\n",
      "Run episode 1299 with rewards -642.0901727452957 with 72 steps, done\n",
      "Run episode 1300 with rewards -767.9789406258759 with 84 steps, done\n",
      "Run episode 1301 with rewards -329.6093718183022 with 74 steps, done\n",
      "Run episode 1302 with rewards -659.0720725407099 with 76 steps, done\n",
      "Run episode 1303 with rewards -531.4572610377147 with 58 steps, done\n",
      "Run episode 1304 with rewards -817.2708242479159 with 113 steps, done\n",
      "Run episode 1305 with rewards -776.131185750356 with 77 steps, done\n",
      "Run episode 1306 with rewards -581.6206029351938 with 118 steps, done\n",
      "Run episode 1307 with rewards -598.8944648132712 with 72 steps, done\n",
      "Run episode 1308 with rewards -101.89446630799527 with 67 steps, done\n",
      "Run episode 1309 with rewards -625.6376178039026 with 226 steps, done\n",
      "Run episode 1310 with rewards -465.16206276758965 with 63 steps, done\n",
      "Run episode 1311 with rewards -765.3728752685274 with 75 steps, done\n",
      "Run episode 1312 with rewards -329.84820315597705 with 90 steps, done\n",
      "Run episode 1313 with rewards -707.394467325614 with 76 steps, done\n",
      "Run episode 1314 with rewards -455.464111006407 with 72 steps, done\n",
      "Run episode 1315 with rewards -233.55166386225957 with 59 steps, done\n",
      "Run episode 1316 with rewards -338.20147152875984 with 67 steps, done\n",
      "Run episode 1317 with rewards -678.545653271816 with 77 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 1318 with rewards -144.00541030112143 with 80 steps, done\n",
      "Run episode 1319 with rewards -551.355144924979 with 66 steps, done\n",
      "Run episode 1320 with rewards -652.1681650167571 with 88 steps, done\n",
      "Run episode 1321 with rewards -603.0477519499202 with 67 steps, done\n",
      "Run episode 1322 with rewards -209.25992251850224 with 72 steps, done\n",
      "Run episode 1323 with rewards -464.82699604800746 with 57 steps, done\n",
      "Run episode 1324 with rewards -118.33421102578816 with 74 steps, done\n",
      "Run episode 1325 with rewards -607.8696175287544 with 124 steps, done\n",
      "Run episode 1326 with rewards -129.30765750867536 with 83 steps, done\n",
      "Run episode 1327 with rewards -460.85473526230726 with 89 steps, done\n",
      "Run episode 1328 with rewards -256.7964336793958 with 83 steps, done\n",
      "Run episode 1329 with rewards -820.7449104965606 with 109 steps, done\n",
      "Run episode 1330 with rewards -118.7807201398752 with 88 steps, done\n",
      "Run episode 1331 with rewards -176.19282593823343 with 170 steps, done\n",
      "Run episode 1332 with rewards -178.17542080877743 with 126 steps, done\n",
      "Run episode 1333 with rewards -562.2746347678909 with 84 steps, done\n",
      "Run episode 1334 with rewards -149.9515160090878 with 85 steps, done\n",
      "Run episode 1335 with rewards -657.4982520976141 with 99 steps, done\n",
      "Run episode 1336 with rewards -134.89654372614712 with 73 steps, done\n",
      "Run episode 1337 with rewards -670.0382591108631 with 97 steps, done\n",
      "Run episode 1338 with rewards -111.20661926929733 with 84 steps, done\n",
      "Run episode 1339 with rewards -640.3521743281079 with 98 steps, done\n",
      "Run episode 1340 with rewards -110.7321674451157 with 72 steps, done\n",
      "Run episode 1341 with rewards -891.7360563214692 with 157 steps, done\n",
      "Run episode 1342 with rewards -143.65516632761552 with 57 steps, done\n",
      "Run episode 1343 with rewards -461.90279886644527 with 154 steps, done\n",
      "Run episode 1344 with rewards -564.1580446384635 with 63 steps, done\n",
      "Run episode 1345 with rewards -14.861348032635902 with 80 steps, done\n",
      "Run episode 1346 with rewards -158.70525334662182 with 74 steps, done\n",
      "Run episode 1347 with rewards -62.90944344843692 with 68 steps, done\n",
      "Run episode 1348 with rewards -394.81191769749705 with 82 steps, done\n",
      "Run episode 1349 with rewards -177.76009152412718 with 63 steps, done\n",
      "Run episode 1350 with rewards -1009.8614926606541 with 85 steps, done\n",
      "Run episode 1351 with rewards -145.60968444858213 with 55 steps, done\n",
      "Run episode 1352 with rewards -429.94595158454626 with 54 steps, done\n",
      "Run episode 1353 with rewards -197.29802762524696 with 58 steps, done\n",
      "Run episode 1354 with rewards -833.1428562824871 with 87 steps, done\n",
      "Run episode 1355 with rewards -418.5087403692191 with 89 steps, done\n",
      "Run episode 1356 with rewards -405.94375433005627 with 50 steps, done\n",
      "Run episode 1357 with rewards -670.7692440058546 with 98 steps, done\n",
      "Run episode 1358 with rewards -440.6094404966945 with 57 steps, done\n",
      "Run episode 1359 with rewards -409.2926605655345 with 99 steps, done\n",
      "Run episode 1360 with rewards -375.84535923132086 with 50 steps, done\n",
      "Run episode 1361 with rewards -609.9469108332743 with 101 steps, done\n",
      "Run episode 1362 with rewards -500.9389979160629 with 62 steps, done\n",
      "Run episode 1363 with rewards -401.47463999833485 with 96 steps, done\n",
      "Run episode 1364 with rewards -569.5855108378041 with 123 steps, done\n",
      "Run episode 1365 with rewards -125.94282968444702 with 86 steps, done\n",
      "Run episode 1366 with rewards -596.5285893299382 with 92 steps, done\n",
      "Run episode 1367 with rewards -120.30613885394355 with 57 steps, done\n",
      "Run episode 1368 with rewards -620.9782661610135 with 95 steps, done\n",
      "Run episode 1369 with rewards -115.16088515410196 with 88 steps, done\n",
      "Run episode 1370 with rewards -263.0200049262298 with 133 steps, done\n",
      "Run episode 1371 with rewards -127.43383873545682 with 79 steps, done\n",
      "Run episode 1372 with rewards -444.00694291414266 with 85 steps, done\n",
      "Run episode 1373 with rewards -658.6975314029579 with 70 steps, done\n",
      "Run episode 1374 with rewards -194.72058539406197 with 82 steps, done\n",
      "Run episode 1375 with rewards -547.3041697164243 with 59 steps, done\n",
      "Run episode 1376 with rewards -575.5547368886823 with 96 steps, done\n",
      "Run episode 1377 with rewards -383.4353278676051 with 56 steps, done\n",
      "Run episode 1378 with rewards -267.2275130851285 with 67 steps, done\n",
      "Run episode 1379 with rewards -127.09706498187089 with 57 steps, done\n",
      "Run episode 1380 with rewards -535.5088943467244 with 78 steps, done\n",
      "Run episode 1381 with rewards -151.14351531131916 with 91 steps, done\n",
      "Run episode 1382 with rewards -367.5015984451013 with 83 steps, done\n",
      "Run episode 1383 with rewards -779.0271592597757 with 78 steps, done\n",
      "Run episode 1384 with rewards -474.9022559509219 with 61 steps, done\n",
      "Run episode 1385 with rewards -361.33633456541526 with 67 steps, done\n",
      "Run episode 1386 with rewards -498.25800788549765 with 57 steps, done\n",
      "Run episode 1387 with rewards -541.6865372498048 with 59 steps, done\n",
      "Run episode 1388 with rewards -806.4905246976633 with 85 steps, done\n",
      "Run episode 1389 with rewards -496.9274042942984 with 56 steps, done\n",
      "Run episode 1390 with rewards -618.7474275267284 with 87 steps, done\n",
      "Run episode 1391 with rewards -903.1631217524231 with 86 steps, done\n",
      "Run episode 1392 with rewards -586.8808333253593 with 99 steps, done\n",
      "Run episode 1393 with rewards -688.9611268105226 with 103 steps, done\n",
      "Run episode 1394 with rewards -666.5990282680373 with 122 steps, done\n",
      "Run episode 1395 with rewards -793.8458906413641 with 84 steps, done\n",
      "Run episode 1396 with rewards -118.24288082190652 with 95 steps, done\n",
      "Run episode 1397 with rewards -129.43681894429733 with 87 steps, done\n",
      "Run episode 1398 with rewards -232.3906449530921 with 58 steps, done\n",
      "Run episode 1399 with rewards -136.7908633591788 with 79 steps, done\n",
      "Run episode 1400 with rewards -364.2542523420879 with 50 steps, done\n",
      "Run episode 1401 with rewards -642.3244326504008 with 72 steps, done\n",
      "Run episode 1402 with rewards -731.1647056594621 with 92 steps, done\n",
      "Run episode 1403 with rewards -716.854367923543 with 117 steps, done\n",
      "Run episode 1404 with rewards -846.0855800373366 with 84 steps, done\n",
      "Run episode 1405 with rewards -492.69511270700616 with 119 steps, done\n",
      "Run episode 1406 with rewards -754.4172378976602 with 76 steps, done\n",
      "Run episode 1407 with rewards -499.32686243379953 with 115 steps, done\n",
      "Run episode 1408 with rewards -718.0167507725934 with 81 steps, done\n",
      "Run episode 1409 with rewards -413.81788315712265 with 55 steps, done\n",
      "Run episode 1410 with rewards -570.1586340954641 with 65 steps, done\n",
      "Run episode 1411 with rewards -589.4752934941174 with 101 steps, done\n",
      "Run episode 1412 with rewards -759.5181743952958 with 77 steps, done\n",
      "Run episode 1413 with rewards -312.78747660177476 with 68 steps, done\n",
      "Run episode 1414 with rewards -865.5851786288187 with 80 steps, done\n",
      "Run episode 1415 with rewards -620.1142195242578 with 83 steps, done\n",
      "Run episode 1416 with rewards -517.7844299918594 with 70 steps, done\n",
      "Run episode 1417 with rewards -227.48993095589287 with 84 steps, done\n",
      "Run episode 1418 with rewards -532.3756669023962 with 58 steps, done\n",
      "Run episode 1419 with rewards -379.0018029724489 with 55 steps, done\n",
      "Run episode 1420 with rewards -99.28971962268923 with 53 steps, done\n",
      "Run episode 1421 with rewards -122.53466039105362 with 54 steps, done\n",
      "Run episode 1422 with rewards -610.4611668172715 with 65 steps, done\n",
      "Run episode 1423 with rewards -528.2809651833936 with 116 steps, done\n",
      "Run episode 1424 with rewards -802.3282710182863 with 77 steps, done\n",
      "Run episode 1425 with rewards -546.0670257875863 with 98 steps, done\n",
      "Run episode 1426 with rewards -785.9582465251714 with 80 steps, done\n",
      "Run episode 1427 with rewards -373.4914214129114 with 86 steps, done\n",
      "Run episode 1428 with rewards -629.8152773915579 with 66 steps, done\n",
      "Run episode 1429 with rewards -303.708831529785 with 69 steps, done\n",
      "Run episode 1430 with rewards -500.99868215413085 with 59 steps, done\n",
      "Run episode 1431 with rewards -428.4331490155337 with 100 steps, done\n",
      "Run episode 1432 with rewards -168.93133790753228 with 61 steps, done\n",
      "Run episode 1433 with rewards -473.0218535086538 with 55 steps, done\n",
      "Run episode 1434 with rewards -414.14633402350773 with 107 steps, done\n",
      "Run episode 1435 with rewards -419.56339722387855 with 53 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 1436 with rewards -144.8089545840225 with 55 steps, done\n",
      "Run episode 1437 with rewards -116.77787985045384 with 130 steps, done\n",
      "Run episode 1438 with rewards -249.6770004947296 with 91 steps, done\n",
      "Run episode 1439 with rewards -564.8758748567069 with 73 steps, done\n",
      "Run episode 1440 with rewards -167.00818408369545 with 76 steps, done\n",
      "Run episode 1441 with rewards -114.75847864008502 with 94 steps, done\n",
      "Run episode 1442 with rewards -1630.1336488021836 with 277 steps, done\n",
      "Run episode 1443 with rewards -527.5932153870716 with 58 steps, done\n",
      "Run episode 1444 with rewards -638.0654545941201 with 111 steps, done\n",
      "Run episode 1445 with rewards -632.3178797129929 with 70 steps, done\n",
      "Run episode 1446 with rewards -528.047411154967 with 91 steps, done\n",
      "Run episode 1447 with rewards -510.1289602547206 with 68 steps, done\n",
      "Run episode 1448 with rewards -794.4285993147644 with 81 steps, done\n",
      "Run episode 1449 with rewards -585.7320096918203 with 75 steps, done\n",
      "Run episode 1450 with rewards -869.8054731154758 with 80 steps, done\n",
      "Run episode 1451 with rewards -358.3082086821922 with 80 steps, done\n",
      "Run episode 1452 with rewards -401.56446449323494 with 48 steps, done\n",
      "Run episode 1453 with rewards -477.7435294351485 with 79 steps, done\n",
      "Run episode 1454 with rewards -384.66343795958824 with 71 steps, done\n",
      "Run episode 1455 with rewards -169.5904176255326 with 87 steps, done\n",
      "Run episode 1456 with rewards -482.68562051365353 with 59 steps, done\n",
      "Run episode 1457 with rewards -583.9628165272115 with 74 steps, done\n",
      "Run episode 1458 with rewards -441.19411461885784 with 75 steps, done\n",
      "Run episode 1459 with rewards -412.1449025567103 with 102 steps, done\n",
      "Run episode 1460 with rewards -511.5068152588502 with 58 steps, done\n",
      "Run episode 1461 with rewards -494.26082874859014 with 73 steps, done\n",
      "Run episode 1462 with rewards -375.69938373142463 with 85 steps, done\n",
      "Run episode 1463 with rewards -561.0737709696396 with 59 steps, done\n",
      "Run episode 1464 with rewards -329.7387992488333 with 66 steps, done\n",
      "Run episode 1465 with rewards -574.2057738119962 with 70 steps, done\n",
      "Run episode 1466 with rewards -79.25973087019358 with 67 steps, done\n",
      "Run episode 1467 with rewards -800.0770328134183 with 76 steps, done\n",
      "Run episode 1468 with rewards -484.3932045452107 with 62 steps, done\n",
      "Run episode 1469 with rewards -89.53941423707951 with 148 steps, done\n",
      "Run episode 1470 with rewards -661.893851884838 with 99 steps, done\n",
      "Run episode 1471 with rewards -620.7177001183333 with 83 steps, done\n",
      "Run episode 1472 with rewards -117.83206202917165 with 63 steps, done\n",
      "Run episode 1473 with rewards -124.7004606831272 with 146 steps, done\n",
      "Run episode 1474 with rewards -97.48262287767315 with 59 steps, done\n",
      "Run episode 1475 with rewards -977.1947619912803 with 132 steps, done\n",
      "Run episode 1476 with rewards -190.16498387392664 with 93 steps, done\n",
      "Run episode 1477 with rewards -561.7545324350472 with 85 steps, done\n",
      "Run episode 1478 with rewards -163.8597671994092 with 73 steps, done\n",
      "Run episode 1479 with rewards -528.0971959941538 with 113 steps, done\n",
      "Run episode 1480 with rewards -179.9243324255487 with 52 steps, done\n",
      "Run episode 1481 with rewards -609.5892991853784 with 102 steps, done\n",
      "Run episode 1482 with rewards -519.0536347477155 with 67 steps, done\n",
      "Run episode 1483 with rewards -220.91888318356013 with 191 steps, done\n",
      "Run episode 1484 with rewards -419.18272049392 with 58 steps, done\n",
      "Run episode 1485 with rewards -279.4203299289875 with 64 steps, done\n",
      "Run episode 1486 with rewards -817.9694174000215 with 77 steps, done\n",
      "Run episode 1487 with rewards -360.69231586548585 with 71 steps, done\n",
      "Run episode 1488 with rewards -568.3562346821067 with 89 steps, done\n",
      "Run episode 1489 with rewards -305.68676514598485 with 50 steps, done\n",
      "Run episode 1490 with rewards -449.4191924093513 with 55 steps, done\n",
      "Run episode 1491 with rewards -273.3216497758067 with 72 steps, done\n",
      "Run episode 1492 with rewards -351.19421527641134 with 87 steps, done\n",
      "Run episode 1493 with rewards -85.87053162393367 with 55 steps, done\n",
      "Run episode 1494 with rewards -929.5253691098238 with 119 steps, done\n",
      "Run episode 1495 with rewards -161.8106255536713 with 67 steps, done\n",
      "Run episode 1496 with rewards -695.8872693266857 with 129 steps, done\n",
      "Run episode 1497 with rewards -147.53343229480453 with 77 steps, done\n",
      "Run episode 1498 with rewards -585.8541449918839 with 81 steps, done\n",
      "Run episode 1499 with rewards -163.51928643139917 with 63 steps, done\n",
      "Run episode 1500 with rewards -884.5672928456971 with 140 steps, done\n",
      "Run episode 1501 with rewards -212.69582148388395 with 73 steps, done\n",
      "Run episode 1502 with rewards -1605.180911607505 with 213 steps, done\n",
      "Run episode 1503 with rewards -907.0012720698375 with 82 steps, done\n",
      "Run episode 1504 with rewards -112.79726536536552 with 85 steps, done\n",
      "Run episode 1505 with rewards -1895.5281830123174 with 262 steps, done\n",
      "Run episode 1506 with rewards -368.9529072136895 with 69 steps, done\n",
      "Run episode 1507 with rewards -481.005780269065 with 68 steps, done\n",
      "Run episode 1508 with rewards -210.09450259241598 with 152 steps, done\n",
      "Run episode 1509 with rewards -134.01116107516825 with 55 steps, done\n",
      "Run episode 1510 with rewards -147.43307390398272 with 146 steps, done\n",
      "Run episode 1511 with rewards -155.45648336120868 with 69 steps, done\n",
      "Run episode 1512 with rewards -118.0969878100164 with 81 steps, done\n",
      "Run episode 1513 with rewards -522.9659397202885 with 65 steps, done\n",
      "Run episode 1514 with rewards -140.490459851029 with 54 steps, done\n",
      "Run episode 1515 with rewards -641.6099277607603 with 77 steps, done\n",
      "Run episode 1516 with rewards -361.68285592037597 with 90 steps, done\n",
      "Run episode 1517 with rewards -475.08488440352323 with 71 steps, done\n",
      "Run episode 1518 with rewards -525.2981199319884 with 134 steps, done\n",
      "Run episode 1519 with rewards -465.7627366928765 with 60 steps, done\n",
      "Run episode 1520 with rewards -449.4877369801001 with 73 steps, done\n",
      "Run episode 1521 with rewards -726.6788168755036 with 77 steps, done\n",
      "Run episode 1522 with rewards -339.3333540103529 with 105 steps, done\n",
      "Run episode 1523 with rewards -982.5994110611347 with 123 steps, done\n",
      "Run episode 1524 with rewards -147.56647710814735 with 62 steps, done\n",
      "Run episode 1525 with rewards -328.48484908926986 with 142 steps, done\n",
      "Run episode 1526 with rewards -460.13494957132946 with 60 steps, done\n",
      "Run episode 1527 with rewards -425.86051620029923 with 56 steps, done\n",
      "Run episode 1528 with rewards -279.570858483194 with 99 steps, done\n",
      "Run episode 1529 with rewards -534.6910290071163 with 57 steps, done\n",
      "Run episode 1530 with rewards -248.5286019694776 with 67 steps, done\n",
      "Run episode 1531 with rewards -684.9527594221898 with 102 steps, done\n",
      "Run episode 1532 with rewards -623.6689502280005 with 62 steps, done\n",
      "Run episode 1533 with rewards -414.7011264973654 with 98 steps, done\n",
      "Run episode 1534 with rewards -124.70821769132337 with 65 steps, done\n",
      "Run episode 1535 with rewards -333.3474907092419 with 98 steps, done\n",
      "Run episode 1536 with rewards -176.01769213373638 with 101 steps, done\n",
      "Run episode 1537 with rewards -124.18779534194255 with 60 steps, done\n",
      "Run episode 1538 with rewards -219.18880752002468 with 67 steps, done\n",
      "Run episode 1539 with rewards -127.3642411226131 with 54 steps, done\n",
      "Run episode 1540 with rewards -335.155081125524 with 95 steps, done\n",
      "Run episode 1541 with rewards -124.82748394578175 with 69 steps, done\n",
      "Run episode 1542 with rewards -121.17905783184433 with 139 steps, done\n",
      "Run episode 1543 with rewards -60.65135966393106 with 56 steps, done\n",
      "Run episode 1544 with rewards 9.595303409375404 with 86 steps, done\n",
      "Run episode 1545 with rewards -604.1787643539471 with 77 steps, done\n",
      "Run episode 1546 with rewards -167.7700576817501 with 68 steps, done\n",
      "Run episode 1547 with rewards -635.5590122462265 with 81 steps, done\n",
      "Run episode 1548 with rewards -115.65665266902158 with 88 steps, done\n",
      "Run episode 1549 with rewards -1132.5124723661497 with 156 steps, done\n",
      "Run episode 1550 with rewards -118.85472934538379 with 58 steps, done\n",
      "Run episode 1551 with rewards -627.4973452203383 with 88 steps, done\n",
      "Run episode 1552 with rewards -14.17173005547231 with 86 steps, done\n",
      "Run episode 1553 with rewards -428.2502814881782 with 78 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 1554 with rewards -242.45826808111093 with 100 steps, done\n",
      "Run episode 1555 with rewards -288.330691766791 with 63 steps, done\n",
      "Run episode 1556 with rewards -272.0701986983531 with 67 steps, done\n",
      "Run episode 1557 with rewards -553.4639782965285 with 59 steps, done\n",
      "Run episode 1558 with rewards -166.61745614034828 with 66 steps, done\n",
      "Run episode 1559 with rewards -112.15079540289534 with 76 steps, done\n",
      "Run episode 1560 with rewards -95.88700205290651 with 86 steps, done\n",
      "Run episode 1561 with rewards -634.5784881416598 with 103 steps, done\n",
      "Run episode 1562 with rewards -325.7568861502285 with 63 steps, done\n",
      "Run episode 1563 with rewards -308.6373394651856 with 92 steps, done\n",
      "Run episode 1564 with rewards -293.4509551773715 with 77 steps, done\n",
      "Run episode 1565 with rewards -462.0887895280384 with 59 steps, done\n",
      "Run episode 1566 with rewards -477.0541729520992 with 53 steps, done\n",
      "Run episode 1567 with rewards -672.8787361827775 with 110 steps, done\n",
      "Run episode 1568 with rewards -534.4734564628266 with 59 steps, done\n",
      "Run episode 1569 with rewards -422.55649422835455 with 67 steps, done\n",
      "Run episode 1570 with rewards -485.89993480457804 with 70 steps, done\n",
      "Run episode 1571 with rewards -520.8868514007947 with 81 steps, done\n",
      "Run episode 1572 with rewards -790.995726511648 with 81 steps, done\n",
      "Run episode 1573 with rewards -654.3684088292006 with 91 steps, done\n",
      "Run episode 1574 with rewards -838.9889524655487 with 79 steps, done\n",
      "Run episode 1575 with rewards -449.3377565096446 with 69 steps, done\n",
      "Run episode 1576 with rewards -626.8436240147971 with 72 steps, done\n",
      "Run episode 1577 with rewards -642.3434474915153 with 104 steps, done\n",
      "Run episode 1578 with rewards -499.8952158068712 with 68 steps, done\n",
      "Run episode 1579 with rewards -554.5716333629534 with 94 steps, done\n",
      "Run episode 1580 with rewards -796.3512676422049 with 79 steps, done\n",
      "Run episode 1581 with rewards -334.7814295518878 with 89 steps, done\n",
      "Run episode 1582 with rewards -376.98523369075946 with 86 steps, done\n",
      "Run episode 1583 with rewards -147.6820340530359 with 53 steps, done\n",
      "Run episode 1584 with rewards -36.259650377022695 with 140 steps, done\n",
      "Run episode 1585 with rewards -158.34975125582787 with 68 steps, done\n",
      "Run episode 1586 with rewards -539.3197105529705 with 72 steps, done\n",
      "Run episode 1587 with rewards -341.22162312217813 with 93 steps, done\n",
      "Run episode 1588 with rewards -520.9661961773757 with 94 steps, done\n",
      "Run episode 1589 with rewards -173.2442275015535 with 66 steps, done\n",
      "Run episode 1590 with rewards -2548.312571270115 with 303 steps, done\n",
      "Run episode 1591 with rewards -444.7317156167696 with 72 steps, done\n",
      "Run episode 1592 with rewards -318.1317991472905 with 99 steps, done\n",
      "Run episode 1593 with rewards -834.3281757822812 with 88 steps, done\n",
      "Run episode 1594 with rewards -496.49058645335316 with 102 steps, done\n",
      "Run episode 1595 with rewards -638.6466090265792 with 69 steps, done\n",
      "Run episode 1596 with rewards -388.51506170591597 with 93 steps, done\n",
      "Run episode 1597 with rewards -423.0694514603745 with 54 steps, done\n",
      "Run episode 1598 with rewards -482.3554393019614 with 78 steps, done\n",
      "Run episode 1599 with rewards -455.03632991451116 with 79 steps, done\n",
      "Run episode 1600 with rewards -445.9642559727127 with 69 steps, done\n",
      "Run episode 1601 with rewards -129.12264156459312 with 67 steps, done\n",
      "Run episode 1602 with rewards -823.5429894162038 with 77 steps, done\n",
      "Run episode 1603 with rewards -305.1374869085454 with 64 steps, done\n",
      "Run episode 1604 with rewards -785.1760537292784 with 78 steps, done\n",
      "Run episode 1605 with rewards -680.6137436963576 with 123 steps, done\n",
      "Run episode 1606 with rewards -348.12092882689035 with 53 steps, done\n",
      "Run episode 1607 with rewards -517.1725534184561 with 88 steps, done\n",
      "Run episode 1608 with rewards -162.842153751184 with 78 steps, done\n",
      "Run episode 1609 with rewards -613.3105406756757 with 66 steps, done\n",
      "Run episode 1610 with rewards -441.7396202941904 with 84 steps, done\n",
      "Run episode 1611 with rewards -768.9856902088575 with 77 steps, done\n",
      "Run episode 1612 with rewards -142.0768515354715 with 83 steps, done\n",
      "Run episode 1613 with rewards -489.35161284328865 with 68 steps, done\n",
      "Run episode 1614 with rewards -225.4815810375337 with 118 steps, done\n",
      "Run episode 1615 with rewards -172.2559248771802 with 70 steps, done\n",
      "Run episode 1616 with rewards -346.2488387478095 with 51 steps, done\n",
      "Run episode 1617 with rewards -103.74398439218712 with 55 steps, done\n",
      "Run episode 1618 with rewards -419.13178474537114 with 98 steps, done\n",
      "Run episode 1619 with rewards -611.2277680693999 with 114 steps, done\n",
      "Run episode 1620 with rewards -608.2601231374987 with 66 steps, done\n",
      "Run episode 1621 with rewards -302.07649117858284 with 73 steps, done\n",
      "Run episode 1622 with rewards -407.9649453903308 with 50 steps, done\n",
      "Run episode 1623 with rewards -643.7916459102339 with 104 steps, done\n",
      "Run episode 1624 with rewards -335.50739711210065 with 51 steps, done\n",
      "Run episode 1625 with rewards -114.68377042325416 with 111 steps, done\n",
      "Run episode 1626 with rewards -145.53354114771076 with 102 steps, done\n",
      "Run episode 1627 with rewards -108.01844376473923 with 52 steps, done\n",
      "Run episode 1628 with rewards -401.7793710652624 with 73 steps, done\n",
      "Run episode 1629 with rewards -464.8942049152931 with 56 steps, done\n",
      "Run episode 1630 with rewards -566.9677812004618 with 81 steps, done\n",
      "Run episode 1631 with rewards -529.6196165791271 with 67 steps, done\n",
      "Run episode 1632 with rewards -340.62630215344416 with 52 steps, done\n",
      "Run episode 1633 with rewards -838.239447340499 with 78 steps, done\n",
      "Run episode 1634 with rewards -526.596936854606 with 56 steps, done\n",
      "Run episode 1635 with rewards -510.6735762933479 with 84 steps, done\n",
      "Run episode 1636 with rewards -647.292671053843 with 77 steps, done\n",
      "Run episode 1637 with rewards -316.7919202935061 with 113 steps, done\n",
      "Run episode 1638 with rewards -519.8007087635899 with 64 steps, done\n",
      "Run episode 1639 with rewards -139.45908300498007 with 71 steps, done\n",
      "Run episode 1640 with rewards -152.2349165037323 with 80 steps, done\n",
      "Run episode 1641 with rewards -109.92263628403313 with 89 steps, done\n",
      "Run episode 1642 with rewards -740.3577416588545 with 80 steps, done\n",
      "Run episode 1643 with rewards -162.17583973311037 with 86 steps, done\n",
      "Run episode 1644 with rewards -553.0120936043368 with 67 steps, done\n",
      "Run episode 1645 with rewards -397.592631940602 with 64 steps, done\n",
      "Run episode 1646 with rewards -382.7220430259562 with 50 steps, done\n",
      "Run episode 1647 with rewards -396.6058876029089 with 109 steps, done\n",
      "Run episode 1648 with rewards -530.7804291570272 with 68 steps, done\n",
      "Run episode 1649 with rewards -775.0455817139411 with 103 steps, done\n",
      "Run episode 1650 with rewards -115.59407252636353 with 53 steps, done\n",
      "Run episode 1651 with rewards -825.4466243262007 with 112 steps, done\n",
      "Run episode 1652 with rewards -148.93895431905798 with 55 steps, done\n",
      "Run episode 1653 with rewards -692.4041283168661 with 120 steps, done\n",
      "Run episode 1654 with rewards -174.41632798636886 with 68 steps, done\n",
      "Run episode 1655 with rewards -849.247905355985 with 159 steps, done\n",
      "Run episode 1656 with rewards -162.08070598753656 with 57 steps, done\n",
      "Run episode 1657 with rewards -877.2732076542329 with 134 steps, done\n",
      "Run episode 1658 with rewards -134.3171324895713 with 73 steps, done\n",
      "Run episode 1659 with rewards -470.00775259998625 with 91 steps, done\n",
      "Run episode 1660 with rewards -121.1157852709002 with 88 steps, done\n",
      "Run episode 1661 with rewards -107.1498489480813 with 65 steps, done\n",
      "Run episode 1662 with rewards -570.0102034268414 with 92 steps, done\n",
      "Run episode 1663 with rewards -492.1601568230069 with 63 steps, done\n",
      "Run episode 1664 with rewards -569.0416892427841 with 79 steps, done\n",
      "Run episode 1665 with rewards -357.5450116745732 with 84 steps, done\n",
      "Run episode 1666 with rewards -1048.122120989649 with 138 steps, done\n",
      "Run episode 1667 with rewards -141.0400348305639 with 67 steps, done\n",
      "Run episode 1668 with rewards -536.0480670131651 with 91 steps, done\n",
      "Run episode 1669 with rewards -138.2521757864361 with 54 steps, done\n",
      "Run episode 1670 with rewards -510.71690403994353 with 110 steps, done\n",
      "Run episode 1671 with rewards -124.19764167598605 with 71 steps, done\n",
      "Run episode 1672 with rewards -510.09901107187113 with 103 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 1673 with rewards -119.6935194500227 with 53 steps, done\n",
      "Run episode 1674 with rewards -407.82154559986486 with 53 steps, done\n",
      "Run episode 1675 with rewards -213.74598101785384 with 82 steps, done\n",
      "Run episode 1676 with rewards -632.6302485844103 with 75 steps, done\n",
      "Run episode 1677 with rewards -352.7191005032653 with 64 steps, done\n",
      "Run episode 1678 with rewards -462.31605554224143 with 60 steps, done\n",
      "Run episode 1679 with rewards -216.43874359338616 with 72 steps, done\n",
      "Run episode 1680 with rewards -621.4933743554024 with 77 steps, done\n",
      "Run episode 1681 with rewards -490.08580530485096 with 81 steps, done\n",
      "Run episode 1682 with rewards -216.07593985822888 with 76 steps, done\n",
      "Run episode 1683 with rewards -477.2559217311229 with 249 steps, done\n",
      "Run episode 1684 with rewards -102.16626021948639 with 91 steps, done\n",
      "Run episode 1685 with rewards -814.2173002149053 with 87 steps, done\n",
      "Run episode 1686 with rewards -602.7395812996886 with 96 steps, done\n",
      "Run episode 1687 with rewards -1026.838037258758 with 88 steps, done\n",
      "Run episode 1688 with rewards -652.2671900739714 with 85 steps, done\n",
      "Run episode 1689 with rewards -600.3466076669004 with 72 steps, done\n",
      "Run episode 1690 with rewards -622.4027262722096 with 108 steps, done\n",
      "Run episode 1691 with rewards -383.1380094630991 with 56 steps, done\n",
      "Run episode 1692 with rewards -314.92756217533145 with 55 steps, done\n",
      "Run episode 1693 with rewards -466.80582054125813 with 59 steps, done\n",
      "Run episode 1694 with rewards -664.2733214700219 with 99 steps, done\n",
      "Run episode 1695 with rewards -470.90171167857636 with 73 steps, done\n",
      "Run episode 1696 with rewards -119.78693912348672 with 97 steps, done\n",
      "Run episode 1697 with rewards -427.5473919371655 with 95 steps, done\n",
      "Run episode 1698 with rewards -175.739181187409 with 74 steps, done\n",
      "Run episode 1699 with rewards -148.42464720775104 with 87 steps, done\n",
      "Run episode 1700 with rewards -387.08153393698996 with 53 steps, done\n",
      "Run episode 1701 with rewards -504.979660245952 with 69 steps, done\n",
      "Run episode 1702 with rewards -589.6020146447779 with 91 steps, done\n",
      "Run episode 1703 with rewards -525.9324263030528 with 58 steps, done\n",
      "Run episode 1704 with rewards -215.58155134634467 with 74 steps, done\n",
      "Run episode 1705 with rewards -535.0206013644079 with 59 steps, done\n",
      "Run episode 1706 with rewards -507.8581762791874 with 116 steps, done\n",
      "Run episode 1707 with rewards -695.7980818895289 with 75 steps, done\n",
      "Run episode 1708 with rewards -764.5575036644517 with 107 steps, done\n",
      "Run episode 1709 with rewards -717.6778725683375 with 75 steps, done\n",
      "Run episode 1710 with rewards -503.80239063203584 with 99 steps, done\n",
      "Run episode 1711 with rewards -782.3453412739606 with 76 steps, done\n",
      "Run episode 1712 with rewards -308.95456045672336 with 84 steps, done\n",
      "Run episode 1713 with rewards -428.32641752036017 with 59 steps, done\n",
      "Run episode 1714 with rewards -535.9599537909986 with 110 steps, done\n",
      "Run episode 1715 with rewards -493.6729430278698 with 55 steps, done\n",
      "Run episode 1716 with rewards -253.88978586688745 with 65 steps, done\n",
      "Run episode 1717 with rewards -319.92951424442003 with 66 steps, done\n",
      "Run episode 1718 with rewards -762.0547391844337 with 85 steps, done\n",
      "Run episode 1719 with rewards -291.20201996297556 with 79 steps, done\n",
      "Run episode 1720 with rewards -457.3403166329638 with 101 steps, done\n",
      "Run episode 1721 with rewards -514.254029895241 with 86 steps, done\n",
      "Run episode 1722 with rewards -127.04241358588354 with 86 steps, done\n",
      "Run episode 1723 with rewards -95.90644403760021 with 57 steps, done\n",
      "Run episode 1724 with rewards -531.5513061866685 with 58 steps, done\n",
      "Run episode 1725 with rewards -561.8355844791103 with 98 steps, done\n",
      "Run episode 1726 with rewards -489.58301797635994 with 53 steps, done\n",
      "Run episode 1727 with rewards -372.117095554508 with 73 steps, done\n",
      "Run episode 1728 with rewards -437.0054429529059 with 78 steps, done\n",
      "Run episode 1729 with rewards -377.5135518339768 with 90 steps, done\n",
      "Run episode 1730 with rewards -711.3021835440953 with 81 steps, done\n",
      "Run episode 1731 with rewards -381.70668922532633 with 83 steps, done\n",
      "Run episode 1732 with rewards -608.8410672027962 with 59 steps, done\n",
      "Run episode 1733 with rewards -138.48035042410177 with 56 steps, done\n",
      "Run episode 1734 with rewards -284.8567822762436 with 99 steps, done\n",
      "Run episode 1735 with rewards -287.7741832149514 with 100 steps, done\n",
      "Run episode 1736 with rewards -528.6274112192214 with 60 steps, done\n",
      "Run episode 1737 with rewards -519.822876567684 with 93 steps, done\n",
      "Run episode 1738 with rewards -1226.527483454626 with 165 steps, done\n",
      "Run episode 1739 with rewards -47.21766141828458 with 122 steps, done\n",
      "Run episode 1740 with rewards -468.17354397809675 with 83 steps, done\n",
      "Run episode 1741 with rewards -98.24221095374506 with 49 steps, done\n",
      "Run episode 1742 with rewards -359.2558738953834 with 55 steps, done\n",
      "Run episode 1743 with rewards -492.7933237814238 with 95 steps, done\n",
      "Run episode 1744 with rewards -475.98505277942184 with 73 steps, done\n",
      "Run episode 1745 with rewards -396.06092626673046 with 78 steps, done\n",
      "Run episode 1746 with rewards -811.1420794651369 with 87 steps, done\n",
      "Run episode 1747 with rewards -572.6190637802991 with 77 steps, done\n",
      "Run episode 1748 with rewards -519.436777792542 with 58 steps, done\n",
      "Run episode 1749 with rewards -249.35679919308168 with 80 steps, done\n",
      "Run episode 1750 with rewards -621.1264670267407 with 65 steps, done\n",
      "Run episode 1751 with rewards -389.5440606566614 with 128 steps, done\n",
      "Run episode 1752 with rewards -378.3372745281532 with 54 steps, done\n",
      "Run episode 1753 with rewards -550.9079373070413 with 85 steps, done\n",
      "Run episode 1754 with rewards -776.5762243977639 with 81 steps, done\n",
      "Run episode 1755 with rewards -677.0644026438637 with 114 steps, done\n",
      "Run episode 1756 with rewards -640.7325667370083 with 99 steps, done\n",
      "Run episode 1757 with rewards -469.7141756998928 with 64 steps, done\n",
      "Run episode 1758 with rewards -585.4294200324069 with 119 steps, done\n",
      "Run episode 1759 with rewards -368.77828550057666 with 109 steps, done\n",
      "Run episode 1760 with rewards -501.3928678997572 with 55 steps, done\n",
      "Run episode 1761 with rewards -650.2610774079762 with 109 steps, done\n",
      "Run episode 1762 with rewards -703.6690738616737 with 68 steps, done\n",
      "Run episode 1763 with rewards -644.1806311427837 with 114 steps, done\n",
      "Run episode 1764 with rewards -607.635439561433 with 67 steps, done\n",
      "Run episode 1765 with rewards -132.45887582142367 with 102 steps, done\n",
      "Run episode 1766 with rewards -119.97347732028237 with 65 steps, done\n",
      "Run episode 1767 with rewards -498.22701723122174 with 77 steps, done\n",
      "Run episode 1768 with rewards -786.3901696959135 with 79 steps, done\n",
      "Run episode 1769 with rewards -641.5526128102285 with 84 steps, done\n",
      "Run episode 1770 with rewards -776.8544451712348 with 77 steps, done\n",
      "Run episode 1771 with rewards -956.4143887695767 with 136 steps, done\n",
      "Run episode 1772 with rewards -150.08671078140569 with 75 steps, done\n",
      "Run episode 1773 with rewards -271.0535236694076 with 91 steps, done\n",
      "Run episode 1774 with rewards -160.91996815842487 with 80 steps, done\n",
      "Run episode 1775 with rewards -37.05052054999274 with 81 steps, done\n",
      "Run episode 1776 with rewards -157.4274158947488 with 81 steps, done\n",
      "Run episode 1777 with rewards -510.12416893634935 with 58 steps, done\n",
      "Run episode 1778 with rewards -0.6128395247240377 with 79 steps, done\n",
      "Run episode 1779 with rewards -453.07630307635054 with 73 steps, done\n",
      "Run episode 1780 with rewards -149.72918610953047 with 67 steps, done\n",
      "Run episode 1781 with rewards -765.7938970764922 with 84 steps, done\n",
      "Run episode 1782 with rewards -934.4817922877187 with 149 steps, done\n",
      "Run episode 1783 with rewards -529.6916931959776 with 65 steps, done\n",
      "Run episode 1784 with rewards -564.6390984998043 with 97 steps, done\n",
      "Run episode 1785 with rewards -827.599561801849 with 75 steps, done\n",
      "Run episode 1786 with rewards -882.6501882062443 with 132 steps, done\n",
      "Run episode 1787 with rewards -702.4155000487336 with 80 steps, done\n",
      "Run episode 1788 with rewards -643.8018223007282 with 114 steps, done\n",
      "Run episode 1789 with rewards -512.9564194321053 with 58 steps, done\n",
      "Run episode 1790 with rewards -2204.827439321145 with 241 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 1791 with rewards -515.541109748855 with 59 steps, done\n",
      "Run episode 1792 with rewards -491.85872557262394 with 86 steps, done\n",
      "Run episode 1793 with rewards -158.12562109133302 with 61 steps, done\n",
      "Run episode 1794 with rewards -1730.7833024970537 with 221 steps, done\n",
      "Run episode 1795 with rewards -121.38666270104088 with 75 steps, done\n",
      "Run episode 1796 with rewards -1337.6017112737088 with 188 steps, done\n",
      "Run episode 1797 with rewards -141.53042841858286 with 62 steps, done\n",
      "Run episode 1798 with rewards -477.84437179018505 with 118 steps, done\n",
      "Run episode 1799 with rewards -164.55113725807516 with 93 steps, done\n",
      "Run episode 1800 with rewards -519.1928400187396 with 60 steps, done\n",
      "Run episode 1801 with rewards -125.05934464748023 with 87 steps, done\n",
      "Run episode 1802 with rewards -163.7401326356889 with 70 steps, done\n",
      "Run episode 1803 with rewards -102.6319360349577 with 100 steps, done\n",
      "Run episode 1804 with rewards -432.9057828238203 with 122 steps, done\n",
      "Run episode 1805 with rewards -159.12481032247834 with 59 steps, done\n",
      "Run episode 1806 with rewards -890.7447537866227 with 86 steps, done\n",
      "Run episode 1807 with rewards -111.21883483195035 with 77 steps, done\n",
      "Run episode 1808 with rewards -523.9260075068917 with 67 steps, done\n",
      "Run episode 1809 with rewards -501.5435788526926 with 81 steps, done\n",
      "Run episode 1810 with rewards -495.8682105398614 with 62 steps, done\n",
      "Run episode 1811 with rewards -139.91063172884657 with 123 steps, done\n",
      "Run episode 1812 with rewards -455.5221867334126 with 155 steps, done\n",
      "Run episode 1813 with rewards -336.87136669864026 with 167 steps, done\n",
      "Run episode 1814 with rewards -560.5706252222224 with 61 steps, done\n",
      "Run episode 1815 with rewards -1869.1889667931664 with 251 steps, done\n",
      "Run episode 1816 with rewards -454.3539273336288 with 62 steps, done\n",
      "Run episode 1817 with rewards -499.2213597003582 with 106 steps, done\n",
      "Run episode 1818 with rewards -480.01514729652257 with 75 steps, done\n",
      "Run episode 1819 with rewards -273.5725531879841 with 105 steps, done\n",
      "Run episode 1820 with rewards -138.14658659476882 with 78 steps, done\n",
      "Run episode 1821 with rewards -597.3232064299123 with 67 steps, done\n",
      "Run episode 1822 with rewards -428.40632921307093 with 78 steps, done\n",
      "Run episode 1823 with rewards -444.9483690762076 with 83 steps, done\n",
      "Run episode 1824 with rewards -336.7596795826619 with 51 steps, done\n",
      "Run episode 1825 with rewards -745.7403914389047 with 108 steps, done\n",
      "Run episode 1826 with rewards -369.6068136538006 with 55 steps, done\n",
      "Run episode 1827 with rewards -603.9978332176161 with 78 steps, done\n",
      "Run episode 1828 with rewards -194.11691965473676 with 74 steps, done\n",
      "Run episode 1829 with rewards -1239.5937121643701 with 148 steps, done\n",
      "Run episode 1830 with rewards -227.34325902500947 with 53 steps, done\n",
      "Run episode 1831 with rewards -970.1182838464858 with 140 steps, done\n",
      "Run episode 1832 with rewards -357.96264269076414 with 86 steps, done\n",
      "Run episode 1833 with rewards -406.39062671651635 with 77 steps, done\n",
      "Run episode 1834 with rewards -118.18751537860972 with 59 steps, done\n",
      "Run episode 1835 with rewards -968.2941822600815 with 150 steps, done\n",
      "Run episode 1836 with rewards -218.7495271012793 with 76 steps, done\n",
      "Run episode 1837 with rewards -617.0326172062395 with 87 steps, done\n",
      "Run episode 1838 with rewards -158.78764394937787 with 61 steps, done\n",
      "Run episode 1839 with rewards -772.5361000559307 with 151 steps, done\n",
      "Run episode 1840 with rewards -130.37556629447317 with 60 steps, done\n",
      "Run episode 1841 with rewards -643.5020607019343 with 68 steps, done\n",
      "Run episode 1842 with rewards -731.7403369251792 with 114 steps, done\n",
      "Run episode 1843 with rewards -395.3142269094671 with 80 steps, done\n",
      "Run episode 1844 with rewards -634.0363683285005 with 123 steps, done\n",
      "Run episode 1845 with rewards -111.99599109542285 with 62 steps, done\n",
      "Run episode 1846 with rewards -106.06901504068566 with 78 steps, done\n",
      "Run episode 1847 with rewards -634.5998290605235 with 66 steps, done\n",
      "Run episode 1848 with rewards -342.54781275813895 with 82 steps, done\n",
      "Run episode 1849 with rewards -593.8332969788086 with 61 steps, done\n",
      "Run episode 1850 with rewards -603.020021367753 with 92 steps, done\n",
      "Run episode 1851 with rewards -716.6813823455549 with 81 steps, done\n",
      "Run episode 1852 with rewards -500.3029465627237 with 100 steps, done\n",
      "Run episode 1853 with rewards -506.08347738710046 with 61 steps, done\n",
      "Run episode 1854 with rewards -530.3658677147806 with 102 steps, done\n",
      "Run episode 1855 with rewards -817.0746320517271 with 89 steps, done\n",
      "Run episode 1856 with rewards -554.4216912925243 with 128 steps, done\n",
      "Run episode 1857 with rewards -359.9057928622837 with 127 steps, done\n",
      "Run episode 1858 with rewards -700.7099898173211 with 82 steps, done\n",
      "Run episode 1859 with rewards -972.2144926711227 with 137 steps, done\n",
      "Run episode 1860 with rewards -143.73425304632508 with 65 steps, done\n",
      "Run episode 1861 with rewards -635.6307330239229 with 111 steps, done\n",
      "Run episode 1862 with rewards -142.4987280892338 with 61 steps, done\n",
      "Run episode 1863 with rewards -525.0956535818491 with 86 steps, done\n",
      "Run episode 1864 with rewards -137.353211474565 with 87 steps, done\n",
      "Run episode 1865 with rewards -405.58459066746343 with 82 steps, done\n",
      "Run episode 1866 with rewards -500.82883421661745 with 74 steps, done\n",
      "Run episode 1867 with rewards -453.8974811329293 with 61 steps, done\n",
      "Run episode 1868 with rewards -556.9270566585171 with 83 steps, done\n",
      "Run episode 1869 with rewards -560.2500751113845 with 71 steps, done\n",
      "Run episode 1870 with rewards -390.1254120606418 with 109 steps, done\n",
      "Run episode 1871 with rewards -189.69553944520302 with 87 steps, done\n",
      "Run episode 1872 with rewards -104.24923952011092 with 62 steps, done\n",
      "Run episode 1873 with rewards -682.1775886785039 with 80 steps, done\n",
      "Run episode 1874 with rewards -381.02792486820385 with 76 steps, done\n",
      "Run episode 1875 with rewards -633.153488377442 with 67 steps, done\n",
      "Run episode 1876 with rewards -115.82190973104174 with 55 steps, done\n",
      "Run episode 1877 with rewards -2237.8199577741884 with 280 steps, done\n",
      "Run episode 1878 with rewards -334.50421590265006 with 101 steps, done\n",
      "Run episode 1879 with rewards -810.0564458466315 with 124 steps, done\n",
      "Run episode 1880 with rewards -224.72347235404447 with 73 steps, done\n",
      "Run episode 1881 with rewards -777.0730462555081 with 87 steps, done\n",
      "Run episode 1882 with rewards -161.9734594071782 with 60 steps, done\n",
      "Run episode 1883 with rewards -433.9133503899429 with 95 steps, done\n",
      "Run episode 1884 with rewards -110.67630756343465 with 56 steps, done\n",
      "Run episode 1885 with rewards -668.5737830937649 with 233 steps, done\n",
      "Run episode 1886 with rewards -495.105385536394 with 57 steps, done\n",
      "Run episode 1887 with rewards -481.7124766486238 with 55 steps, done\n",
      "Run episode 1888 with rewards -579.2951323483395 with 110 steps, done\n",
      "Run episode 1889 with rewards -524.5318092167979 with 57 steps, done\n",
      "Run episode 1890 with rewards -288.1260752737662 with 86 steps, done\n",
      "Run episode 1891 with rewards -405.0969154433392 with 81 steps, done\n",
      "Run episode 1892 with rewards -270.72398955062727 with 58 steps, done\n",
      "Run episode 1893 with rewards -404.06021110254943 with 58 steps, done\n",
      "Run episode 1894 with rewards -155.35882598360226 with 82 steps, done\n",
      "Run episode 1895 with rewards -474.17696449541154 with 74 steps, done\n",
      "Run episode 1896 with rewards -31.50488630301504 with 58 steps, done\n",
      "Run episode 1897 with rewards -178.5791894284515 with 75 steps, done\n",
      "Run episode 1898 with rewards -153.31918549629427 with 86 steps, done\n",
      "Run episode 1899 with rewards -616.4177333256057 with 101 steps, done\n",
      "Run episode 1900 with rewards -119.01834080273682 with 89 steps, done\n",
      "Run episode 1901 with rewards -678.4470602428972 with 124 steps, done\n",
      "Run episode 1902 with rewards -131.377514143087 with 72 steps, done\n",
      "Run episode 1903 with rewards -662.594192149944 with 88 steps, done\n",
      "Run episode 1904 with rewards -153.39472477337074 with 63 steps, done\n",
      "Run episode 1905 with rewards -699.6210609812767 with 119 steps, done\n",
      "Run episode 1906 with rewards -273.56299961251415 with 69 steps, done\n",
      "Run episode 1907 with rewards -672.0387611988458 with 80 steps, done\n",
      "Run episode 1908 with rewards -148.27206404715304 with 68 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 1909 with rewards -1292.4305079142507 with 209 steps, done\n",
      "Run episode 1910 with rewards -113.82087876431811 with 64 steps, done\n",
      "Run episode 1911 with rewards -275.92339321543824 with 115 steps, done\n",
      "Run episode 1912 with rewards -99.91427800192628 with 55 steps, done\n",
      "Run episode 1913 with rewards -1025.4924415475043 with 135 steps, done\n",
      "Run episode 1914 with rewards -124.72735249138333 with 58 steps, done\n",
      "Run episode 1915 with rewards -1728.4553557228921 with 211 steps, done\n",
      "Run episode 1916 with rewards -144.22731781019513 with 77 steps, done\n",
      "Run episode 1917 with rewards -667.8936495637857 with 133 steps, done\n",
      "Run episode 1918 with rewards -132.49719368213403 with 68 steps, done\n",
      "Run episode 1919 with rewards -673.3244556233343 with 124 steps, done\n",
      "Run episode 1920 with rewards -307.97733952433396 with 85 steps, done\n",
      "Run episode 1921 with rewards -940.2607636594828 with 127 steps, done\n",
      "Run episode 1922 with rewards -128.33776701014884 with 68 steps, done\n",
      "Run episode 1923 with rewards -624.1524459706376 with 79 steps, done\n",
      "Run episode 1924 with rewards -202.97587770807064 with 53 steps, done\n",
      "Run episode 1925 with rewards -514.5272954020138 with 103 steps, done\n",
      "Run episode 1926 with rewards -126.86613140450412 with 80 steps, done\n",
      "Run episode 1927 with rewards -489.06442789965155 with 58 steps, done\n",
      "Run episode 1928 with rewards -113.14080361775402 with 67 steps, done\n",
      "Run episode 1929 with rewards -95.3459919501203 with 82 steps, done\n",
      "Run episode 1930 with rewards -632.9123847538223 with 132 steps, done\n",
      "Run episode 1931 with rewards -168.90260875842716 with 74 steps, done\n",
      "Run episode 1932 with rewards -615.922212985571 with 79 steps, done\n",
      "Run episode 1933 with rewards -96.91748684424923 with 52 steps, done\n",
      "Run episode 1934 with rewards -1178.6405813770461 with 196 steps, done\n",
      "Run episode 1935 with rewards -207.8951464567176 with 64 steps, done\n",
      "Run episode 1936 with rewards -513.7797835305228 with 102 steps, done\n",
      "Run episode 1937 with rewards -443.89604979313606 with 80 steps, done\n",
      "Run episode 1938 with rewards -746.807052107223 with 125 steps, done\n",
      "Run episode 1939 with rewards -828.4463275046908 with 79 steps, done\n",
      "Run episode 1940 with rewards -382.7326414452288 with 82 steps, done\n",
      "Run episode 1941 with rewards -390.1363440958733 with 55 steps, done\n",
      "Run episode 1942 with rewards -637.7553990444912 with 111 steps, done\n",
      "Run episode 1943 with rewards -440.04893776453093 with 60 steps, done\n",
      "Run episode 1944 with rewards -383.79210503442846 with 83 steps, done\n",
      "Run episode 1945 with rewards -769.9854371943162 with 75 steps, done\n",
      "Run episode 1946 with rewards -617.649928765328 with 103 steps, done\n",
      "Run episode 1947 with rewards -473.8408943712343 with 77 steps, done\n",
      "Run episode 1948 with rewards -125.9223487588917 with 70 steps, done\n",
      "Run episode 1949 with rewards -760.4301787646008 with 77 steps, done\n",
      "Run episode 1950 with rewards -579.3804203054183 with 115 steps, done\n",
      "Run episode 1951 with rewards -702.5694596672594 with 73 steps, done\n",
      "Run episode 1952 with rewards -548.4039571992502 with 80 steps, done\n",
      "Run episode 1953 with rewards -483.2272636934789 with 55 steps, done\n",
      "Run episode 1954 with rewards -841.341666941022 with 157 steps, done\n",
      "Run episode 1955 with rewards -120.85372342566026 with 54 steps, done\n",
      "Run episode 1956 with rewards -811.0300214633124 with 130 steps, done\n",
      "Run episode 1957 with rewards -418.0358341867048 with 50 steps, done\n",
      "Run episode 1958 with rewards -356.2016327339325 with 72 steps, done\n",
      "Run episode 1959 with rewards -571.3627168927162 with 68 steps, done\n",
      "Run episode 1960 with rewards -519.0006752784675 with 85 steps, done\n",
      "Run episode 1961 with rewards -145.70310566837736 with 67 steps, done\n",
      "Run episode 1962 with rewards -856.1939426974612 with 88 steps, done\n",
      "Run episode 1963 with rewards -489.4886741921323 with 70 steps, done\n",
      "Run episode 1964 with rewards -376.04627303066883 with 69 steps, done\n",
      "Run episode 1965 with rewards -417.5063999072836 with 50 steps, done\n",
      "Run episode 1966 with rewards -529.9695920759007 with 118 steps, done\n",
      "Run episode 1967 with rewards -748.4476472777658 with 78 steps, done\n",
      "Run episode 1968 with rewards -544.0729425100335 with 108 steps, done\n",
      "Run episode 1969 with rewards -327.7384039434216 with 87 steps, done\n",
      "Run episode 1970 with rewards -126.05266697917035 with 58 steps, done\n",
      "Run episode 1971 with rewards -1733.8785198879466 with 201 steps, done\n",
      "Run episode 1972 with rewards -117.27405792871383 with 52 steps, done\n",
      "Run episode 1973 with rewards -280.86381072069787 with 103 steps, done\n",
      "Run episode 1974 with rewards -135.58765141099983 with 66 steps, done\n",
      "Run episode 1975 with rewards -243.78243358326338 with 122 steps, done\n",
      "Run episode 1976 with rewards -121.42495232288937 with 57 steps, done\n",
      "Run episode 1977 with rewards -320.8942305437039 with 85 steps, done\n",
      "Run episode 1978 with rewards -934.0304160464823 with 86 steps, done\n",
      "Run episode 1979 with rewards -98.24510355733169 with 61 steps, done\n",
      "Run episode 1980 with rewards -331.38135070016784 with 148 steps, done\n",
      "Run episode 1981 with rewards -199.12844242283558 with 75 steps, done\n",
      "Run episode 1982 with rewards -109.0933652555157 with 69 steps, done\n",
      "Run episode 1983 with rewards -115.73701600149667 with 63 steps, done\n",
      "Run episode 1984 with rewards -272.08312379340214 with 109 steps, done\n",
      "Run episode 1985 with rewards -159.30710072469282 with 77 steps, done\n",
      "Run episode 1986 with rewards -396.21782566021244 with 54 steps, done\n",
      "Run episode 1987 with rewards -343.2009749880497 with 78 steps, done\n",
      "Run episode 1988 with rewards -505.79898839810414 with 62 steps, done\n",
      "Run episode 1989 with rewards -397.05191655913865 with 98 steps, done\n",
      "Run episode 1990 with rewards -714.9715716800347 with 74 steps, done\n",
      "Run episode 1991 with rewards -154.22927706316682 with 78 steps, done\n",
      "Run episode 1992 with rewards -411.91957353883924 with 107 steps, done\n",
      "Run episode 1993 with rewards -145.5869277053195 with 66 steps, done\n",
      "Run episode 1994 with rewards -10.736583802361423 with 81 steps, done\n",
      "Run episode 1995 with rewards -114.56578027996594 with 81 steps, done\n",
      "Run episode 1996 with rewards -321.9327079957599 with 147 steps, done\n",
      "Run episode 1997 with rewards -148.86558827602977 with 57 steps, done\n",
      "Run episode 1998 with rewards -137.9731877265387 with 90 steps, done\n",
      "Run episode 1999 with rewards -127.47930758977262 with 75 steps, done\n",
      "Run episode 2000 with rewards -71.5241936698685 with 65 steps, done\n",
      "Run episode 2001 with rewards -320.84032357033516 with 96 steps, done\n",
      "Run episode 2002 with rewards -97.952880504718 with 87 steps, done\n",
      "Run episode 2003 with rewards -99.60740322053773 with 81 steps, done\n",
      "Run episode 2004 with rewards -411.1414077442262 with 179 steps, done\n",
      "Run episode 2005 with rewards -522.7272890980738 with 68 steps, done\n",
      "Run episode 2006 with rewards -429.8100103617863 with 51 steps, done\n",
      "Run episode 2007 with rewards -298.1725252381724 with 70 steps, done\n",
      "Run episode 2008 with rewards -566.9634420056927 with 60 steps, done\n",
      "Run episode 2009 with rewards -455.86005039188586 with 86 steps, done\n",
      "Run episode 2010 with rewards -605.6300919314388 with 65 steps, done\n",
      "Run episode 2011 with rewards -2731.8800320123296 with 308 steps, done\n",
      "Run episode 2012 with rewards -668.3051566714266 with 75 steps, done\n",
      "Run episode 2013 with rewards -573.7403146554474 with 78 steps, done\n",
      "Run episode 2014 with rewards -160.2603902467336 with 64 steps, done\n",
      "Run episode 2015 with rewards -1934.3835352524798 with 241 steps, done\n",
      "Run episode 2016 with rewards -228.27673112530394 with 85 steps, done\n",
      "Run episode 2017 with rewards -553.5130109108763 with 87 steps, done\n",
      "Run episode 2018 with rewards -117.5431694445047 with 55 steps, done\n",
      "Run episode 2019 with rewards -593.0286979107069 with 88 steps, done\n",
      "Run episode 2020 with rewards -140.39745503605985 with 61 steps, done\n",
      "Run episode 2021 with rewards -617.3159664057464 with 90 steps, done\n",
      "Run episode 2022 with rewards -235.92270342149885 with 71 steps, done\n",
      "Run episode 2023 with rewards -381.22428824251267 with 166 steps, done\n",
      "Run episode 2024 with rewards -346.55167474937764 with 83 steps, done\n",
      "Run episode 2025 with rewards -101.29930904467344 with 65 steps, done\n",
      "Run episode 2026 with rewards -607.7775293977704 with 80 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 2027 with rewards -143.48117136753916 with 84 steps, done\n",
      "Run episode 2028 with rewards -710.5872949882684 with 122 steps, done\n",
      "Run episode 2029 with rewards -149.1714247722769 with 51 steps, done\n",
      "Run episode 2030 with rewards -593.8045882141168 with 95 steps, done\n",
      "Run episode 2031 with rewards -134.75642407570643 with 61 steps, done\n",
      "Run episode 2032 with rewards -621.8256488164377 with 119 steps, done\n",
      "Run episode 2033 with rewards -119.76018234636835 with 55 steps, done\n",
      "Run episode 2034 with rewards -380.3207747768304 with 83 steps, done\n",
      "Run episode 2035 with rewards -44.02290905552738 with 80 steps, done\n",
      "Run episode 2036 with rewards -602.0151869743911 with 72 steps, done\n",
      "Run episode 2037 with rewards -110.5062802207579 with 90 steps, done\n",
      "Run episode 2038 with rewards -539.2053555472 with 68 steps, done\n",
      "Run episode 2039 with rewards -394.2050987068845 with 85 steps, done\n",
      "Run episode 2040 with rewards -600.6809428974592 with 64 steps, done\n",
      "Run episode 2041 with rewards -598.5755339920624 with 84 steps, done\n",
      "Run episode 2042 with rewards -737.6815372947369 with 80 steps, done\n",
      "Run episode 2043 with rewards -569.2665810944238 with 122 steps, done\n",
      "Run episode 2044 with rewards -670.8889420393764 with 91 steps, done\n",
      "Run episode 2045 with rewards -579.6531259334266 with 80 steps, done\n",
      "Run episode 2046 with rewards -538.405388075412 with 64 steps, done\n",
      "Run episode 2047 with rewards -214.24839190280855 with 89 steps, done\n",
      "Run episode 2048 with rewards -777.1292817011811 with 77 steps, done\n",
      "Run episode 2049 with rewards -201.3933045362674 with 89 steps, done\n",
      "Run episode 2050 with rewards -131.0158350614156 with 103 steps, done\n",
      "Run episode 2051 with rewards -518.6445414924244 with 65 steps, done\n",
      "Run episode 2052 with rewards -191.51656025862755 with 88 steps, done\n",
      "Run episode 2053 with rewards -523.9861384405322 with 118 steps, done\n",
      "Run episode 2054 with rewards -123.22741123524162 with 55 steps, done\n",
      "Run episode 2055 with rewards -1182.969949387485 with 128 steps, done\n",
      "Run episode 2056 with rewards -466.9591170435793 with 53 steps, done\n",
      "Run episode 2057 with rewards -129.80928318128667 with 79 steps, done\n",
      "Run episode 2058 with rewards -158.52076702196356 with 94 steps, done\n",
      "Run episode 2059 with rewards -577.1932445935427 with 78 steps, done\n",
      "Run episode 2060 with rewards -187.64001442582384 with 57 steps, done\n",
      "Run episode 2061 with rewards -105.85166129668468 with 90 steps, done\n",
      "Run episode 2062 with rewards -89.22037662912449 with 103 steps, done\n",
      "Run episode 2063 with rewards -92.42064138299129 with 58 steps, done\n",
      "Run episode 2064 with rewards -1068.7941479775563 with 122 steps, done\n",
      "Run episode 2065 with rewards -104.58677114562929 with 82 steps, done\n",
      "Run episode 2066 with rewards -1205.0550236328415 with 167 steps, done\n",
      "Run episode 2067 with rewards -112.40550117136685 with 85 steps, done\n",
      "Run episode 2068 with rewards -613.2216065065714 with 74 steps, done\n",
      "Run episode 2069 with rewards -99.38068396155293 with 84 steps, done\n",
      "Run episode 2070 with rewards -538.4544023896517 with 98 steps, done\n",
      "Run episode 2071 with rewards -155.68588598757935 with 73 steps, done\n",
      "Run episode 2072 with rewards -651.7362314509064 with 137 steps, done\n",
      "Run episode 2073 with rewards -150.32196574131117 with 79 steps, done\n",
      "Run episode 2074 with rewards -434.6723954168971 with 80 steps, done\n",
      "Run episode 2075 with rewards -625.8755154810436 with 65 steps, done\n",
      "Run episode 2076 with rewards -2460.0961633464426 with 284 steps, done\n",
      "Run episode 2077 with rewards -712.5275240826815 with 73 steps, done\n",
      "Run episode 2078 with rewards -500.9568433688199 with 112 steps, done\n",
      "Run episode 2079 with rewards -145.929568793442 with 59 steps, done\n",
      "Run episode 2080 with rewards -388.3307543569224 with 77 steps, done\n",
      "Run episode 2081 with rewards -118.28212965225116 with 71 steps, done\n",
      "Run episode 2082 with rewards -459.79693378323014 with 100 steps, done\n",
      "Run episode 2083 with rewards -164.42357080335202 with 78 steps, done\n",
      "Run episode 2084 with rewards -143.0599051588851 with 56 steps, done\n",
      "Run episode 2085 with rewards -700.1650757575732 with 80 steps, done\n",
      "Run episode 2086 with rewards -477.03898900514565 with 62 steps, done\n",
      "Run episode 2087 with rewards -565.183917396527 with 78 steps, done\n",
      "Run episode 2088 with rewards -741.8714144323568 with 79 steps, done\n",
      "Run episode 2089 with rewards -161.21898815559692 with 86 steps, done\n",
      "Run episode 2090 with rewards -799.2413829192607 with 79 steps, done\n",
      "Run episode 2091 with rewards -425.74365490319394 with 100 steps, done\n",
      "Run episode 2092 with rewards -415.61747719237434 with 72 steps, done\n",
      "Run episode 2093 with rewards -285.5424573337293 with 90 steps, done\n",
      "Run episode 2094 with rewards -329.1409682144067 with 54 steps, done\n",
      "Run episode 2095 with rewards -270.70619145320444 with 163 steps, done\n",
      "Run episode 2096 with rewards -414.26008203196005 with 111 steps, done\n",
      "Run episode 2097 with rewards -565.2704482438119 with 87 steps, done\n",
      "Run episode 2098 with rewards -368.6372493824922 with 55 steps, done\n",
      "Run episode 2099 with rewards -120.88367224063134 with 63 steps, done\n",
      "Run episode 2100 with rewards -56.649669927241334 with 72 steps, done\n",
      "Run episode 2101 with rewards -170.5585098386174 with 75 steps, done\n",
      "Run episode 2102 with rewards -759.6831615992807 with 74 steps, done\n",
      "Run episode 2103 with rewards -84.99393751803905 with 66 steps, done\n",
      "Run episode 2104 with rewards -489.14462540733007 with 69 steps, done\n",
      "Run episode 2105 with rewards -297.01329111790176 with 54 steps, done\n",
      "Run episode 2106 with rewards -495.4394463149351 with 63 steps, done\n",
      "Run episode 2107 with rewards -415.49740626574805 with 69 steps, done\n",
      "Run episode 2108 with rewards -607.3348490429644 with 106 steps, done\n",
      "Run episode 2109 with rewards -423.41723207075233 with 75 steps, done\n",
      "Run episode 2110 with rewards -469.04553959925477 with 90 steps, done\n",
      "Run episode 2111 with rewards -150.18707799726133 with 57 steps, done\n",
      "Run episode 2112 with rewards -103.92214990303475 with 76 steps, done\n",
      "Run episode 2113 with rewards -139.91447645378565 with 66 steps, done\n",
      "Run episode 2114 with rewards -274.9927532887293 with 82 steps, done\n",
      "Run episode 2115 with rewards -140.5895447006499 with 60 steps, done\n",
      "Run episode 2116 with rewards -516.2468766879491 with 61 steps, done\n",
      "Run episode 2117 with rewards -239.90983793406627 with 60 steps, done\n",
      "Run episode 2118 with rewards -774.6098275339185 with 114 steps, done\n",
      "Run episode 2119 with rewards -648.4442423291792 with 75 steps, done\n",
      "Run episode 2120 with rewards -1315.202437849309 with 165 steps, done\n",
      "Run episode 2121 with rewards -124.34731655306025 with 71 steps, done\n",
      "Run episode 2122 with rewards -613.9496527072246 with 87 steps, done\n",
      "Run episode 2123 with rewards -167.75067309965556 with 71 steps, done\n",
      "Run episode 2124 with rewards -1094.9647109191544 with 169 steps, done\n",
      "Run episode 2125 with rewards -121.9721522634147 with 80 steps, done\n",
      "Run episode 2126 with rewards -750.0498553135947 with 127 steps, done\n",
      "Run episode 2127 with rewards -278.04242256386505 with 84 steps, done\n",
      "Run episode 2128 with rewards -931.0566667948357 with 147 steps, done\n",
      "Run episode 2129 with rewards -277.94050020798556 with 86 steps, done\n",
      "Run episode 2130 with rewards -1782.1480632713653 with 218 steps, done\n",
      "Run episode 2131 with rewards -703.8776068001399 with 80 steps, done\n",
      "Run episode 2132 with rewards -3159.486150382077 with 316 steps, done\n",
      "Run episode 2133 with rewards -151.38046911531794 with 52 steps, done\n",
      "Run episode 2134 with rewards -618.1827223963711 with 80 steps, done\n",
      "Run episode 2135 with rewards -140.33961479139302 with 80 steps, done\n",
      "Run episode 2136 with rewards -2431.9704726441546 with 277 steps, done\n",
      "Run episode 2137 with rewards -119.72854985859573 with 57 steps, done\n",
      "Run episode 2138 with rewards -888.6349200131333 with 120 steps, done\n",
      "Run episode 2139 with rewards -160.4101165620488 with 85 steps, done\n",
      "Run episode 2140 with rewards -1060.1033127371054 with 138 steps, done\n",
      "Run episode 2141 with rewards -119.17348828204169 with 51 steps, done\n",
      "Run episode 2142 with rewards -520.1649833406443 with 113 steps, done\n",
      "Run episode 2143 with rewards -129.21541861703236 with 55 steps, done\n",
      "Run episode 2144 with rewards -530.166504667985 with 110 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 2145 with rewards -341.66069609367696 with 74 steps, done\n",
      "Run episode 2146 with rewards -463.089463704726 with 114 steps, done\n",
      "Run episode 2147 with rewards -124.57068680116146 with 56 steps, done\n",
      "Run episode 2148 with rewards -1024.430812576043 with 141 steps, done\n",
      "Run episode 2149 with rewards -132.70342053294272 with 88 steps, done\n",
      "Run episode 2150 with rewards -700.447289275071 with 135 steps, done\n",
      "Run episode 2151 with rewards -139.02383151164324 with 71 steps, done\n",
      "Run episode 2152 with rewards -904.6164346176442 with 124 steps, done\n",
      "Run episode 2153 with rewards -128.7425041466812 with 87 steps, done\n",
      "Run episode 2154 with rewards -617.717314924184 with 94 steps, done\n",
      "Run episode 2155 with rewards -142.78273299601574 with 60 steps, done\n",
      "Run episode 2156 with rewards -728.4836692851385 with 125 steps, done\n",
      "Run episode 2157 with rewards -193.74335671382215 with 56 steps, done\n",
      "Run episode 2158 with rewards -627.2952057048501 with 95 steps, done\n",
      "Run episode 2159 with rewards -121.53659459796488 with 83 steps, done\n",
      "Run episode 2160 with rewards -1638.6152572755243 with 203 steps, done\n",
      "Run episode 2161 with rewards -864.5988953257609 with 81 steps, done\n",
      "Run episode 2162 with rewards -503.428509957632 with 84 steps, done\n",
      "Run episode 2163 with rewards -49.12292491118007 with 69 steps, done\n",
      "Run episode 2164 with rewards -498.900338132748 with 96 steps, done\n",
      "Run episode 2165 with rewards -854.7283643207362 with 85 steps, done\n",
      "Run episode 2166 with rewards -113.79749721233041 with 71 steps, done\n",
      "Run episode 2167 with rewards -336.0067848952466 with 50 steps, done\n",
      "Run episode 2168 with rewards -594.3576178085682 with 86 steps, done\n",
      "Run episode 2169 with rewards -697.2807101015643 with 69 steps, done\n",
      "Run episode 2170 with rewards -5058.8197064694305 with 333 steps, done\n",
      "Run episode 2171 with rewards -148.78688047199597 with 64 steps, done\n",
      "Run episode 2172 with rewards -544.551377437595 with 102 steps, done\n",
      "Run episode 2173 with rewards -428.5112645187098 with 69 steps, done\n",
      "Run episode 2174 with rewards -173.85892357419903 with 72 steps, done\n",
      "Run episode 2175 with rewards -118.75146446078357 with 58 steps, done\n",
      "Run episode 2176 with rewards -158.71989534985033 with 59 steps, done\n",
      "Run episode 2177 with rewards -787.1752995306437 with 123 steps, done\n",
      "Run episode 2178 with rewards -116.69711217099012 with 90 steps, done\n",
      "Run episode 2179 with rewards -516.2422695034719 with 91 steps, done\n",
      "Run episode 2180 with rewards -111.5287540296918 with 89 steps, done\n",
      "Run episode 2181 with rewards -931.9001529725689 with 150 steps, done\n",
      "Run episode 2182 with rewards -106.22889900571917 with 62 steps, done\n",
      "Run episode 2183 with rewards -403.7453006149589 with 72 steps, done\n",
      "Run episode 2184 with rewards -517.744339989835 with 93 steps, done\n",
      "Run episode 2185 with rewards -443.0736003562148 with 94 steps, done\n",
      "Run episode 2186 with rewards -156.54787785204078 with 80 steps, done\n",
      "Run episode 2187 with rewards -224.0171764106674 with 92 steps, done\n",
      "Run episode 2188 with rewards -165.2689318453008 with 90 steps, done\n",
      "Run episode 2189 with rewards -109.37357572701828 with 154 steps, done\n",
      "Run episode 2190 with rewards -179.7881886667289 with 68 steps, done\n",
      "Run episode 2191 with rewards -644.2619887561149 with 78 steps, done\n",
      "Run episode 2192 with rewards -706.7619806266691 with 98 steps, done\n",
      "Run episode 2193 with rewards -445.8974783653581 with 73 steps, done\n",
      "Run episode 2194 with rewards -557.0057705201016 with 95 steps, done\n",
      "Run episode 2195 with rewards -486.52699087655515 with 79 steps, done\n",
      "Run episode 2196 with rewards -576.3277310235718 with 100 steps, done\n",
      "Run episode 2197 with rewards -459.30333123366694 with 57 steps, done\n",
      "Run episode 2198 with rewards -607.4691923265334 with 104 steps, done\n",
      "Run episode 2199 with rewards -498.2050793833899 with 142 steps, done\n",
      "Run episode 2200 with rewards -392.94634012766136 with 60 steps, done\n",
      "Run episode 2201 with rewards -143.89878136783594 with 85 steps, done\n",
      "Run episode 2202 with rewards -101.16799957686236 with 61 steps, done\n",
      "Run episode 2203 with rewards -763.0727508988283 with 76 steps, done\n",
      "Run episode 2204 with rewards -232.69357811969195 with 70 steps, done\n",
      "Run episode 2205 with rewards -712.7530049941807 with 146 steps, done\n",
      "Run episode 2206 with rewards -107.06415127229646 with 60 steps, done\n",
      "Run episode 2207 with rewards -499.29219143705245 with 76 steps, done\n",
      "Run episode 2208 with rewards -141.40567645685286 with 56 steps, done\n",
      "Run episode 2209 with rewards -111.55960194105697 with 77 steps, done\n",
      "Run episode 2210 with rewards -128.71892172085174 with 72 steps, done\n",
      "Run episode 2211 with rewards -210.2989952891667 with 112 steps, done\n",
      "Run episode 2212 with rewards -99.84442702252117 with 55 steps, done\n",
      "Run episode 2213 with rewards -296.0742446330489 with 91 steps, done\n",
      "Run episode 2214 with rewards -330.046045052078 with 86 steps, done\n",
      "Run episode 2215 with rewards -681.3905331438922 with 100 steps, done\n",
      "Run episode 2216 with rewards -265.86421224947844 with 75 steps, done\n",
      "Run episode 2217 with rewards -858.6316048544502 with 138 steps, done\n",
      "Run episode 2218 with rewards -125.27782572747225 with 50 steps, done\n",
      "Run episode 2219 with rewards -586.3048301778553 with 79 steps, done\n",
      "Run episode 2220 with rewards -145.62521961069297 with 62 steps, done\n",
      "Run episode 2221 with rewards -954.9878539841444 with 154 steps, done\n",
      "Run episode 2222 with rewards -397.60571509230454 with 72 steps, done\n",
      "Run episode 2223 with rewards -167.03545801661014 with 88 steps, done\n",
      "Run episode 2224 with rewards -199.50341661667534 with 76 steps, done\n",
      "Run episode 2225 with rewards -211.97735854537993 with 94 steps, done\n",
      "Run episode 2226 with rewards -396.74403231099825 with 99 steps, done\n",
      "Run episode 2227 with rewards -613.1952779992652 with 84 steps, done\n",
      "Run episode 2228 with rewards -145.75263476680132 with 62 steps, done\n",
      "Run episode 2229 with rewards -971.0793918849141 with 135 steps, done\n",
      "Run episode 2230 with rewards -118.33516009241819 with 66 steps, done\n",
      "Run episode 2231 with rewards -565.9427934223509 with 89 steps, done\n",
      "Run episode 2232 with rewards -118.60876986603982 with 73 steps, done\n",
      "Run episode 2233 with rewards -412.2117054883564 with 52 steps, done\n",
      "Run episode 2234 with rewards -161.3978188442893 with 89 steps, done\n",
      "Run episode 2235 with rewards -428.52466469708065 with 79 steps, done\n",
      "Run episode 2236 with rewards -147.39170208099256 with 75 steps, done\n",
      "Run episode 2237 with rewards -566.3305519722874 with 87 steps, done\n",
      "Run episode 2238 with rewards -187.3839020065841 with 70 steps, done\n",
      "Run episode 2239 with rewards -422.677634645828 with 75 steps, done\n",
      "Run episode 2240 with rewards -13.213333658440618 with 68 steps, done\n",
      "Run episode 2241 with rewards -163.50695308382942 with 59 steps, done\n",
      "Run episode 2242 with rewards -452.54400661751714 with 86 steps, done\n",
      "Run episode 2243 with rewards -132.77546819722852 with 65 steps, done\n",
      "Run episode 2244 with rewards -1187.2202234581644 with 143 steps, done\n",
      "Run episode 2245 with rewards -220.84378932776136 with 65 steps, done\n",
      "Run episode 2246 with rewards -527.5467955731908 with 73 steps, done\n",
      "Run episode 2247 with rewards 30.95753423960565 with 72 steps, done\n",
      "best\n",
      "Run episode 2248 with rewards -291.64893658328435 with 233 steps, done\n",
      "Run episode 2249 with rewards -121.3415423247641 with 70 steps, done\n",
      "Run episode 2250 with rewards -972.1686307181193 with 84 steps, done\n",
      "Run episode 2251 with rewards -621.0713960540122 with 64 steps, done\n",
      "Run episode 2252 with rewards -673.7096837036306 with 105 steps, done\n",
      "Run episode 2253 with rewards -444.2068567699164 with 82 steps, done\n",
      "Run episode 2254 with rewards -920.5378674701011 with 165 steps, done\n",
      "Run episode 2255 with rewards -452.81361063207123 with 98 steps, done\n",
      "Run episode 2256 with rewards -930.0177465079374 with 134 steps, done\n",
      "Run episode 2257 with rewards -189.19923000488035 with 55 steps, done\n",
      "Run episode 2258 with rewards -1203.8169136527351 with 170 steps, done\n",
      "Run episode 2259 with rewards -198.57091026431203 with 83 steps, done\n",
      "Run episode 2260 with rewards -636.2090432708248 with 130 steps, done\n",
      "Run episode 2261 with rewards -190.91948480179258 with 73 steps, done\n",
      "Run episode 2262 with rewards -1077.2187372268704 with 149 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 2263 with rewards -197.2032555640347 with 65 steps, done\n",
      "Run episode 2264 with rewards -711.7410660692763 with 98 steps, done\n",
      "Run episode 2265 with rewards -413.97912479219224 with 64 steps, done\n",
      "Run episode 2266 with rewards -544.5524447963957 with 64 steps, done\n",
      "Run episode 2267 with rewards -706.1356987280842 with 117 steps, done\n",
      "Run episode 2268 with rewards -125.53556431369185 with 56 steps, done\n",
      "Run episode 2269 with rewards -1468.3099201242596 with 194 steps, done\n",
      "Run episode 2270 with rewards -148.93861604613932 with 79 steps, done\n",
      "Run episode 2271 with rewards -483.19862347001515 with 83 steps, done\n",
      "Run episode 2272 with rewards -169.19823122270805 with 74 steps, done\n",
      "Run episode 2273 with rewards -957.0291290878455 with 150 steps, done\n",
      "Run episode 2274 with rewards -110.8516683724255 with 63 steps, done\n",
      "Run episode 2275 with rewards -2502.0381613957643 with 286 steps, done\n",
      "Run episode 2276 with rewards -342.91565474240986 with 100 steps, done\n",
      "Run episode 2277 with rewards -2078.0392028689057 with 237 steps, done\n",
      "Run episode 2278 with rewards -213.1412520269248 with 92 steps, done\n",
      "Run episode 2279 with rewards -453.1504819058729 with 98 steps, done\n",
      "Run episode 2280 with rewards -150.74617942208664 with 59 steps, done\n",
      "Run episode 2281 with rewards -870.5600950781429 with 214 steps, done\n",
      "Run episode 2282 with rewards -137.07761537156108 with 72 steps, done\n",
      "Run episode 2283 with rewards -195.8597641721271 with 93 steps, done\n",
      "Run episode 2284 with rewards -122.79820628046963 with 67 steps, done\n",
      "Run episode 2285 with rewards -499.74515571838197 with 57 steps, done\n",
      "Run episode 2286 with rewards -143.66907809266107 with 71 steps, done\n",
      "Run episode 2287 with rewards -496.6459619208273 with 69 steps, done\n",
      "Run episode 2288 with rewards -157.20185305490565 with 66 steps, done\n",
      "Run episode 2289 with rewards -483.03567666893866 with 61 steps, done\n",
      "Run episode 2290 with rewards -547.8402996695784 with 85 steps, done\n",
      "Run episode 2291 with rewards -540.191835183256 with 60 steps, done\n",
      "Run episode 2292 with rewards -337.73990854371436 with 89 steps, done\n",
      "Run episode 2293 with rewards -435.73667448177827 with 53 steps, done\n",
      "Run episode 2294 with rewards -296.0810949840337 with 95 steps, done\n",
      "Run episode 2295 with rewards -360.03955427616023 with 54 steps, done\n",
      "Run episode 2296 with rewards -422.80733739408174 with 79 steps, done\n",
      "Run episode 2297 with rewards -772.3523822226366 with 83 steps, done\n",
      "Run episode 2298 with rewards -875.1165966674334 with 81 steps, done\n",
      "Run episode 2299 with rewards -851.6647951446747 with 82 steps, done\n",
      "Run episode 2300 with rewards -592.3219479390866 with 95 steps, done\n",
      "Run episode 2301 with rewards -581.253910522487 with 60 steps, done\n",
      "Run episode 2302 with rewards -502.7291935309038 with 104 steps, done\n",
      "Run episode 2303 with rewards -488.993772721801 with 56 steps, done\n",
      "Run episode 2304 with rewards -122.05916176766726 with 89 steps, done\n",
      "Run episode 2305 with rewards -742.0534437374316 with 81 steps, done\n",
      "Run episode 2306 with rewards -141.90201126727206 with 76 steps, done\n",
      "Run episode 2307 with rewards -254.86740176075878 with 116 steps, done\n",
      "Run episode 2308 with rewards -161.0734382278146 with 67 steps, done\n",
      "Run episode 2309 with rewards -105.96524788969967 with 72 steps, done\n",
      "Run episode 2310 with rewards -182.83375460489938 with 101 steps, done\n",
      "Run episode 2311 with rewards -495.8080284272618 with 61 steps, done\n",
      "Run episode 2312 with rewards -577.0982224964405 with 102 steps, done\n",
      "Run episode 2313 with rewards -432.83621526762647 with 51 steps, done\n",
      "Run episode 2314 with rewards -674.4198370179479 with 105 steps, done\n",
      "Run episode 2315 with rewards -136.44642195256816 with 78 steps, done\n",
      "Run episode 2316 with rewards -527.3397741354645 with 63 steps, done\n",
      "Run episode 2317 with rewards -301.98999566186603 with 91 steps, done\n",
      "Run episode 2318 with rewards -158.01493758385192 with 61 steps, done\n",
      "Run episode 2319 with rewards -168.86635843690613 with 80 steps, done\n",
      "Run episode 2320 with rewards -513.9295259108394 with 110 steps, done\n",
      "Run episode 2321 with rewards -350.1669850976572 with 54 steps, done\n",
      "Run episode 2322 with rewards -243.02179244253705 with 67 steps, done\n",
      "Run episode 2323 with rewards -836.2508021306302 with 86 steps, done\n",
      "Run episode 2324 with rewards -640.1108072080506 with 76 steps, done\n",
      "Run episode 2325 with rewards -558.1737703215861 with 61 steps, done\n",
      "Run episode 2326 with rewards -324.9482039718969 with 83 steps, done\n",
      "Run episode 2327 with rewards -617.895211323317 with 118 steps, done\n",
      "Run episode 2328 with rewards -735.6661557788226 with 76 steps, done\n",
      "Run episode 2329 with rewards -359.59698019081657 with 105 steps, done\n",
      "Run episode 2330 with rewards -431.19018842955467 with 51 steps, done\n",
      "Run episode 2331 with rewards -505.0956166530002 with 65 steps, done\n",
      "Run episode 2332 with rewards -86.72328620745472 with 84 steps, done\n",
      "Run episode 2333 with rewards -918.0869369376328 with 187 steps, done\n",
      "Run episode 2334 with rewards -161.14090752217385 with 79 steps, done\n",
      "Run episode 2335 with rewards -86.76723305758479 with 65 steps, done\n",
      "Run episode 2336 with rewards -1657.7068962574735 with 231 steps, done\n",
      "Run episode 2337 with rewards -164.63701483589097 with 84 steps, done\n",
      "Run episode 2338 with rewards -109.31767326120436 with 89 steps, done\n",
      "Run episode 2339 with rewards -118.52309432622775 with 67 steps, done\n",
      "Run episode 2340 with rewards -119.77064975203476 with 59 steps, done\n",
      "Run episode 2341 with rewards -415.11253876852857 with 57 steps, done\n",
      "Run episode 2342 with rewards -404.6953384192242 with 55 steps, done\n",
      "Run episode 2343 with rewards -364.73768045452834 with 50 steps, done\n",
      "Run episode 2344 with rewards -135.37979841411644 with 118 steps, done\n",
      "Run episode 2345 with rewards -638.4486586961694 with 134 steps, done\n",
      "Run episode 2346 with rewards -263.187025728771 with 67 steps, done\n",
      "Run episode 2347 with rewards -857.8455969319131 with 84 steps, done\n",
      "Run episode 2348 with rewards -311.6963646270352 with 72 steps, done\n",
      "Run episode 2349 with rewards -373.6945378670053 with 54 steps, done\n",
      "Run episode 2350 with rewards -439.8860454386029 with 104 steps, done\n",
      "Run episode 2351 with rewards -491.0748442894866 with 81 steps, done\n",
      "Run episode 2352 with rewards -129.9736175642977 with 87 steps, done\n",
      "Run episode 2353 with rewards -500.4115111309937 with 61 steps, done\n",
      "Run episode 2354 with rewards -42.7501103195998 with 69 steps, done\n",
      "Run episode 2355 with rewards -864.2165691059209 with 116 steps, done\n",
      "Run episode 2356 with rewards -537.1400719672888 with 69 steps, done\n",
      "Run episode 2357 with rewards -569.466051014216 with 89 steps, done\n",
      "Run episode 2358 with rewards -139.8630333132717 with 84 steps, done\n",
      "Run episode 2359 with rewards -425.77945183000804 with 104 steps, done\n",
      "Run episode 2360 with rewards -292.6108728878363 with 101 steps, done\n",
      "Run episode 2361 with rewards -515.1896173437308 with 85 steps, done\n",
      "Run episode 2362 with rewards -157.4976634567389 with 63 steps, done\n",
      "Run episode 2363 with rewards -601.537184352653 with 79 steps, done\n",
      "Run episode 2364 with rewards -182.65299653266862 with 80 steps, done\n",
      "Run episode 2365 with rewards -584.6700760305245 with 74 steps, done\n",
      "Run episode 2366 with rewards -139.19820321659057 with 61 steps, done\n",
      "Run episode 2367 with rewards -969.2650868265334 with 132 steps, done\n",
      "Run episode 2368 with rewards -153.9094178466769 with 74 steps, done\n",
      "Run episode 2369 with rewards -766.0605647436776 with 128 steps, done\n",
      "Run episode 2370 with rewards -181.18670756171645 with 65 steps, done\n",
      "Run episode 2371 with rewards -739.2133093437924 with 99 steps, done\n",
      "Run episode 2372 with rewards -468.13329744730345 with 61 steps, done\n",
      "Run episode 2373 with rewards -615.2674177236498 with 106 steps, done\n",
      "Run episode 2374 with rewards -473.54287272081467 with 55 steps, done\n",
      "Run episode 2375 with rewards -147.39200031755522 with 82 steps, done\n",
      "Run episode 2376 with rewards -224.35635933007978 with 73 steps, done\n",
      "Run episode 2377 with rewards -20.095640109292674 with 82 steps, done\n",
      "Run episode 2378 with rewards -674.2462680118936 with 69 steps, done\n",
      "Run episode 2379 with rewards -530.8863750722068 with 119 steps, done\n",
      "Run episode 2380 with rewards -462.48974389540393 with 60 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 2381 with rewards -623.364671517616 with 72 steps, done\n",
      "Run episode 2382 with rewards -549.6952568063529 with 79 steps, done\n",
      "Run episode 2383 with rewards -731.7116181167828 with 76 steps, done\n",
      "Run episode 2384 with rewards -629.1793742480992 with 102 steps, done\n",
      "Run episode 2385 with rewards -1036.9426690038003 with 88 steps, done\n",
      "Run episode 2386 with rewards -296.2402321464068 with 66 steps, done\n",
      "Run episode 2387 with rewards -554.8675826431352 with 76 steps, done\n",
      "Run episode 2388 with rewards -505.047725028767 with 58 steps, done\n",
      "Run episode 2389 with rewards -198.42920574690032 with 110 steps, done\n",
      "Run episode 2390 with rewards -483.9991208946178 with 86 steps, done\n",
      "Run episode 2391 with rewards -714.981427351812 with 107 steps, done\n",
      "Run episode 2392 with rewards -149.44024165116542 with 75 steps, done\n",
      "Run episode 2393 with rewards -587.8426363760132 with 87 steps, done\n",
      "Run episode 2394 with rewards -175.0419181496386 with 65 steps, done\n",
      "Run episode 2395 with rewards -1833.0577330598608 with 214 steps, done\n",
      "Run episode 2396 with rewards -124.91304010938397 with 68 steps, done\n",
      "Run episode 2397 with rewards -1175.6739572154595 with 202 steps, done\n",
      "Run episode 2398 with rewards -143.78448708003458 with 68 steps, done\n",
      "Run episode 2399 with rewards -415.2308617396071 with 82 steps, done\n",
      "Run episode 2400 with rewards -114.95145578647686 with 54 steps, done\n",
      "Run episode 2401 with rewards -520.6842385187738 with 81 steps, done\n",
      "Run episode 2402 with rewards -118.76431559621187 with 84 steps, done\n",
      "Run episode 2403 with rewards -426.2500578634625 with 75 steps, done\n",
      "Run episode 2404 with rewards -525.6033629731484 with 67 steps, done\n",
      "Run episode 2405 with rewards -474.3519615423266 with 81 steps, done\n",
      "Run episode 2406 with rewards -477.8944086501362 with 62 steps, done\n",
      "Run episode 2407 with rewards -687.5707703075628 with 94 steps, done\n",
      "Run episode 2408 with rewards -213.15540979231298 with 61 steps, done\n",
      "Run episode 2409 with rewards -537.3817709944115 with 84 steps, done\n",
      "Run episode 2410 with rewards -495.6933681257206 with 56 steps, done\n",
      "Run episode 2411 with rewards -103.22226885129396 with 74 steps, done\n",
      "Run episode 2412 with rewards -532.9135223866235 with 89 steps, done\n",
      "Run episode 2413 with rewards -138.62400790046317 with 62 steps, done\n",
      "Run episode 2414 with rewards -1422.677609851304 with 184 steps, done\n",
      "Run episode 2415 with rewards -250.56941760197034 with 72 steps, done\n",
      "Run episode 2416 with rewards -808.4814537741427 with 123 steps, done\n",
      "Run episode 2417 with rewards -83.63426713129422 with 83 steps, done\n",
      "Run episode 2418 with rewards -498.49175126417254 with 78 steps, done\n",
      "Run episode 2419 with rewards -330.2946655114796 with 55 steps, done\n",
      "Run episode 2420 with rewards -675.7961384521377 with 78 steps, done\n",
      "Run episode 2421 with rewards -428.14381326694735 with 68 steps, done\n",
      "Run episode 2422 with rewards -498.988082603621 with 55 steps, done\n",
      "Run episode 2423 with rewards -275.5383433949144 with 67 steps, done\n",
      "Run episode 2424 with rewards -857.1304691084912 with 87 steps, done\n",
      "Run episode 2425 with rewards -341.25275183442426 with 94 steps, done\n",
      "Run episode 2426 with rewards -779.3917630246154 with 76 steps, done\n",
      "Run episode 2427 with rewards -532.5781743529596 with 81 steps, done\n",
      "Run episode 2428 with rewards -1075.4517850237557 with 89 steps, done\n",
      "Run episode 2429 with rewards -1107.6743500267066 with 182 steps, done\n",
      "Run episode 2430 with rewards -515.3935879686326 with 56 steps, done\n",
      "Run episode 2431 with rewards -826.6742045613531 with 122 steps, done\n",
      "Run episode 2432 with rewards -312.84634759473954 with 68 steps, done\n",
      "Run episode 2433 with rewards -502.1471113042377 with 86 steps, done\n",
      "Run episode 2434 with rewards -103.59426485404748 with 50 steps, done\n",
      "Run episode 2435 with rewards -741.2820726854058 with 92 steps, done\n",
      "Run episode 2436 with rewards -156.52181206527484 with 77 steps, done\n",
      "Run episode 2437 with rewards -607.0157404966242 with 83 steps, done\n",
      "Run episode 2438 with rewards -185.90290777756178 with 81 steps, done\n",
      "Run episode 2439 with rewards -562.5926451932975 with 77 steps, done\n",
      "Run episode 2440 with rewards -427.7856284733937 with 73 steps, done\n",
      "Run episode 2441 with rewards -516.0007848926036 with 84 steps, done\n",
      "Run episode 2442 with rewards -783.5737449929891 with 85 steps, done\n",
      "Run episode 2443 with rewards -631.4999172701274 with 95 steps, done\n",
      "Run episode 2444 with rewards -476.47164276651 with 55 steps, done\n",
      "Run episode 2445 with rewards -316.13905963407234 with 73 steps, done\n",
      "Run episode 2446 with rewards -442.5848318116408 with 59 steps, done\n",
      "Run episode 2447 with rewards -416.56819582623837 with 96 steps, done\n",
      "Run episode 2448 with rewards -568.3373782035519 with 63 steps, done\n",
      "Run episode 2449 with rewards -590.1807218400684 with 65 steps, done\n",
      "Run episode 2450 with rewards -162.39659551973517 with 75 steps, done\n",
      "Run episode 2451 with rewards -296.2961521222596 with 104 steps, done\n",
      "Run episode 2452 with rewards -190.80247716880692 with 63 steps, done\n",
      "Run episode 2453 with rewards -629.2562507335341 with 73 steps, done\n",
      "Run episode 2454 with rewards -233.2847442251151 with 85 steps, done\n",
      "Run episode 2455 with rewards -112.86991832665122 with 55 steps, done\n",
      "Run episode 2456 with rewards -472.2237526043431 with 57 steps, done\n",
      "Run episode 2457 with rewards -151.0191101857844 with 75 steps, done\n",
      "Run episode 2458 with rewards -590.5429006967331 with 62 steps, done\n",
      "Run episode 2459 with rewards -507.4351522803617 with 112 steps, done\n",
      "Run episode 2460 with rewards -755.6966952629466 with 73 steps, done\n",
      "Run episode 2461 with rewards -500.05753422278156 with 115 steps, done\n",
      "Run episode 2462 with rewards -539.9885750636365 with 73 steps, done\n",
      "Run episode 2463 with rewards -252.46995492929045 with 88 steps, done\n",
      "Run episode 2464 with rewards -698.9955616118048 with 79 steps, done\n",
      "Run episode 2465 with rewards -899.5404685256041 with 132 steps, done\n",
      "Run episode 2466 with rewards -106.32408297731585 with 91 steps, done\n",
      "Run episode 2467 with rewards -724.0686356292932 with 92 steps, done\n",
      "Run episode 2468 with rewards -179.24186906392634 with 82 steps, done\n",
      "Run episode 2469 with rewards -697.4321239766334 with 86 steps, done\n",
      "Run episode 2470 with rewards -126.96917460479145 with 52 steps, done\n",
      "Run episode 2471 with rewards -417.48788643725334 with 94 steps, done\n",
      "Run episode 2472 with rewards -539.5623771789581 with 83 steps, done\n",
      "Run episode 2473 with rewards -129.62812392285062 with 68 steps, done\n",
      "Run episode 2474 with rewards -128.27444666899677 with 76 steps, done\n",
      "Run episode 2475 with rewards -176.68441802471108 with 75 steps, done\n",
      "Run episode 2476 with rewards -45.55589891844267 with 91 steps, done\n",
      "Run episode 2477 with rewards -85.06923355811045 with 52 steps, done\n",
      "Run episode 2478 with rewards -126.78166274313126 with 108 steps, done\n",
      "Run episode 2479 with rewards -660.2715803819224 with 67 steps, done\n",
      "Run episode 2480 with rewards -517.1137242912655 with 111 steps, done\n",
      "Run episode 2481 with rewards -386.24782654677296 with 84 steps, done\n",
      "Run episode 2482 with rewards -124.47189243879569 with 71 steps, done\n",
      "Run episode 2483 with rewards -233.57822747533544 with 104 steps, done\n",
      "Run episode 2484 with rewards -130.2468359011882 with 88 steps, done\n",
      "Run episode 2485 with rewards -437.0499394022717 with 60 steps, done\n",
      "Run episode 2486 with rewards -82.02170266362131 with 59 steps, done\n",
      "Run episode 2487 with rewards -752.2283415956325 with 126 steps, done\n",
      "Run episode 2488 with rewards -116.59639754064193 with 86 steps, done\n",
      "Run episode 2489 with rewards -468.1444932536803 with 54 steps, done\n",
      "Run episode 2490 with rewards -557.8317435951296 with 105 steps, done\n",
      "Run episode 2491 with rewards -463.1574704946739 with 56 steps, done\n",
      "Run episode 2492 with rewards -120.74007664705181 with 61 steps, done\n",
      "Run episode 2493 with rewards -112.69582043152924 with 104 steps, done\n",
      "Run episode 2494 with rewards -206.92469215289898 with 81 steps, done\n",
      "Run episode 2495 with rewards -581.7866740697248 with 65 steps, done\n",
      "Run episode 2496 with rewards -33.03697239096513 with 71 steps, done\n",
      "Run episode 2497 with rewards -47.298204238476124 with 103 steps, done\n",
      "Run episode 2498 with rewards -140.02350600068377 with 67 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 2499 with rewards -183.89342786257464 with 99 steps, done\n",
      "Run episode 2500 with rewards -125.74703147494759 with 77 steps, done\n",
      "Run episode 2501 with rewards -167.89669668841307 with 67 steps, done\n",
      "Run episode 2502 with rewards -129.847052748411 with 71 steps, done\n",
      "Run episode 2503 with rewards -618.7348447765415 with 114 steps, done\n",
      "Run episode 2504 with rewards -144.7356055281722 with 75 steps, done\n",
      "Run episode 2505 with rewards -842.5192800552558 with 114 steps, done\n",
      "Run episode 2506 with rewards -212.04280191984793 with 82 steps, done\n",
      "Run episode 2507 with rewards -415.1098406875357 with 75 steps, done\n",
      "Run episode 2508 with rewards -150.11459020760464 with 66 steps, done\n",
      "Run episode 2509 with rewards -1307.1398620768805 with 176 steps, done\n",
      "Run episode 2510 with rewards -128.86406732568818 with 51 steps, done\n",
      "Run episode 2511 with rewards -1516.3839933227803 with 193 steps, done\n",
      "Run episode 2512 with rewards -161.82814879551455 with 79 steps, done\n",
      "Run episode 2513 with rewards -197.9550570831708 with 120 steps, done\n",
      "Run episode 2514 with rewards -130.75545935556949 with 62 steps, done\n",
      "Run episode 2515 with rewards -414.38479783215246 with 49 steps, done\n",
      "Run episode 2516 with rewards -527.0472048543854 with 75 steps, done\n",
      "Run episode 2517 with rewards -415.23909486331286 with 57 steps, done\n",
      "Run episode 2518 with rewards -336.2729734079629 with 64 steps, done\n",
      "Run episode 2519 with rewards -431.8292895298942 with 55 steps, done\n",
      "Run episode 2520 with rewards -257.1187373068386 with 78 steps, done\n",
      "Run episode 2521 with rewards -513.4216625049521 with 60 steps, done\n",
      "Run episode 2522 with rewards -415.22577652869484 with 70 steps, done\n",
      "Run episode 2523 with rewards -490.96411779682796 with 55 steps, done\n",
      "Run episode 2524 with rewards -375.10668341621624 with 53 steps, done\n",
      "Run episode 2525 with rewards -442.63553529942124 with 60 steps, done\n",
      "Run episode 2526 with rewards -239.9435461326139 with 85 steps, done\n",
      "Run episode 2527 with rewards -496.3835923598341 with 68 steps, done\n",
      "Run episode 2528 with rewards -119.77139152845155 with 73 steps, done\n",
      "Run episode 2529 with rewards -621.4883537652266 with 103 steps, done\n",
      "Run episode 2530 with rewards -187.58097922539454 with 76 steps, done\n",
      "Run episode 2531 with rewards -131.66019368057425 with 58 steps, done\n",
      "Run episode 2532 with rewards -194.80854300569683 with 130 steps, done\n",
      "Run episode 2533 with rewards -1183.6294385046328 with 217 steps, done\n",
      "Run episode 2534 with rewards -94.05084306904976 with 54 steps, done\n",
      "Run episode 2535 with rewards -88.87337722738525 with 129 steps, done\n",
      "Run episode 2536 with rewards -198.44201747279322 with 72 steps, done\n",
      "Run episode 2537 with rewards -301.28201679857847 with 114 steps, done\n",
      "Run episode 2538 with rewards -153.46864322489967 with 64 steps, done\n",
      "Run episode 2539 with rewards -272.0403681481939 with 98 steps, done\n",
      "Run episode 2540 with rewards -501.338704472804 with 114 steps, done\n",
      "Run episode 2541 with rewards -38.878825005330114 with 99 steps, done\n",
      "Run episode 2542 with rewards -504.14093124528716 with 75 steps, done\n",
      "Run episode 2543 with rewards -260.0807307910644 with 86 steps, done\n",
      "Run episode 2544 with rewards -732.1675799792449 with 110 steps, done\n",
      "Run episode 2545 with rewards -184.9448688288548 with 61 steps, done\n",
      "Run episode 2546 with rewards -571.5508263869459 with 83 steps, done\n",
      "Run episode 2547 with rewards -275.6155363486995 with 83 steps, done\n",
      "Run episode 2548 with rewards -1283.8370010350056 with 159 steps, done\n",
      "Run episode 2549 with rewards -159.0332249225393 with 78 steps, done\n",
      "Run episode 2550 with rewards -1235.5360485911801 with 169 steps, done\n",
      "Run episode 2551 with rewards -140.11592933556568 with 56 steps, done\n",
      "Run episode 2552 with rewards -1205.3176033757616 with 156 steps, done\n",
      "Run episode 2553 with rewards -140.95942028166053 with 73 steps, done\n",
      "Run episode 2554 with rewards -1497.033652301806 with 188 steps, done\n",
      "Run episode 2555 with rewards -347.28191757906154 with 57 steps, done\n",
      "Run episode 2556 with rewards -153.1742088895467 with 54 steps, done\n",
      "Run episode 2557 with rewards -190.35089353347223 with 97 steps, done\n",
      "Run episode 2558 with rewards -389.4340989848911 with 140 steps, done\n",
      "Run episode 2559 with rewards -454.0838087167997 with 74 steps, done\n",
      "Run episode 2560 with rewards -109.83671525482572 with 76 steps, done\n",
      "Run episode 2561 with rewards -360.2326371993039 with 84 steps, done\n",
      "Run episode 2562 with rewards -248.52809163204938 with 157 steps, done\n",
      "Run episode 2563 with rewards -586.5710632680111 with 99 steps, done\n",
      "Run episode 2564 with rewards -150.9264723231238 with 73 steps, done\n",
      "Run episode 2565 with rewards -237.10333024981378 with 92 steps, done\n",
      "Run episode 2566 with rewards -305.49013355078046 with 163 steps, done\n",
      "Run episode 2567 with rewards -123.79634809302186 with 86 steps, done\n",
      "Run episode 2568 with rewards -179.0538754822783 with 111 steps, done\n",
      "Run episode 2569 with rewards -110.3979511730303 with 163 steps, done\n",
      "Run episode 2570 with rewards -690.2895966945215 with 65 steps, done\n",
      "Run episode 2571 with rewards -1042.3163208626202 with 154 steps, done\n",
      "Run episode 2572 with rewards -168.04580286168073 with 68 steps, done\n",
      "Run episode 2573 with rewards -899.169060844416 with 146 steps, done\n",
      "Run episode 2574 with rewards -126.60744931629266 with 68 steps, done\n",
      "Run episode 2575 with rewards -621.8697926849375 with 142 steps, done\n",
      "Run episode 2576 with rewards -99.87349062931797 with 55 steps, done\n",
      "Run episode 2577 with rewards -558.2015336448999 with 90 steps, done\n",
      "Run episode 2578 with rewards -138.6816575639209 with 72 steps, done\n",
      "Run episode 2579 with rewards -565.9869775015136 with 124 steps, done\n",
      "Run episode 2580 with rewards -134.76824921470387 with 64 steps, done\n",
      "Run episode 2581 with rewards -395.1865592718484 with 56 steps, done\n",
      "Run episode 2582 with rewards -130.4151588765195 with 72 steps, done\n",
      "Run episode 2583 with rewards -827.2385390526339 with 83 steps, done\n",
      "Run episode 2584 with rewards -119.77912354718143 with 81 steps, done\n",
      "Run episode 2585 with rewards -410.0626091964646 with 57 steps, done\n",
      "Run episode 2586 with rewards -685.9955702042369 with 110 steps, done\n",
      "Run episode 2587 with rewards -514.431931614526 with 74 steps, done\n",
      "Run episode 2588 with rewards -305.9888419610786 with 75 steps, done\n",
      "Run episode 2589 with rewards -115.14417557620283 with 59 steps, done\n",
      "Run episode 2590 with rewards -445.24609965508756 with 56 steps, done\n",
      "Run episode 2591 with rewards -455.70171214991717 with 61 steps, done\n",
      "Run episode 2592 with rewards -587.854219748036 with 86 steps, done\n",
      "Run episode 2593 with rewards -775.2755860710432 with 83 steps, done\n",
      "Run episode 2594 with rewards -585.0602204796501 with 101 steps, done\n",
      "Run episode 2595 with rewards -452.13146503360815 with 61 steps, done\n",
      "Run episode 2596 with rewards -597.4078270433652 with 118 steps, done\n",
      "Run episode 2597 with rewards -646.9549187641746 with 77 steps, done\n",
      "Run episode 2598 with rewards -96.18145863654397 with 62 steps, done\n",
      "Run episode 2599 with rewards -745.4915704526975 with 82 steps, done\n",
      "Run episode 2600 with rewards -115.21999968847221 with 71 steps, done\n",
      "Run episode 2601 with rewards -597.1958870396875 with 64 steps, done\n",
      "Run episode 2602 with rewards -706.8922522556103 with 77 steps, done\n",
      "Run episode 2603 with rewards -528.7836799288577 with 81 steps, done\n",
      "Run episode 2604 with rewards -338.69810138610944 with 51 steps, done\n",
      "Run episode 2605 with rewards -108.75169471731766 with 59 steps, done\n",
      "Run episode 2606 with rewards -710.297325985307 with 106 steps, done\n",
      "Run episode 2607 with rewards -524.3597776602104 with 61 steps, done\n",
      "Run episode 2608 with rewards -496.71945997422904 with 70 steps, done\n",
      "Run episode 2609 with rewards -169.1320600749444 with 122 steps, done\n",
      "Run episode 2610 with rewards -497.54801700433956 with 66 steps, done\n",
      "Run episode 2611 with rewards -600.328773274626 with 75 steps, done\n",
      "Run episode 2612 with rewards -565.8983655245239 with 60 steps, done\n",
      "Run episode 2613 with rewards -583.7129465089427 with 121 steps, done\n",
      "Run episode 2614 with rewards -571.2885181890543 with 71 steps, done\n",
      "Run episode 2615 with rewards -389.4089265137732 with 111 steps, done\n",
      "Run episode 2616 with rewards -331.393991091913 with 85 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 2617 with rewards -597.9229511135165 with 66 steps, done\n",
      "Run episode 2618 with rewards -295.15364904563296 with 78 steps, done\n",
      "Run episode 2619 with rewards -732.6015200842887 with 75 steps, done\n",
      "Run episode 2620 with rewards -448.0487500742079 with 108 steps, done\n",
      "Run episode 2621 with rewards -548.0431873397619 with 65 steps, done\n",
      "Run episode 2622 with rewards -37.690299633548165 with 125 steps, done\n",
      "Run episode 2623 with rewards -199.98872708292942 with 53 steps, done\n",
      "Run episode 2624 with rewards -100.19268208709975 with 113 steps, done\n",
      "Run episode 2625 with rewards -461.52433268993514 with 67 steps, done\n",
      "Run episode 2626 with rewards -833.5157987079139 with 163 steps, done\n",
      "Run episode 2627 with rewards -750.9175337907677 with 75 steps, done\n",
      "Run episode 2628 with rewards -879.5562055401261 with 143 steps, done\n",
      "Run episode 2629 with rewards -328.25238113148373 with 73 steps, done\n",
      "Run episode 2630 with rewards -577.0580046305187 with 112 steps, done\n",
      "Run episode 2631 with rewards -86.96912006573065 with 54 steps, done\n",
      "Run episode 2632 with rewards -775.974838082011 with 123 steps, done\n",
      "Run episode 2633 with rewards -55.26965013802739 with 84 steps, done\n",
      "Run episode 2634 with rewards -274.998628164989 with 61 steps, done\n",
      "Run episode 2635 with rewards -680.8096516730276 with 79 steps, done\n",
      "Run episode 2636 with rewards -626.8201215222523 with 63 steps, done\n",
      "Run episode 2637 with rewards -99.60299218455725 with 131 steps, done\n",
      "Run episode 2638 with rewards -445.9395273193667 with 106 steps, done\n",
      "Run episode 2639 with rewards -864.804454091187 with 85 steps, done\n",
      "Run episode 2640 with rewards -430.562753276061 with 90 steps, done\n",
      "Run episode 2641 with rewards -138.5060095232927 with 59 steps, done\n",
      "Run episode 2642 with rewards -176.36606902145013 with 88 steps, done\n",
      "Run episode 2643 with rewards -484.2550991173422 with 82 steps, done\n",
      "Run episode 2644 with rewards -939.4124430748717 with 86 steps, done\n",
      "Run episode 2645 with rewards -601.2076849042252 with 90 steps, done\n",
      "Run episode 2646 with rewards -334.79293105551983 with 51 steps, done\n",
      "Run episode 2647 with rewards -322.8160694234704 with 112 steps, done\n",
      "Run episode 2648 with rewards -606.1621795078115 with 214 steps, done\n",
      "Run episode 2649 with rewards -378.1235111100095 with 64 steps, done\n",
      "Run episode 2650 with rewards -225.82263746552735 with 145 steps, done\n",
      "Run episode 2651 with rewards -220.3079327735636 with 96 steps, done\n",
      "Run episode 2652 with rewards -154.46939568921482 with 82 steps, done\n",
      "Run episode 2653 with rewards -64.54638519042243 with 73 steps, done\n",
      "Run episode 2654 with rewards -159.48134741272798 with 90 steps, done\n",
      "Run episode 2655 with rewards -681.0508543083301 with 74 steps, done\n",
      "Run episode 2656 with rewards -414.70933676925466 with 52 steps, done\n",
      "Run episode 2657 with rewards -399.1522264592652 with 82 steps, done\n",
      "Run episode 2658 with rewards -113.51954946295102 with 60 steps, done\n",
      "Run episode 2659 with rewards -687.3963082381837 with 104 steps, done\n",
      "Run episode 2660 with rewards -383.90167565675847 with 79 steps, done\n",
      "Run episode 2661 with rewards -519.4079385356254 with 78 steps, done\n",
      "Run episode 2662 with rewards -112.51808972658571 with 59 steps, done\n",
      "Run episode 2663 with rewards -515.7497621706968 with 78 steps, done\n",
      "Run episode 2664 with rewards -111.35335536994938 with 53 steps, done\n",
      "Run episode 2665 with rewards -480.1096180813461 with 74 steps, done\n",
      "Run episode 2666 with rewards -146.63202779836544 with 63 steps, done\n",
      "Run episode 2667 with rewards -546.5065410270983 with 79 steps, done\n",
      "Run episode 2668 with rewards -104.45652749125578 with 53 steps, done\n",
      "Run episode 2669 with rewards -476.24747151044073 with 84 steps, done\n",
      "Run episode 2670 with rewards -53.62086205559217 with 50 steps, done\n",
      "Run episode 2671 with rewards -625.4838328266266 with 99 steps, done\n",
      "Run episode 2672 with rewards -130.86107477940632 with 59 steps, done\n",
      "Run episode 2673 with rewards -651.7736620692943 with 97 steps, done\n",
      "Run episode 2674 with rewards -87.93144137801167 with 55 steps, done\n",
      "Run episode 2675 with rewards -617.2917631467087 with 91 steps, done\n",
      "Run episode 2676 with rewards -148.90683534113998 with 63 steps, done\n",
      "Run episode 2677 with rewards -953.0136117595694 with 136 steps, done\n",
      "Run episode 2678 with rewards -209.4737388793121 with 85 steps, done\n",
      "Run episode 2679 with rewards -769.0766555336107 with 126 steps, done\n",
      "Run episode 2680 with rewards -123.99143680573337 with 60 steps, done\n",
      "Run episode 2681 with rewards -1205.9851191554787 with 207 steps, done\n",
      "Run episode 2682 with rewards -154.72191475131547 with 55 steps, done\n",
      "Run episode 2683 with rewards -110.69932646129672 with 145 steps, done\n",
      "Run episode 2684 with rewards -378.8162850528338 with 65 steps, done\n",
      "Run episode 2685 with rewards -579.1956030270088 with 78 steps, done\n",
      "Run episode 2686 with rewards -349.2926375923386 with 50 steps, done\n",
      "Run episode 2687 with rewards -568.8658411120764 with 80 steps, done\n",
      "Run episode 2688 with rewards -158.15017392982122 with 63 steps, done\n",
      "Run episode 2689 with rewards -560.3071676945979 with 94 steps, done\n",
      "Run episode 2690 with rewards -190.744718987204 with 121 steps, done\n",
      "Run episode 2691 with rewards -97.06132422008213 with 84 steps, done\n",
      "Run episode 2692 with rewards -1966.907658455244 with 214 steps, done\n",
      "Run episode 2693 with rewards -353.2435098745816 with 52 steps, done\n",
      "Run episode 2694 with rewards -304.2658262955074 with 70 steps, done\n",
      "Run episode 2695 with rewards -500.27456375356024 with 75 steps, done\n",
      "Run episode 2696 with rewards -958.3460499806297 with 128 steps, done\n",
      "Run episode 2697 with rewards -177.44034241343525 with 70 steps, done\n",
      "Run episode 2698 with rewards -1212.2279091345667 with 161 steps, done\n",
      "Run episode 2699 with rewards -138.07148507984044 with 53 steps, done\n",
      "Run episode 2700 with rewards -1224.0832389217148 with 158 steps, done\n",
      "Run episode 2701 with rewards -116.78780153898859 with 78 steps, done\n",
      "Run episode 2702 with rewards -603.4285158217787 with 105 steps, done\n",
      "Run episode 2703 with rewards -584.0661646006404 with 65 steps, done\n",
      "Run episode 2704 with rewards -175.92347825140865 with 70 steps, done\n",
      "Run episode 2705 with rewards -126.9378866402414 with 71 steps, done\n",
      "Run episode 2706 with rewards -151.31687366680254 with 59 steps, done\n",
      "Run episode 2707 with rewards -390.55171131991506 with 55 steps, done\n",
      "Run episode 2708 with rewards -539.4385196567812 with 95 steps, done\n",
      "Run episode 2709 with rewards -658.5005985909269 with 81 steps, done\n",
      "Run episode 2710 with rewards -431.8290391757302 with 72 steps, done\n",
      "Run episode 2711 with rewards -480.5710779585616 with 58 steps, done\n",
      "Run episode 2712 with rewards -280.253147668299 with 96 steps, done\n",
      "Run episode 2713 with rewards -439.8538176583734 with 54 steps, done\n",
      "Run episode 2714 with rewards -464.6355624460014 with 95 steps, done\n",
      "Run episode 2715 with rewards -829.5966749688989 with 76 steps, done\n",
      "Run episode 2716 with rewards -561.2846924917735 with 117 steps, done\n",
      "Run episode 2717 with rewards -120.81175213650917 with 91 steps, done\n",
      "Run episode 2718 with rewards -1191.8411897651074 with 159 steps, done\n",
      "Run episode 2719 with rewards -124.11729008711202 with 83 steps, done\n",
      "Run episode 2720 with rewards -778.3592483360993 with 103 steps, done\n",
      "Run episode 2721 with rewards -144.119651416401 with 76 steps, done\n",
      "Run episode 2722 with rewards -1359.6742616014994 with 199 steps, done\n",
      "Run episode 2723 with rewards -137.10441231409771 with 76 steps, done\n",
      "Run episode 2724 with rewards -134.23101369489638 with 109 steps, done\n",
      "Run episode 2725 with rewards -660.8021010677447 with 67 steps, done\n",
      "Run episode 2726 with rewards -102.48978712535447 with 59 steps, done\n",
      "Run episode 2727 with rewards -90.9961558186483 with 60 steps, done\n",
      "Run episode 2728 with rewards -471.6187671316485 with 179 steps, done\n",
      "Run episode 2729 with rewards -498.82547874517763 with 56 steps, done\n",
      "Run episode 2730 with rewards -546.7484027472626 with 107 steps, done\n",
      "Run episode 2731 with rewards -399.7589239313929 with 51 steps, done\n",
      "Run episode 2732 with rewards -489.97237757451074 with 84 steps, done\n",
      "Run episode 2733 with rewards -352.2639596907888 with 55 steps, done\n",
      "Run episode 2734 with rewards -537.4966435298159 with 89 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 2735 with rewards -472.22048030344195 with 73 steps, done\n",
      "Run episode 2736 with rewards -513.5914184055316 with 82 steps, done\n",
      "Run episode 2737 with rewards -201.88813152266144 with 80 steps, done\n",
      "Run episode 2738 with rewards -536.0224732645934 with 78 steps, done\n",
      "Run episode 2739 with rewards -261.16592972684134 with 91 steps, done\n",
      "Run episode 2740 with rewards -1305.7026599203775 with 125 steps, done\n",
      "Run episode 2741 with rewards 15.099843118497574 with 83 steps, done\n",
      "Run episode 2742 with rewards -124.27919590016853 with 80 steps, done\n",
      "Run episode 2743 with rewards -560.5993950118368 with 74 steps, done\n",
      "Run episode 2744 with rewards -141.69128584596436 with 66 steps, done\n",
      "Run episode 2745 with rewards -98.7300100668571 with 72 steps, done\n",
      "Run episode 2746 with rewards -122.130922381543 with 83 steps, done\n",
      "Run episode 2747 with rewards -93.05076038218402 with 123 steps, done\n",
      "Run episode 2748 with rewards -198.8673731983564 with 79 steps, done\n",
      "Run episode 2749 with rewards -196.00131016370244 with 130 steps, done\n",
      "Run episode 2750 with rewards -205.4706022417944 with 73 steps, done\n",
      "Run episode 2751 with rewards -93.3407693787919 with 91 steps, done\n",
      "Run episode 2752 with rewards -114.4600527425919 with 74 steps, done\n",
      "Run episode 2753 with rewards -885.2366220308902 with 82 steps, done\n",
      "Run episode 2754 with rewards -478.8766936867353 with 80 steps, done\n",
      "Run episode 2755 with rewards -598.7262930582958 with 68 steps, done\n",
      "Run episode 2756 with rewards -523.3320197138994 with 86 steps, done\n",
      "Run episode 2757 with rewards -578.3580589319258 with 68 steps, done\n",
      "Run episode 2758 with rewards -267.35004181499767 with 95 steps, done\n",
      "Run episode 2759 with rewards -532.8374229405315 with 67 steps, done\n",
      "Run episode 2760 with rewards -343.6269544780958 with 80 steps, done\n",
      "Run episode 2761 with rewards -545.0022124950842 with 67 steps, done\n",
      "Run episode 2762 with rewards -624.5374784770418 with 86 steps, done\n",
      "Run episode 2763 with rewards -534.866035350835 with 66 steps, done\n",
      "Run episode 2764 with rewards -620.7774973850837 with 106 steps, done\n",
      "Run episode 2765 with rewards -371.31904508361686 with 91 steps, done\n",
      "Run episode 2766 with rewards -463.9234986562824 with 75 steps, done\n",
      "Run episode 2767 with rewards -597.0348323256317 with 65 steps, done\n",
      "Run episode 2768 with rewards -129.6823220092935 with 66 steps, done\n",
      "Run episode 2769 with rewards -599.629460178754 with 64 steps, done\n",
      "Run episode 2770 with rewards -244.15933615152488 with 66 steps, done\n",
      "Run episode 2771 with rewards -1079.9132283738882 with 89 steps, done\n",
      "Run episode 2772 with rewards -794.135263686871 with 83 steps, done\n",
      "Run episode 2773 with rewards -708.2412098519144 with 67 steps, done\n",
      "Run episode 2774 with rewards -767.1051694958613 with 84 steps, done\n",
      "Run episode 2775 with rewards -53.96666401208239 with 67 steps, done\n",
      "Run episode 2776 with rewards -409.3870828214105 with 129 steps, done\n",
      "Run episode 2777 with rewards -828.1580584481289 with 86 steps, done\n",
      "Run episode 2778 with rewards -313.9276214067956 with 166 steps, done\n",
      "Run episode 2779 with rewards -433.37351774808417 with 75 steps, done\n",
      "Run episode 2780 with rewards -231.84673462270024 with 82 steps, done\n",
      "Run episode 2781 with rewards -830.5054781589985 with 138 steps, done\n",
      "Run episode 2782 with rewards -465.74630294235084 with 57 steps, done\n",
      "Run episode 2783 with rewards -606.8826265098928 with 79 steps, done\n",
      "Run episode 2784 with rewards -130.3593204319203 with 58 steps, done\n",
      "Run episode 2785 with rewards -534.7069270788534 with 91 steps, done\n",
      "Run episode 2786 with rewards -112.45840891072247 with 54 steps, done\n",
      "Run episode 2787 with rewards -1555.6350540218773 with 193 steps, done\n",
      "Run episode 2788 with rewards -444.68403979464136 with 57 steps, done\n",
      "Run episode 2789 with rewards -508.54146292417977 with 71 steps, done\n",
      "Run episode 2790 with rewards -181.99373540206227 with 49 steps, done\n",
      "Run episode 2791 with rewards -631.195470547389 with 125 steps, done\n",
      "Run episode 2792 with rewards -405.67884915491226 with 80 steps, done\n",
      "Run episode 2793 with rewards -877.0169440105863 with 129 steps, done\n",
      "Run episode 2794 with rewards -71.5148869235157 with 67 steps, done\n",
      "Run episode 2795 with rewards -128.62152446922784 with 67 steps, done\n",
      "Run episode 2796 with rewards -538.7696441857545 with 71 steps, done\n",
      "Run episode 2797 with rewards -435.6429166074171 with 71 steps, done\n",
      "Run episode 2798 with rewards -168.36215901195672 with 73 steps, done\n",
      "Run episode 2799 with rewards -683.9346968665503 with 86 steps, done\n",
      "Run episode 2800 with rewards -139.92842403378 with 55 steps, done\n",
      "Run episode 2801 with rewards -847.6254304974801 with 147 steps, done\n",
      "Run episode 2802 with rewards -131.14999124110747 with 68 steps, done\n",
      "Run episode 2803 with rewards -804.6157591988909 with 128 steps, done\n",
      "Run episode 2804 with rewards -488.7221035394396 with 60 steps, done\n",
      "Run episode 2805 with rewards -224.77483529109406 with 61 steps, done\n",
      "Run episode 2806 with rewards -641.5329893422859 with 133 steps, done\n",
      "Run episode 2807 with rewards -46.866974635518716 with 90 steps, done\n",
      "Run episode 2808 with rewards -347.33072137398585 with 96 steps, done\n",
      "Run episode 2809 with rewards -139.3510871105237 with 67 steps, done\n",
      "Run episode 2810 with rewards -142.6160055011168 with 123 steps, done\n",
      "Run episode 2811 with rewards -107.92019888217949 with 62 steps, done\n",
      "Run episode 2812 with rewards -981.0520834014814 with 137 steps, done\n",
      "Run episode 2813 with rewards -154.187968089433 with 84 steps, done\n",
      "Run episode 2814 with rewards -637.132123375524 with 79 steps, done\n",
      "Run episode 2815 with rewards -136.27959073145615 with 53 steps, done\n",
      "Run episode 2816 with rewards -471.10251388783445 with 75 steps, done\n",
      "Run episode 2817 with rewards -124.2768570552997 with 75 steps, done\n",
      "Run episode 2818 with rewards -473.1233013007191 with 86 steps, done\n",
      "Run episode 2819 with rewards -359.2409590891764 with 92 steps, done\n",
      "Run episode 2820 with rewards -645.0424602727767 with 81 steps, done\n",
      "Run episode 2821 with rewards -248.11471229729344 with 72 steps, done\n",
      "Run episode 2822 with rewards -793.7899672273008 with 84 steps, done\n",
      "Run episode 2823 with rewards -742.9798066612238 with 128 steps, done\n",
      "Run episode 2824 with rewards -163.09313863238197 with 62 steps, done\n",
      "Run episode 2825 with rewards -609.1377189159331 with 84 steps, done\n",
      "Run episode 2826 with rewards -537.3157536723123 with 61 steps, done\n",
      "Run episode 2827 with rewards -732.4782880269182 with 130 steps, done\n",
      "Run episode 2828 with rewards -170.23106904334514 with 65 steps, done\n",
      "Run episode 2829 with rewards -447.095411493668 with 81 steps, done\n",
      "Run episode 2830 with rewards -79.44936505310899 with 73 steps, done\n",
      "Run episode 2831 with rewards -682.5683009223443 with 98 steps, done\n",
      "Run episode 2832 with rewards -215.98125042755905 with 80 steps, done\n",
      "Run episode 2833 with rewards -492.8709533217588 with 105 steps, done\n",
      "Run episode 2834 with rewards -162.32982276957657 with 75 steps, done\n",
      "Run episode 2835 with rewards -925.4112729452252 with 131 steps, done\n",
      "Run episode 2836 with rewards -151.21254880348403 with 84 steps, done\n",
      "Run episode 2837 with rewards -876.1759921773643 with 128 steps, done\n",
      "Run episode 2838 with rewards -214.0834558654169 with 68 steps, done\n",
      "Run episode 2839 with rewards -596.3720697052437 with 92 steps, done\n",
      "Run episode 2840 with rewards -156.73249024175055 with 65 steps, done\n",
      "Run episode 2841 with rewards -635.8702035891147 with 87 steps, done\n",
      "Run episode 2842 with rewards -100.55863650246746 with 86 steps, done\n",
      "Run episode 2843 with rewards -430.2945849929503 with 121 steps, done\n",
      "Run episode 2844 with rewards -156.2108722352225 with 79 steps, done\n",
      "Run episode 2845 with rewards -654.7211135163245 with 82 steps, done\n",
      "Run episode 2846 with rewards -192.1513159466362 with 57 steps, done\n",
      "Run episode 2847 with rewards -674.815474773905 with 103 steps, done\n",
      "Run episode 2848 with rewards -151.14985789383394 with 53 steps, done\n",
      "Run episode 2849 with rewards -690.4147681678617 with 97 steps, done\n",
      "Run episode 2850 with rewards -144.6399480617267 with 86 steps, done\n",
      "Run episode 2851 with rewards -931.6006340354223 with 132 steps, done\n",
      "Run episode 2852 with rewards -232.44239944881505 with 85 steps, done\n",
      "Run episode 2853 with rewards -399.9593873564645 with 86 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 2854 with rewards -151.54574477411882 with 84 steps, done\n",
      "Run episode 2855 with rewards -698.3370339928867 with 71 steps, done\n",
      "Run episode 2856 with rewards -731.8837523873945 with 113 steps, done\n",
      "Run episode 2857 with rewards -319.0383991374358 with 51 steps, done\n",
      "Run episode 2858 with rewards -268.0118113296321 with 65 steps, done\n",
      "Run episode 2859 with rewards -894.5168077988682 with 107 steps, done\n",
      "Run episode 2860 with rewards -904.9901980257982 with 81 steps, done\n",
      "Run episode 2861 with rewards -82.81500390351991 with 101 steps, done\n",
      "Run episode 2862 with rewards -1071.7547394829069 with 163 steps, done\n",
      "Run episode 2863 with rewards -167.93056707242647 with 66 steps, done\n",
      "Run episode 2864 with rewards -2916.022984090285 with 281 steps, done\n",
      "Run episode 2865 with rewards -193.64673762324264 with 62 steps, done\n",
      "Run episode 2866 with rewards -926.3870979761034 with 185 steps, done\n",
      "Run episode 2867 with rewards -516.3707332625622 with 69 steps, done\n",
      "Run episode 2868 with rewards -476.3493083921743 with 67 steps, done\n",
      "Run episode 2869 with rewards -757.9672888383668 with 80 steps, done\n",
      "Run episode 2870 with rewards -170.38854324032087 with 118 steps, done\n",
      "Run episode 2871 with rewards -673.0443164954708 with 68 steps, done\n",
      "Run episode 2872 with rewards -330.27171068016816 with 63 steps, done\n",
      "Run episode 2873 with rewards -88.8512902689409 with 153 steps, done\n",
      "Run episode 2874 with rewards -1097.8912659620646 with 234 steps, done\n",
      "Run episode 2875 with rewards -1055.8533568779321 with 87 steps, done\n",
      "Run episode 2876 with rewards -355.1413833591139 with 81 steps, done\n",
      "Run episode 2877 with rewards -712.2740392370649 with 77 steps, done\n",
      "Run episode 2878 with rewards -568.4495275530065 with 66 steps, done\n",
      "Run episode 2879 with rewards -173.98450273996053 with 104 steps, done\n",
      "Run episode 2880 with rewards -535.5122460302086 with 65 steps, done\n",
      "Run episode 2881 with rewards -346.97967089859947 with 108 steps, done\n",
      "Run episode 2882 with rewards -91.67710645044937 with 51 steps, done\n",
      "Run episode 2883 with rewards -408.6870907781595 with 49 steps, done\n",
      "Run episode 2884 with rewards -1258.368688991049 with 182 steps, done\n",
      "Run episode 2885 with rewards -453.1626182609286 with 54 steps, done\n",
      "Run episode 2886 with rewards -659.5677590612958 with 121 steps, done\n",
      "Run episode 2887 with rewards -152.46240137003818 with 81 steps, done\n",
      "Run episode 2888 with rewards -640.6338212559778 with 120 steps, done\n",
      "Run episode 2889 with rewards -149.67092562230033 with 53 steps, done\n",
      "Run episode 2890 with rewards -728.6424312967745 with 107 steps, done\n",
      "Run episode 2891 with rewards -228.67598346804184 with 79 steps, done\n",
      "Run episode 2892 with rewards -758.8969134895854 with 132 steps, done\n",
      "Run episode 2893 with rewards -208.15335653468637 with 67 steps, done\n",
      "Run episode 2894 with rewards -613.3653259365298 with 121 steps, done\n",
      "Run episode 2895 with rewards -211.82485887698476 with 63 steps, done\n",
      "Run episode 2896 with rewards -442.64140217126334 with 93 steps, done\n",
      "Run episode 2897 with rewards -776.8201566992112 with 73 steps, done\n",
      "Run episode 2898 with rewards -334.45217124876996 with 107 steps, done\n",
      "Run episode 2899 with rewards -560.7766505387847 with 67 steps, done\n",
      "Run episode 2900 with rewards -514.8661964967575 with 80 steps, done\n",
      "Run episode 2901 with rewards -607.4304996098019 with 66 steps, done\n",
      "Run episode 2902 with rewards -419.5265635406849 with 125 steps, done\n",
      "Run episode 2903 with rewards -518.1791992583062 with 72 steps, done\n",
      "Run episode 2904 with rewards -436.47990938691424 with 50 steps, done\n",
      "Run episode 2905 with rewards -838.3148306416477 with 78 steps, done\n",
      "Run episode 2906 with rewards -476.2896894621899 with 54 steps, done\n",
      "Run episode 2907 with rewards -786.4877876996169 with 83 steps, done\n",
      "Run episode 2908 with rewards -249.3882759590552 with 65 steps, done\n",
      "Run episode 2909 with rewards -483.9515418253736 with 58 steps, done\n",
      "Run episode 2910 with rewards -563.2054270069361 with 94 steps, done\n",
      "Run episode 2911 with rewards -477.2704716119173 with 71 steps, done\n",
      "Run episode 2912 with rewards -428.0671041253899 with 56 steps, done\n",
      "Run episode 2913 with rewards -438.2311114025189 with 67 steps, done\n",
      "Run episode 2914 with rewards -708.1420087570739 with 75 steps, done\n",
      "Run episode 2915 with rewards -666.4890653504456 with 92 steps, done\n",
      "Run episode 2916 with rewards -409.6547972451596 with 54 steps, done\n",
      "Run episode 2917 with rewards -433.7095093655293 with 112 steps, done\n",
      "Run episode 2918 with rewards -452.2379569811904 with 54 steps, done\n",
      "Run episode 2919 with rewards -411.4442369946983 with 86 steps, done\n",
      "Run episode 2920 with rewards -260.39196673839 with 63 steps, done\n",
      "Run episode 2921 with rewards -30.744716994038043 with 54 steps, done\n",
      "Run episode 2922 with rewards -220.115894071502 with 89 steps, done\n",
      "Run episode 2923 with rewards -581.4314622456925 with 69 steps, done\n",
      "Run episode 2924 with rewards -500.5368658053286 with 81 steps, done\n",
      "Run episode 2925 with rewards -522.3711840129974 with 65 steps, done\n",
      "Run episode 2926 with rewards -159.6301758904695 with 74 steps, done\n",
      "Run episode 2927 with rewards -449.95492910105384 with 78 steps, done\n",
      "Run episode 2928 with rewards -526.9533285943678 with 94 steps, done\n",
      "Run episode 2929 with rewards -540.3200357250885 with 68 steps, done\n",
      "Run episode 2930 with rewards -187.73710923146274 with 72 steps, done\n",
      "Run episode 2931 with rewards -432.7615554412627 with 51 steps, done\n",
      "Run episode 2932 with rewards -498.8709141891268 with 58 steps, done\n",
      "Run episode 2933 with rewards -454.5000049180619 with 75 steps, done\n",
      "Run episode 2934 with rewards -338.3905979572009 with 90 steps, done\n",
      "Run episode 2935 with rewards -673.1227359735286 with 75 steps, done\n",
      "Run episode 2936 with rewards -579.3415305991814 with 121 steps, done\n",
      "Run episode 2937 with rewards -171.9035403017693 with 65 steps, done\n",
      "Run episode 2938 with rewards -89.58823917817153 with 62 steps, done\n",
      "Run episode 2939 with rewards -646.0234571849695 with 197 steps, done\n",
      "Run episode 2940 with rewards -240.24720266298198 with 70 steps, done\n",
      "Run episode 2941 with rewards -487.4231261408122 with 63 steps, done\n",
      "Run episode 2942 with rewards -438.2293641706762 with 108 steps, done\n",
      "Run episode 2943 with rewards -362.9440406703609 with 59 steps, done\n",
      "Run episode 2944 with rewards -542.9616359565318 with 77 steps, done\n",
      "Run episode 2945 with rewards -615.2497191395804 with 94 steps, done\n",
      "Run episode 2946 with rewards -803.2830940445575 with 80 steps, done\n",
      "Run episode 2947 with rewards -384.7690726870126 with 72 steps, done\n",
      "Run episode 2948 with rewards -491.5528749609665 with 61 steps, done\n",
      "Run episode 2949 with rewards -479.34382508766777 with 92 steps, done\n",
      "Run episode 2950 with rewards -120.04080777415997 with 54 steps, done\n",
      "Run episode 2951 with rewards -298.4261133139735 with 85 steps, done\n",
      "Run episode 2952 with rewards -731.168561989475 with 123 steps, done\n",
      "Run episode 2953 with rewards -510.13253012314664 with 60 steps, done\n",
      "Run episode 2954 with rewards -580.5306671149467 with 105 steps, done\n",
      "Run episode 2955 with rewards -752.8653626968162 with 79 steps, done\n",
      "Run episode 2956 with rewards -334.6007308428119 with 72 steps, done\n",
      "Run episode 2957 with rewards -808.293248474644 with 78 steps, done\n",
      "Run episode 2958 with rewards -258.01048785023903 with 83 steps, done\n",
      "Run episode 2959 with rewards -399.3691366883217 with 50 steps, done\n",
      "Run episode 2960 with rewards -526.3459690108338 with 110 steps, done\n",
      "Run episode 2961 with rewards -96.55320680169285 with 56 steps, done\n",
      "Run episode 2962 with rewards -171.5772738769076 with 113 steps, done\n",
      "Run episode 2963 with rewards -591.1279033674296 with 75 steps, done\n",
      "Run episode 2964 with rewards -156.8085093051404 with 62 steps, done\n",
      "Run episode 2965 with rewards -116.75980211896982 with 109 steps, done\n",
      "Run episode 2966 with rewards -198.69097923150528 with 90 steps, done\n",
      "Run episode 2967 with rewards -316.72803696015444 with 55 steps, done\n",
      "Run episode 2968 with rewards -658.4627504328053 with 112 steps, done\n",
      "Run episode 2969 with rewards -274.5515835067438 with 101 steps, done\n",
      "Run episode 2970 with rewards -424.3311127651502 with 63 steps, done\n",
      "Run episode 2971 with rewards -665.1365470921329 with 109 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 2972 with rewards -831.5853369181506 with 79 steps, done\n",
      "Run episode 2973 with rewards -127.05910376008916 with 61 steps, done\n",
      "Run episode 2974 with rewards -297.32658512905004 with 65 steps, done\n",
      "Run episode 2975 with rewards -58.0625621334743 with 72 steps, done\n",
      "Run episode 2976 with rewards -321.1609157056117 with 106 steps, done\n",
      "Run episode 2977 with rewards -192.5444980012049 with 56 steps, done\n",
      "Run episode 2978 with rewards -702.1085473920144 with 120 steps, done\n",
      "Run episode 2979 with rewards -132.94596145142577 with 51 steps, done\n",
      "Run episode 2980 with rewards -679.8807766133325 with 119 steps, done\n",
      "Run episode 2981 with rewards -256.92030725096697 with 81 steps, done\n",
      "Run episode 2982 with rewards -545.3108050906474 with 77 steps, done\n",
      "Run episode 2983 with rewards -155.23074137353106 with 71 steps, done\n",
      "Run episode 2984 with rewards -393.65913329621446 with 96 steps, done\n",
      "Run episode 2985 with rewards -323.9746045101172 with 59 steps, done\n",
      "Run episode 2986 with rewards -315.2398853701984 with 95 steps, done\n",
      "Run episode 2987 with rewards -149.80397652789281 with 87 steps, done\n",
      "Run episode 2988 with rewards -304.5265692704605 with 180 steps, done\n",
      "Run episode 2989 with rewards -109.97157730945824 with 54 steps, done\n",
      "Run episode 2990 with rewards -747.3085014409916 with 131 steps, done\n",
      "Run episode 2991 with rewards -149.68387337494542 with 53 steps, done\n",
      "Run episode 2992 with rewards -703.3267213236245 with 108 steps, done\n",
      "Run episode 2993 with rewards -475.74556153152463 with 54 steps, done\n",
      "Run episode 2994 with rewards -540.9110365197237 with 69 steps, done\n",
      "Run episode 2995 with rewards -430.2002092379778 with 81 steps, done\n",
      "Run episode 2996 with rewards -352.78868834493096 with 73 steps, done\n",
      "Run episode 2997 with rewards -788.0623235379437 with 77 steps, done\n",
      "Run episode 2998 with rewards -332.6014103708633 with 56 steps, done\n",
      "Run episode 2999 with rewards -1552.6820465981757 with 183 steps, done\n",
      "Run episode 3000 with rewards -456.22649159540475 with 56 steps, done\n",
      "Run episode 3001 with rewards -582.9420617473372 with 72 steps, done\n",
      "Run episode 3002 with rewards -335.5316316378528 with 71 steps, done\n",
      "Run episode 3003 with rewards -1883.0823208983375 with 241 steps, done\n",
      "Run episode 3004 with rewards -156.16673752598854 with 74 steps, done\n",
      "Run episode 3005 with rewards -587.7289683537417 with 115 steps, done\n",
      "Run episode 3006 with rewards -205.13078961687404 with 84 steps, done\n",
      "Run episode 3007 with rewards -953.4221963312963 with 163 steps, done\n",
      "Run episode 3008 with rewards -486.23299176562506 with 62 steps, done\n",
      "Run episode 3009 with rewards -274.8593884923886 with 119 steps, done\n",
      "Run episode 3010 with rewards -434.2068373747911 with 69 steps, done\n",
      "Run episode 3011 with rewards -510.35623300365484 with 101 steps, done\n",
      "Run episode 3012 with rewards -163.60843561291614 with 71 steps, done\n",
      "Run episode 3013 with rewards -624.4563345054983 with 101 steps, done\n",
      "Run episode 3014 with rewards -87.37188849483047 with 54 steps, done\n",
      "Run episode 3015 with rewards -813.6762835857743 with 127 steps, done\n",
      "Run episode 3016 with rewards -39.70785760744475 with 71 steps, done\n",
      "Run episode 3017 with rewards -440.3944097801872 with 83 steps, done\n",
      "Run episode 3018 with rewards -105.65770822538956 with 53 steps, done\n",
      "Run episode 3019 with rewards -840.1542332315394 with 154 steps, done\n",
      "Run episode 3020 with rewards -435.9277343332924 with 79 steps, done\n",
      "Run episode 3021 with rewards -955.855694720877 with 144 steps, done\n",
      "Run episode 3022 with rewards -174.8806172639587 with 93 steps, done\n",
      "Run episode 3023 with rewards -791.3526773869825 with 144 steps, done\n",
      "Run episode 3024 with rewards -74.51578806832123 with 64 steps, done\n",
      "Run episode 3025 with rewards -260.5266029441348 with 106 steps, done\n",
      "Run episode 3026 with rewards -312.1063325845961 with 133 steps, done\n",
      "Run episode 3027 with rewards -698.5018434175134 with 73 steps, done\n",
      "Run episode 3028 with rewards -2.5378069915298482 with 61 steps, done\n",
      "Run episode 3029 with rewards -608.9926191935538 with 114 steps, done\n",
      "Run episode 3030 with rewards -249.7652120301939 with 58 steps, done\n",
      "Run episode 3031 with rewards -78.56758184180933 with 60 steps, done\n",
      "Run episode 3032 with rewards -635.0921863581594 with 67 steps, done\n",
      "Run episode 3033 with rewards -111.6792023884837 with 77 steps, done\n",
      "Run episode 3034 with rewards -1734.418047097894 with 207 steps, done\n",
      "Run episode 3035 with rewards -563.5692599074612 with 66 steps, done\n",
      "Run episode 3036 with rewards -539.0360800079227 with 82 steps, done\n",
      "Run episode 3037 with rewards -331.07897263198004 with 89 steps, done\n",
      "Run episode 3038 with rewards -508.884795201272 with 90 steps, done\n",
      "Run episode 3039 with rewards -111.59304148712235 with 52 steps, done\n",
      "Run episode 3040 with rewards -641.6715011789794 with 78 steps, done\n",
      "Run episode 3041 with rewards -120.7914366023835 with 65 steps, done\n",
      "Run episode 3042 with rewards -515.869845824849 with 89 steps, done\n",
      "Run episode 3043 with rewards -180.3384177177415 with 73 steps, done\n",
      "Run episode 3044 with rewards -335.8888092689031 with 104 steps, done\n",
      "Run episode 3045 with rewards -663.4810023346793 with 79 steps, done\n",
      "Run episode 3046 with rewards -419.93509249156494 with 64 steps, done\n",
      "Run episode 3047 with rewards -458.5180183647349 with 90 steps, done\n",
      "Run episode 3048 with rewards -150.60979312395511 with 67 steps, done\n",
      "Run episode 3049 with rewards -605.2342151878709 with 116 steps, done\n",
      "Run episode 3050 with rewards -154.23252863710903 with 80 steps, done\n",
      "Run episode 3051 with rewards -607.8559747614242 with 110 steps, done\n",
      "Run episode 3052 with rewards -136.82573601394864 with 64 steps, done\n",
      "Run episode 3053 with rewards -571.5764374313788 with 149 steps, done\n",
      "Run episode 3054 with rewards -141.94180469271342 with 57 steps, done\n",
      "Run episode 3055 with rewards -814.356171330196 with 115 steps, done\n",
      "Run episode 3056 with rewards -188.52975500518545 with 90 steps, done\n",
      "Run episode 3057 with rewards -583.5026840804371 with 78 steps, done\n",
      "Run episode 3058 with rewards -265.1076687391639 with 77 steps, done\n",
      "Run episode 3059 with rewards -848.6135753734159 with 153 steps, done\n",
      "Run episode 3060 with rewards -128.4085401016606 with 51 steps, done\n",
      "Run episode 3061 with rewards -598.3404667773725 with 81 steps, done\n",
      "Run episode 3062 with rewards -138.081417265796 with 67 steps, done\n",
      "Run episode 3063 with rewards -403.2988969682557 with 81 steps, done\n",
      "Run episode 3064 with rewards -117.66686258506489 with 61 steps, done\n",
      "Run episode 3065 with rewards -487.08192764324104 with 90 steps, done\n",
      "Run episode 3066 with rewards -172.12205901219764 with 82 steps, done\n",
      "Run episode 3067 with rewards -551.8766749777369 with 79 steps, done\n",
      "Run episode 3068 with rewards -448.775602769492 with 105 steps, done\n",
      "Run episode 3069 with rewards -771.7631713128447 with 111 steps, done\n",
      "Run episode 3070 with rewards -160.09131176110898 with 85 steps, done\n",
      "Run episode 3071 with rewards -425.49154488252475 with 85 steps, done\n",
      "Run episode 3072 with rewards -139.52683445197874 with 64 steps, done\n",
      "Run episode 3073 with rewards -899.6560246390636 with 148 steps, done\n",
      "Run episode 3074 with rewards -266.48898280439454 with 77 steps, done\n",
      "Run episode 3075 with rewards -897.4703188616071 with 86 steps, done\n",
      "Run episode 3076 with rewards -1520.7969583288964 with 201 steps, done\n",
      "Run episode 3077 with rewards -638.9161229268175 with 65 steps, done\n",
      "Run episode 3078 with rewards -187.3806156852525 with 93 steps, done\n",
      "Run episode 3079 with rewards -433.81043954869966 with 78 steps, done\n",
      "Run episode 3080 with rewards -576.0208905155242 with 155 steps, done\n",
      "Run episode 3081 with rewards -391.9522179807359 with 63 steps, done\n",
      "Run episode 3082 with rewards -803.6928210398519 with 81 steps, done\n",
      "Run episode 3083 with rewards -398.94443919423327 with 87 steps, done\n",
      "Run episode 3084 with rewards -467.4021456518701 with 54 steps, done\n",
      "Run episode 3085 with rewards -40.49492581554222 with 67 steps, done\n",
      "Run episode 3086 with rewards -567.1473348315451 with 60 steps, done\n",
      "Run episode 3087 with rewards -495.6812310389971 with 103 steps, done\n",
      "Run episode 3088 with rewards -505.2198118593458 with 62 steps, done\n",
      "Run episode 3089 with rewards -140.6519715808161 with 61 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 3090 with rewards -205.3206964988125 with 84 steps, done\n",
      "Run episode 3091 with rewards -111.24818143743684 with 65 steps, done\n",
      "Run episode 3092 with rewards -444.94884118445714 with 99 steps, done\n",
      "Run episode 3093 with rewards -23.086157531581392 with 88 steps, done\n",
      "Run episode 3094 with rewards -688.9626765966794 with 113 steps, done\n",
      "Run episode 3095 with rewards -153.88818722033642 with 62 steps, done\n",
      "Run episode 3096 with rewards -102.70318908996875 with 57 steps, done\n",
      "Run episode 3097 with rewards -792.4358482822697 with 114 steps, done\n",
      "Run episode 3098 with rewards -208.77202147746942 with 82 steps, done\n",
      "Run episode 3099 with rewards -63.14942228476718 with 67 steps, done\n",
      "Run episode 3100 with rewards -406.08191677243974 with 79 steps, done\n",
      "Run episode 3101 with rewards -539.016414024909 with 58 steps, done\n",
      "Run episode 3102 with rewards -487.45665362753465 with 60 steps, done\n",
      "Run episode 3103 with rewards -206.48318262174274 with 97 steps, done\n",
      "Run episode 3104 with rewards -767.5045831433324 with 82 steps, done\n",
      "Run episode 3105 with rewards -128.30401349795164 with 49 steps, done\n",
      "Run episode 3106 with rewards -223.0551673181925 with 117 steps, done\n",
      "Run episode 3107 with rewards -173.23473174981805 with 64 steps, done\n",
      "Run episode 3108 with rewards -356.847916787716 with 91 steps, done\n",
      "Run episode 3109 with rewards -102.41402928729593 with 57 steps, done\n",
      "Run episode 3110 with rewards -37.600591244743164 with 84 steps, done\n",
      "Run episode 3111 with rewards -122.77292637045507 with 62 steps, done\n",
      "Run episode 3112 with rewards -664.7117824903346 with 123 steps, done\n",
      "Run episode 3113 with rewards -170.67360249906574 with 73 steps, done\n",
      "Run episode 3114 with rewards -656.5957769517962 with 92 steps, done\n",
      "Run episode 3115 with rewards -129.69189545750464 with 61 steps, done\n",
      "Run episode 3116 with rewards -1326.0333042263676 with 192 steps, done\n",
      "Run episode 3117 with rewards -123.78967256978194 with 81 steps, done\n",
      "Run episode 3118 with rewards -411.32365717179283 with 74 steps, done\n",
      "Run episode 3119 with rewards -138.34351381388586 with 70 steps, done\n",
      "Run episode 3120 with rewards -653.2984513332659 with 83 steps, done\n",
      "Run episode 3121 with rewards -111.54524289409704 with 68 steps, done\n",
      "Run episode 3122 with rewards -1565.1024883733248 with 226 steps, done\n",
      "Run episode 3123 with rewards -128.9142982215663 with 76 steps, done\n",
      "Run episode 3124 with rewards -979.5468988285189 with 127 steps, done\n",
      "Run episode 3125 with rewards -134.5443147320188 with 54 steps, done\n",
      "Run episode 3126 with rewards -4555.2267614453685 with 377 steps, done\n",
      "Run episode 3127 with rewards -140.72522117111157 with 61 steps, done\n",
      "Run episode 3128 with rewards -506.36545623402634 with 79 steps, done\n",
      "Run episode 3129 with rewards -786.3920283719866 with 83 steps, done\n",
      "Run episode 3130 with rewards -138.44442375168458 with 57 steps, done\n",
      "Run episode 3131 with rewards -467.67152510212344 with 55 steps, done\n",
      "Run episode 3132 with rewards -318.91854864329787 with 80 steps, done\n",
      "Run episode 3133 with rewards -672.5890993431876 with 76 steps, done\n",
      "Run episode 3134 with rewards -542.1918158753983 with 92 steps, done\n",
      "Run episode 3135 with rewards -124.5582926676802 with 64 steps, done\n",
      "Run episode 3136 with rewards -448.5128892319626 with 52 steps, done\n",
      "Run episode 3137 with rewards -97.99206400042664 with 91 steps, done\n",
      "Run episode 3138 with rewards -277.2558384217281 with 120 steps, done\n",
      "Run episode 3139 with rewards -144.23577600411718 with 68 steps, done\n",
      "Run episode 3140 with rewards -36.039204590996434 with 106 steps, done\n",
      "Run episode 3141 with rewards -630.0822058739195 with 80 steps, done\n",
      "Run episode 3142 with rewards -510.81459658551677 with 63 steps, done\n",
      "Run episode 3143 with rewards -310.0989121435531 with 79 steps, done\n",
      "Run episode 3144 with rewards -225.20888620593956 with 83 steps, done\n",
      "Run episode 3145 with rewards -191.71620042188619 with 61 steps, done\n",
      "Run episode 3146 with rewards -456.0433383321961 with 55 steps, done\n",
      "Run episode 3147 with rewards -533.4343018838265 with 104 steps, done\n",
      "Run episode 3148 with rewards -121.22620750688391 with 52 steps, done\n",
      "Run episode 3149 with rewards -466.96658288983724 with 86 steps, done\n",
      "Run episode 3150 with rewards -25.849531505355188 with 70 steps, done\n",
      "Run episode 3151 with rewards -446.392525895415 with 51 steps, done\n",
      "Run episode 3152 with rewards -358.358824497538 with 51 steps, done\n",
      "Run episode 3153 with rewards -593.4763013050458 with 83 steps, done\n",
      "Run episode 3154 with rewards -436.6018393646515 with 58 steps, done\n",
      "Run episode 3155 with rewards -354.1972382107522 with 102 steps, done\n",
      "Run episode 3156 with rewards -509.80700536023915 with 58 steps, done\n",
      "Run episode 3157 with rewards -883.3725482846323 with 83 steps, done\n",
      "Run episode 3158 with rewards -739.3220955782497 with 79 steps, done\n",
      "Run episode 3159 with rewards -469.3429735779067 with 67 steps, done\n",
      "Run episode 3160 with rewards -460.3042061185383 with 54 steps, done\n",
      "Run episode 3161 with rewards -637.9979470267862 with 101 steps, done\n",
      "Run episode 3162 with rewards -459.0680331564026 with 61 steps, done\n",
      "Run episode 3163 with rewards -955.8012018918926 with 86 steps, done\n",
      "Run episode 3164 with rewards -374.16364814552514 with 63 steps, done\n",
      "Run episode 3165 with rewards -530.1599669777547 with 66 steps, done\n",
      "Run episode 3166 with rewards -568.1124711590851 with 92 steps, done\n",
      "Run episode 3167 with rewards -740.6520329522597 with 85 steps, done\n",
      "Run episode 3168 with rewards -2200.005411445822 with 263 steps, done\n",
      "Run episode 3169 with rewards -122.18873189884982 with 88 steps, done\n",
      "Run episode 3170 with rewards -2103.2123454770763 with 238 steps, done\n",
      "Run episode 3171 with rewards -159.30765958742012 with 68 steps, done\n",
      "Run episode 3172 with rewards -455.067074139971 with 89 steps, done\n",
      "Run episode 3173 with rewards -150.9599431446803 with 78 steps, done\n",
      "Run episode 3174 with rewards -574.4305758166554 with 78 steps, done\n",
      "Run episode 3175 with rewards -124.17611762723331 with 74 steps, done\n",
      "Run episode 3176 with rewards -675.1909802893384 with 103 steps, done\n",
      "Run episode 3177 with rewards -1042.5972733883973 with 86 steps, done\n",
      "Run episode 3178 with rewards -393.91146019417755 with 111 steps, done\n",
      "Run episode 3179 with rewards -435.8077387298428 with 53 steps, done\n",
      "Run episode 3180 with rewards -119.85418592794679 with 67 steps, done\n",
      "Run episode 3181 with rewards -477.67532201007486 with 62 steps, done\n",
      "Run episode 3182 with rewards -364.2720111708723 with 89 steps, done\n",
      "Run episode 3183 with rewards -165.5399695338645 with 81 steps, done\n",
      "Run episode 3184 with rewards -138.55310857107463 with 51 steps, done\n",
      "Run episode 3185 with rewards -427.8103250596857 with 58 steps, done\n",
      "Run episode 3186 with rewards -552.6727270533324 with 84 steps, done\n",
      "Run episode 3187 with rewards -828.9768103618716 with 86 steps, done\n",
      "Run episode 3188 with rewards -824.0490560897478 with 86 steps, done\n",
      "Run episode 3189 with rewards -418.3159433204157 with 103 steps, done\n",
      "Run episode 3190 with rewards -716.1625597068044 with 81 steps, done\n",
      "Run episode 3191 with rewards -99.52422389669668 with 92 steps, done\n",
      "Run episode 3192 with rewards -525.1788670427604 with 76 steps, done\n",
      "Run episode 3193 with rewards -294.56600104241215 with 50 steps, done\n",
      "Run episode 3194 with rewards -1090.1918698087752 with 156 steps, done\n",
      "Run episode 3195 with rewards -227.6467049317139 with 70 steps, done\n",
      "Run episode 3196 with rewards -584.304259631543 with 98 steps, done\n",
      "Run episode 3197 with rewards -202.37886608614926 with 82 steps, done\n",
      "Run episode 3198 with rewards -780.3174793222121 with 134 steps, done\n",
      "Run episode 3199 with rewards -205.2191135838218 with 88 steps, done\n",
      "Run episode 3200 with rewards -580.3855325699209 with 76 steps, done\n",
      "Run episode 3201 with rewards -145.42437301613455 with 65 steps, done\n",
      "Run episode 3202 with rewards -2052.0546387052955 with 267 steps, done\n",
      "Run episode 3203 with rewards -153.80945933124852 with 85 steps, done\n",
      "Run episode 3204 with rewards -769.2928934775204 with 77 steps, done\n",
      "Run episode 3205 with rewards -561.3896882524025 with 80 steps, done\n",
      "Run episode 3206 with rewards -501.92337500063155 with 61 steps, done\n",
      "Run episode 3207 with rewards -474.9809163711209 with 96 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 3208 with rewards -481.1893468536315 with 79 steps, done\n",
      "Run episode 3209 with rewards -165.01087969044863 with 64 steps, done\n",
      "Run episode 3210 with rewards -425.5654944954304 with 76 steps, done\n",
      "Run episode 3211 with rewards -1121.102505257266 with 91 steps, done\n",
      "Run episode 3212 with rewards -590.1423808527652 with 105 steps, done\n",
      "Run episode 3213 with rewards -552.5569909416129 with 71 steps, done\n",
      "Run episode 3214 with rewards -535.528403337087 with 92 steps, done\n",
      "Run episode 3215 with rewards -656.3136131071518 with 72 steps, done\n",
      "Run episode 3216 with rewards -541.7849607151345 with 77 steps, done\n",
      "Run episode 3217 with rewards -449.1078622662091 with 51 steps, done\n",
      "Run episode 3218 with rewards -243.9752075923874 with 84 steps, done\n",
      "Run episode 3219 with rewards -654.1254834208617 with 77 steps, done\n",
      "Run episode 3220 with rewards -397.23291848027407 with 56 steps, done\n",
      "Run episode 3221 with rewards -360.9229948377263 with 66 steps, done\n",
      "Run episode 3222 with rewards -531.1603259663486 with 58 steps, done\n",
      "Run episode 3223 with rewards -721.5830799097994 with 101 steps, done\n",
      "Run episode 3224 with rewards -645.4677954272917 with 73 steps, done\n",
      "Run episode 3225 with rewards -523.6803193641375 with 73 steps, done\n",
      "Run episode 3226 with rewards -332.8975922175448 with 88 steps, done\n",
      "Run episode 3227 with rewards -850.4516880523207 with 81 steps, done\n",
      "Run episode 3228 with rewards -136.3555803449529 with 54 steps, done\n",
      "Run episode 3229 with rewards -427.59770152377735 with 86 steps, done\n",
      "Run episode 3230 with rewards -152.3520157560835 with 78 steps, done\n",
      "Run episode 3231 with rewards -711.5118066615038 with 79 steps, done\n",
      "Run episode 3232 with rewards -487.93898226220546 with 76 steps, done\n",
      "Run episode 3233 with rewards -782.8756463655022 with 87 steps, done\n",
      "Run episode 3234 with rewards -313.59933877878063 with 71 steps, done\n",
      "Run episode 3235 with rewards -691.0966583279194 with 73 steps, done\n",
      "Run episode 3236 with rewards -503.4330381003975 with 80 steps, done\n",
      "Run episode 3237 with rewards -405.04529655320107 with 57 steps, done\n",
      "Run episode 3238 with rewards -729.5323130856146 with 95 steps, done\n",
      "Run episode 3239 with rewards -794.0615651952183 with 79 steps, done\n",
      "Run episode 3240 with rewards -1102.4794215851425 with 164 steps, done\n",
      "Run episode 3241 with rewards -643.4803168440151 with 67 steps, done\n",
      "Run episode 3242 with rewards -463.22273029568674 with 111 steps, done\n",
      "Run episode 3243 with rewards -130.14903434409678 with 62 steps, done\n",
      "Run episode 3244 with rewards -499.36689518349937 with 79 steps, done\n",
      "Run episode 3245 with rewards -138.2416505161109 with 59 steps, done\n",
      "Run episode 3246 with rewards -769.8731125469047 with 99 steps, done\n",
      "Run episode 3247 with rewards -384.5585786374966 with 52 steps, done\n",
      "Run episode 3248 with rewards -122.60493639087935 with 88 steps, done\n",
      "Run episode 3249 with rewards -395.40176107602895 with 86 steps, done\n",
      "Run episode 3250 with rewards -105.49915590418945 with 78 steps, done\n",
      "Run episode 3251 with rewards -115.02886952907093 with 69 steps, done\n",
      "Run episode 3252 with rewards -752.0024786911431 with 202 steps, done\n",
      "Run episode 3253 with rewards -167.7825535717264 with 78 steps, done\n",
      "Run episode 3254 with rewards -766.0314244220242 with 144 steps, done\n",
      "Run episode 3255 with rewards -637.5426888624579 with 67 steps, done\n",
      "Run episode 3256 with rewards -1327.8767108497348 with 180 steps, done\n",
      "Run episode 3257 with rewards -176.60791108724754 with 60 steps, done\n",
      "Run episode 3258 with rewards -751.967152857872 with 127 steps, done\n",
      "Run episode 3259 with rewards -325.6623574163657 with 79 steps, done\n",
      "Run episode 3260 with rewards -534.6350502742988 with 87 steps, done\n",
      "Run episode 3261 with rewards -114.95908541272735 with 72 steps, done\n",
      "Run episode 3262 with rewards -1042.3413993067356 with 139 steps, done\n",
      "Run episode 3263 with rewards -173.97859720525508 with 65 steps, done\n",
      "Run episode 3264 with rewards -459.9409875514904 with 94 steps, done\n",
      "Run episode 3265 with rewards -147.57080315826954 with 83 steps, done\n",
      "Run episode 3266 with rewards -1228.147590669999 with 155 steps, done\n",
      "Run episode 3267 with rewards -98.47474452217077 with 82 steps, done\n",
      "Run episode 3268 with rewards -1902.794917358155 with 252 steps, done\n",
      "Run episode 3269 with rewards -311.0928286208377 with 96 steps, done\n",
      "Run episode 3270 with rewards -454.3618768939171 with 63 steps, done\n",
      "Run episode 3271 with rewards -645.3597591863073 with 76 steps, done\n",
      "Run episode 3272 with rewards -208.0911269663334 with 117 steps, done\n",
      "Run episode 3273 with rewards -845.2679672638174 with 111 steps, done\n",
      "Run episode 3274 with rewards -759.697873643693 with 114 steps, done\n",
      "Run episode 3275 with rewards -425.92928401488007 with 118 steps, done\n",
      "Run episode 3276 with rewards -550.3190995795551 with 60 steps, done\n",
      "Run episode 3277 with rewards -447.17733141939595 with 74 steps, done\n",
      "Run episode 3278 with rewards -804.0801334016312 with 98 steps, done\n",
      "Run episode 3279 with rewards -244.1083273412586 with 67 steps, done\n",
      "Run episode 3280 with rewards -446.92106672509306 with 94 steps, done\n",
      "Run episode 3281 with rewards -103.84498632244231 with 64 steps, done\n",
      "Run episode 3282 with rewards -111.10471746668742 with 91 steps, done\n",
      "Run episode 3283 with rewards -343.08517497841433 with 74 steps, done\n",
      "Run episode 3284 with rewards -508.1709310510316 with 69 steps, done\n",
      "Run episode 3285 with rewards -911.5594838562852 with 104 steps, done\n",
      "Run episode 3286 with rewards -153.09812679923223 with 56 steps, done\n",
      "Run episode 3287 with rewards -559.9617697638678 with 112 steps, done\n",
      "Run episode 3288 with rewards -924.857631413594 with 85 steps, done\n",
      "Run episode 3289 with rewards -456.2131654388491 with 85 steps, done\n",
      "Run episode 3290 with rewards -608.7570528932981 with 62 steps, done\n",
      "Run episode 3291 with rewards -539.9067369398726 with 91 steps, done\n",
      "Run episode 3292 with rewards -519.2916983886513 with 68 steps, done\n",
      "Run episode 3293 with rewards -265.8840234951293 with 66 steps, done\n",
      "Run episode 3294 with rewards -755.7098545477318 with 74 steps, done\n",
      "Run episode 3295 with rewards -183.5196184192791 with 82 steps, done\n",
      "Run episode 3296 with rewards -409.0326393345374 with 55 steps, done\n",
      "Run episode 3297 with rewards -443.7903942267966 with 74 steps, done\n",
      "Run episode 3298 with rewards -816.974298528623 with 75 steps, done\n",
      "Run episode 3299 with rewards -771.4233563576831 with 134 steps, done\n",
      "Run episode 3300 with rewards -973.581191322321 with 87 steps, done\n",
      "Run episode 3301 with rewards -124.4887702201033 with 59 steps, done\n",
      "Run episode 3302 with rewards -182.12337022710938 with 155 steps, done\n",
      "Run episode 3303 with rewards -114.10168558050879 with 61 steps, done\n",
      "Run episode 3304 with rewards -398.51086879619385 with 103 steps, done\n",
      "Run episode 3305 with rewards -160.78105083527237 with 81 steps, done\n",
      "Run episode 3306 with rewards -463.9215952084063 with 78 steps, done\n",
      "Run episode 3307 with rewards -294.0487220457337 with 82 steps, done\n",
      "Run episode 3308 with rewards -91.10262966694606 with 87 steps, done\n",
      "Run episode 3309 with rewards -342.2385502482018 with 94 steps, done\n",
      "Run episode 3310 with rewards -122.13455140345403 with 71 steps, done\n",
      "Run episode 3311 with rewards -679.2443650910499 with 77 steps, done\n",
      "Run episode 3312 with rewards -95.38951438819964 with 70 steps, done\n",
      "Run episode 3313 with rewards -454.78312062155237 with 84 steps, done\n",
      "Run episode 3314 with rewards -560.3259792146954 with 84 steps, done\n",
      "Run episode 3315 with rewards -790.5112044453818 with 83 steps, done\n",
      "Run episode 3316 with rewards -488.9792106411928 with 55 steps, done\n",
      "Run episode 3317 with rewards -678.3128933455772 with 72 steps, done\n",
      "Run episode 3318 with rewards -853.7245311525623 with 86 steps, done\n",
      "Run episode 3319 with rewards -462.3147701754748 with 85 steps, done\n",
      "Run episode 3320 with rewards -463.9991266838254 with 60 steps, done\n",
      "Run episode 3321 with rewards -141.78556316391982 with 100 steps, done\n",
      "Run episode 3322 with rewards -161.28500167104824 with 56 steps, done\n",
      "Run episode 3323 with rewards -448.85979705461097 with 57 steps, done\n",
      "Run episode 3324 with rewards -487.66274440946086 with 98 steps, done\n",
      "Run episode 3325 with rewards -1006.5583834369666 with 104 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 3326 with rewards -302.9948929127959 with 50 steps, done\n",
      "Run episode 3327 with rewards -450.07845044316576 with 58 steps, done\n",
      "Run episode 3328 with rewards -339.8342152957591 with 80 steps, done\n",
      "Run episode 3329 with rewards -315.67054497118824 with 52 steps, done\n",
      "Run episode 3330 with rewards -359.91813341323564 with 74 steps, done\n",
      "Run episode 3331 with rewards -141.30718855313427 with 53 steps, done\n",
      "Run episode 3332 with rewards -386.87788243886826 with 82 steps, done\n",
      "Run episode 3333 with rewards -253.70091523914013 with 119 steps, done\n",
      "Run episode 3334 with rewards -700.5806712927242 with 77 steps, done\n",
      "Run episode 3335 with rewards -582.3717019300377 with 78 steps, done\n",
      "Run episode 3336 with rewards -504.6550827322162 with 66 steps, done\n",
      "Run episode 3337 with rewards -590.3750630669256 with 99 steps, done\n",
      "Run episode 3338 with rewards -306.0198845728102 with 63 steps, done\n",
      "Run episode 3339 with rewards -164.443051646328 with 62 steps, done\n",
      "Run episode 3340 with rewards -137.83941532201345 with 144 steps, done\n",
      "Run episode 3341 with rewards -147.11034126889064 with 58 steps, done\n",
      "Run episode 3342 with rewards -162.53749166853248 with 114 steps, done\n",
      "Run episode 3343 with rewards -361.5385824918068 with 75 steps, done\n",
      "Run episode 3344 with rewards -537.0922995582325 with 58 steps, done\n",
      "Run episode 3345 with rewards -177.933198421273 with 81 steps, done\n",
      "Run episode 3346 with rewards -630.787572738568 with 65 steps, done\n",
      "Run episode 3347 with rewards -214.50920056396438 with 81 steps, done\n",
      "Run episode 3348 with rewards -445.3512291762949 with 57 steps, done\n",
      "Run episode 3349 with rewards -513.25631703458 with 84 steps, done\n",
      "Run episode 3350 with rewards -471.2632073790684 with 72 steps, done\n",
      "Run episode 3351 with rewards -331.5016682054489 with 99 steps, done\n",
      "Run episode 3352 with rewards -848.7478635537309 with 82 steps, done\n",
      "Run episode 3353 with rewards -490.2178372044428 with 80 steps, done\n",
      "Run episode 3354 with rewards -374.2652120827643 with 97 steps, done\n",
      "Run episode 3355 with rewards -403.6426901770887 with 58 steps, done\n",
      "Run episode 3356 with rewards -473.03917348789224 with 57 steps, done\n",
      "Run episode 3357 with rewards -405.65335854477746 with 75 steps, done\n",
      "Run episode 3358 with rewards -405.50445104579217 with 52 steps, done\n",
      "Run episode 3359 with rewards -731.3026599964243 with 127 steps, done\n",
      "Run episode 3360 with rewards -508.60246601690574 with 56 steps, done\n",
      "Run episode 3361 with rewards -510.5418858128593 with 91 steps, done\n",
      "Run episode 3362 with rewards -990.5151269054719 with 85 steps, done\n",
      "Run episode 3363 with rewards -249.04370229287412 with 67 steps, done\n",
      "Run episode 3364 with rewards -573.1337047716845 with 65 steps, done\n",
      "Run episode 3365 with rewards -591.1856357175401 with 83 steps, done\n",
      "Run episode 3366 with rewards -1026.317132188236 with 86 steps, done\n",
      "Run episode 3367 with rewards -121.33698112767667 with 52 steps, done\n",
      "Run episode 3368 with rewards -927.606046383427 with 85 steps, done\n",
      "Run episode 3369 with rewards -604.6141284538334 with 94 steps, done\n",
      "Run episode 3370 with rewards -558.8832922529554 with 61 steps, done\n",
      "Run episode 3371 with rewards -536.2978566066922 with 84 steps, done\n",
      "Run episode 3372 with rewards -1062.4837409989589 with 111 steps, done\n",
      "Run episode 3373 with rewards -508.81555416206385 with 58 steps, done\n",
      "Run episode 3374 with rewards -809.6032732357717 with 81 steps, done\n",
      "Run episode 3375 with rewards -128.83526066755684 with 71 steps, done\n",
      "Run episode 3376 with rewards -579.8812258178475 with 70 steps, done\n",
      "Run episode 3377 with rewards -353.7602710028321 with 78 steps, done\n",
      "Run episode 3378 with rewards -720.6119960770505 with 80 steps, done\n",
      "Run episode 3379 with rewards -361.68142012442416 with 88 steps, done\n",
      "Run episode 3380 with rewards -835.6246343948725 with 155 steps, done\n",
      "Run episode 3381 with rewards -160.1521626725796 with 56 steps, done\n",
      "Run episode 3382 with rewards -1498.0049906408024 with 207 steps, done\n",
      "Run episode 3383 with rewards -157.46921277222089 with 71 steps, done\n",
      "Run episode 3384 with rewards -2889.3184564882904 with 299 steps, done\n",
      "Run episode 3385 with rewards -114.72151677682295 with 59 steps, done\n",
      "Run episode 3386 with rewards -812.7689949173536 with 97 steps, done\n",
      "Run episode 3387 with rewards -449.19246075646254 with 74 steps, done\n",
      "Run episode 3388 with rewards -1354.7432006020877 with 214 steps, done\n",
      "Run episode 3389 with rewards -225.47182990244042 with 62 steps, done\n",
      "Run episode 3390 with rewards -568.0234798609895 with 91 steps, done\n",
      "Run episode 3391 with rewards -110.74731932401798 with 66 steps, done\n",
      "Run episode 3392 with rewards -79.19129575730052 with 103 steps, done\n",
      "Run episode 3393 with rewards -382.2619834452664 with 58 steps, done\n",
      "Run episode 3394 with rewards -693.8779215558005 with 131 steps, done\n",
      "Run episode 3395 with rewards -278.0978241053366 with 84 steps, done\n",
      "Run episode 3396 with rewards -356.29802457147923 with 76 steps, done\n",
      "Run episode 3397 with rewards -219.6842119898427 with 88 steps, done\n",
      "Run episode 3398 with rewards -656.4123170759686 with 136 steps, done\n",
      "Run episode 3399 with rewards -103.53872826660762 with 59 steps, done\n",
      "Run episode 3400 with rewards -788.2674026211042 with 140 steps, done\n",
      "Run episode 3401 with rewards -266.93090094952527 with 71 steps, done\n",
      "Run episode 3402 with rewards -467.96068986388366 with 101 steps, done\n",
      "Run episode 3403 with rewards -153.17969943419962 with 59 steps, done\n",
      "Run episode 3404 with rewards -555.8683030374626 with 81 steps, done\n",
      "Run episode 3405 with rewards -309.3064275771467 with 78 steps, done\n",
      "Run episode 3406 with rewards -647.6169256118831 with 99 steps, done\n",
      "Run episode 3407 with rewards -472.7022745749148 with 55 steps, done\n",
      "Run episode 3408 with rewards -551.1802997695637 with 111 steps, done\n",
      "Run episode 3409 with rewards -316.9293469189985 with 59 steps, done\n",
      "Run episode 3410 with rewards -711.467871035842 with 180 steps, done\n",
      "Run episode 3411 with rewards -94.16962577972294 with 51 steps, done\n",
      "Run episode 3412 with rewards -538.2671219938015 with 94 steps, done\n",
      "Run episode 3413 with rewards -168.21017914587722 with 55 steps, done\n",
      "Run episode 3414 with rewards -617.6707089662202 with 85 steps, done\n",
      "Run episode 3415 with rewards -123.32498387147791 with 59 steps, done\n",
      "Run episode 3416 with rewards -511.67451619035734 with 131 steps, done\n",
      "Run episode 3417 with rewards -110.51981023825873 with 53 steps, done\n",
      "Run episode 3418 with rewards -709.8283214247207 with 112 steps, done\n",
      "Run episode 3419 with rewards -168.74334916290047 with 80 steps, done\n",
      "Run episode 3420 with rewards -1831.585216951161 with 223 steps, done\n",
      "Run episode 3421 with rewards -136.21123206429922 with 76 steps, done\n",
      "Run episode 3422 with rewards -433.1136068261734 with 81 steps, done\n",
      "Run episode 3423 with rewards -139.69719395629753 with 108 steps, done\n",
      "Run episode 3424 with rewards -952.0825678955962 with 101 steps, done\n",
      "Run episode 3425 with rewards -119.53372331214291 with 76 steps, done\n",
      "Run episode 3426 with rewards -584.7794039395187 with 100 steps, done\n",
      "Run episode 3427 with rewards -164.75676260260528 with 65 steps, done\n",
      "Run episode 3428 with rewards -902.889347505735 with 141 steps, done\n",
      "Run episode 3429 with rewards -143.7145374341217 with 88 steps, done\n",
      "Run episode 3430 with rewards -839.0784613356376 with 114 steps, done\n",
      "Run episode 3431 with rewards -102.08410296658575 with 90 steps, done\n",
      "Run episode 3432 with rewards -768.5492418158141 with 95 steps, done\n",
      "Run episode 3433 with rewards -40.50297741169395 with 81 steps, done\n",
      "Run episode 3434 with rewards -153.557119689985 with 116 steps, done\n",
      "Run episode 3435 with rewards -652.8488275774222 with 69 steps, done\n",
      "Run episode 3436 with rewards -360.91702557052747 with 73 steps, done\n",
      "Run episode 3437 with rewards -546.586557494476 with 69 steps, done\n",
      "Run episode 3438 with rewards -180.20873978483522 with 66 steps, done\n",
      "Run episode 3439 with rewards -578.7273299104672 with 63 steps, done\n",
      "Run episode 3440 with rewards -225.38760647154027 with 74 steps, done\n",
      "Run episode 3441 with rewards -482.62825834272417 with 60 steps, done\n",
      "Run episode 3442 with rewards -193.38681388483423 with 78 steps, done\n",
      "Run episode 3443 with rewards -2256.917858525098 with 182 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 3444 with rewards -712.5413562446662 with 80 steps, done\n",
      "Run episode 3445 with rewards -161.04298491372683 with 71 steps, done\n",
      "Run episode 3446 with rewards -526.9389793562453 with 60 steps, done\n",
      "Run episode 3447 with rewards -179.4839060554054 with 55 steps, done\n",
      "Run episode 3448 with rewards -374.48443699728904 with 49 steps, done\n",
      "Run episode 3449 with rewards -110.36099759065573 with 56 steps, done\n",
      "Run episode 3450 with rewards -118.78600945465163 with 117 steps, done\n",
      "Run episode 3451 with rewards -151.72133033690844 with 82 steps, done\n",
      "Run episode 3452 with rewards -633.4424220309928 with 78 steps, done\n",
      "Run episode 3453 with rewards -178.65301157938657 with 76 steps, done\n",
      "Run episode 3454 with rewards -643.0695536624083 with 131 steps, done\n",
      "Run episode 3455 with rewards -571.3256768617675 with 93 steps, done\n",
      "Run episode 3456 with rewards -142.32796533226428 with 67 steps, done\n",
      "Run episode 3457 with rewards -646.3823457828818 with 95 steps, done\n",
      "Run episode 3458 with rewards -160.5236556541699 with 62 steps, done\n",
      "Run episode 3459 with rewards -994.7059405579287 with 153 steps, done\n",
      "Run episode 3460 with rewards -215.96900420773613 with 77 steps, done\n",
      "Run episode 3461 with rewards -713.8428367549177 with 91 steps, done\n",
      "Run episode 3462 with rewards -170.8949688860938 with 68 steps, done\n",
      "Run episode 3463 with rewards -851.1609618927239 with 118 steps, done\n",
      "Run episode 3464 with rewards -699.7557296382818 with 78 steps, done\n",
      "Run episode 3465 with rewards -807.9472896364402 with 112 steps, done\n",
      "Run episode 3466 with rewards -801.5975399513466 with 82 steps, done\n",
      "Run episode 3467 with rewards -742.9520062707196 with 104 steps, done\n",
      "Run episode 3468 with rewards -198.92185419621995 with 78 steps, done\n",
      "Run episode 3469 with rewards -422.4852575137173 with 74 steps, done\n",
      "Run episode 3470 with rewards -245.97040081377486 with 89 steps, done\n",
      "Run episode 3471 with rewards -649.3541823306623 with 101 steps, done\n",
      "Run episode 3472 with rewards -419.8836993977679 with 79 steps, done\n",
      "Run episode 3473 with rewards -110.72957872333802 with 78 steps, done\n",
      "Run episode 3474 with rewards -93.84267767272935 with 81 steps, done\n",
      "Run episode 3475 with rewards -177.07773748035186 with 87 steps, done\n",
      "Run episode 3476 with rewards -617.0769956804119 with 61 steps, done\n",
      "Run episode 3477 with rewards -1549.2092132349107 with 237 steps, done\n",
      "Run episode 3478 with rewards -130.4967765772248 with 91 steps, done\n",
      "Run episode 3479 with rewards -442.0348466672531 with 92 steps, done\n",
      "Run episode 3480 with rewards -92.2573919743672 with 53 steps, done\n",
      "Run episode 3481 with rewards -663.6260009523519 with 112 steps, done\n",
      "Run episode 3482 with rewards -145.59175573188932 with 59 steps, done\n",
      "Run episode 3483 with rewards -606.6435687877704 with 99 steps, done\n",
      "Run episode 3484 with rewards -126.34868416163947 with 58 steps, done\n",
      "Run episode 3485 with rewards -755.3018928241095 with 133 steps, done\n",
      "Run episode 3486 with rewards -101.82438566702122 with 52 steps, done\n",
      "Run episode 3487 with rewards -959.5847041803738 with 134 steps, done\n",
      "Run episode 3488 with rewards -116.89979617230446 with 82 steps, done\n",
      "Run episode 3489 with rewards -636.4992587759946 with 116 steps, done\n",
      "Run episode 3490 with rewards -143.24879395842373 with 77 steps, done\n",
      "Run episode 3491 with rewards -683.5353782412996 with 118 steps, done\n",
      "Run episode 3492 with rewards -581.1651598259617 with 76 steps, done\n",
      "Run episode 3493 with rewards -80.22970065496564 with 62 steps, done\n",
      "Run episode 3494 with rewards -568.7268146820211 with 74 steps, done\n",
      "Run episode 3495 with rewards -355.00566586178115 with 84 steps, done\n",
      "Run episode 3496 with rewards -155.10635974185317 with 75 steps, done\n",
      "Run episode 3497 with rewards -118.31550500301195 with 93 steps, done\n",
      "Run episode 3498 with rewards -170.24909112358122 with 77 steps, done\n",
      "Run episode 3499 with rewards -117.26992894235653 with 80 steps, done\n",
      "Run episode 3500 with rewards -359.97856805776945 with 58 steps, done\n",
      "Run episode 3501 with rewards -405.84651158224 with 69 steps, done\n",
      "Run episode 3502 with rewards -907.6450147008771 with 82 steps, done\n",
      "Run episode 3503 with rewards -511.9982583891159 with 60 steps, done\n",
      "Run episode 3504 with rewards -480.13172601357314 with 68 steps, done\n",
      "Run episode 3505 with rewards -517.0144240975598 with 69 steps, done\n",
      "Run episode 3506 with rewards -692.5494104103406 with 108 steps, done\n",
      "Run episode 3507 with rewards -513.6130325915467 with 66 steps, done\n",
      "Run episode 3508 with rewards -774.8243683099478 with 143 steps, done\n",
      "Run episode 3509 with rewards -522.9136433349478 with 62 steps, done\n",
      "Run episode 3510 with rewards -619.6841918320116 with 118 steps, done\n",
      "Run episode 3511 with rewards -494.06583820899834 with 73 steps, done\n",
      "Run episode 3512 with rewards -351.8086244807963 with 104 steps, done\n",
      "Run episode 3513 with rewards -488.24939997778205 with 66 steps, done\n",
      "Run episode 3514 with rewards -157.63703158617503 with 82 steps, done\n",
      "Run episode 3515 with rewards 32.49489219329476 with 133 steps, done\n",
      "best\n",
      "Run episode 3516 with rewards -969.9184031661815 with 128 steps, done\n",
      "Run episode 3517 with rewards -471.1351631807615 with 65 steps, done\n",
      "Run episode 3518 with rewards -632.8473411069742 with 80 steps, done\n",
      "Run episode 3519 with rewards -544.7125047538134 with 105 steps, done\n",
      "Run episode 3520 with rewards -375.9948568956057 with 50 steps, done\n",
      "Run episode 3521 with rewards -120.39447055992667 with 94 steps, done\n",
      "Run episode 3522 with rewards -465.0408075871916 with 76 steps, done\n",
      "Run episode 3523 with rewards -349.6233720471582 with 59 steps, done\n",
      "Run episode 3524 with rewards -489.8794796396584 with 112 steps, done\n",
      "Run episode 3525 with rewards -178.3889754896254 with 75 steps, done\n",
      "Run episode 3526 with rewards -473.0112633666292 with 77 steps, done\n",
      "Run episode 3527 with rewards -126.44575797305745 with 60 steps, done\n",
      "Run episode 3528 with rewards -894.8183912901964 with 126 steps, done\n",
      "Run episode 3529 with rewards -112.71756405072976 with 55 steps, done\n",
      "Run episode 3530 with rewards -485.93360638473104 with 84 steps, done\n",
      "Run episode 3531 with rewards -158.9748454853588 with 58 steps, done\n",
      "Run episode 3532 with rewards -466.98230050454794 with 76 steps, done\n",
      "Run episode 3533 with rewards -278.4038967792541 with 72 steps, done\n",
      "Run episode 3534 with rewards -607.7161526481693 with 72 steps, done\n",
      "Run episode 3535 with rewards -453.0966819572278 with 54 steps, done\n",
      "Run episode 3536 with rewards -688.000201681057 with 112 steps, done\n",
      "Run episode 3537 with rewards -890.2150865402735 with 82 steps, done\n",
      "Run episode 3538 with rewards -363.4182427561985 with 106 steps, done\n",
      "Run episode 3539 with rewards -516.6898734004042 with 61 steps, done\n",
      "Run episode 3540 with rewards -577.0060121262098 with 114 steps, done\n",
      "Run episode 3541 with rewards -699.1631929868587 with 73 steps, done\n",
      "Run episode 3542 with rewards -581.5307550700734 with 132 steps, done\n",
      "Run episode 3543 with rewards -142.2546548685685 with 55 steps, done\n",
      "Run episode 3544 with rewards -47.33411824435976 with 84 steps, done\n",
      "Run episode 3545 with rewards -105.2217326322673 with 60 steps, done\n",
      "Run episode 3546 with rewards -114.76308393119749 with 70 steps, done\n",
      "Run episode 3547 with rewards -479.91654933901816 with 87 steps, done\n",
      "Run episode 3548 with rewards -382.62737216938586 with 53 steps, done\n",
      "Run episode 3549 with rewards -209.38739654509612 with 76 steps, done\n",
      "Run episode 3550 with rewards -480.5359188943536 with 56 steps, done\n",
      "Run episode 3551 with rewards -688.9630985966822 with 70 steps, done\n",
      "Run episode 3552 with rewards -549.8514122836048 with 67 steps, done\n",
      "Run episode 3553 with rewards -667.5727626530517 with 90 steps, done\n",
      "Run episode 3554 with rewards -556.1311479019073 with 67 steps, done\n",
      "Run episode 3555 with rewards -676.8916335196881 with 102 steps, done\n",
      "Run episode 3556 with rewards -436.33857463911255 with 53 steps, done\n",
      "Run episode 3557 with rewards -413.24240317357203 with 85 steps, done\n",
      "Run episode 3558 with rewards -352.40290398550115 with 75 steps, done\n",
      "Run episode 3559 with rewards -553.4860076871355 with 64 steps, done\n",
      "Run episode 3560 with rewards 10.366745880318746 with 71 steps, done\n",
      "Run episode 3561 with rewards -510.38434788052587 with 66 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 3562 with rewards -398.2919335524021 with 76 steps, done\n",
      "Run episode 3563 with rewards -281.13451390168944 with 103 steps, done\n",
      "Run episode 3564 with rewards -918.156411720201 with 117 steps, done\n",
      "Run episode 3565 with rewards -138.76651325686535 with 63 steps, done\n",
      "Run episode 3566 with rewards -435.1040812038528 with 85 steps, done\n",
      "Run episode 3567 with rewards -108.90415352293184 with 98 steps, done\n",
      "Run episode 3568 with rewards -485.90454432308354 with 75 steps, done\n",
      "Run episode 3569 with rewards -326.05701598826363 with 100 steps, done\n",
      "Run episode 3570 with rewards -164.8621119509957 with 84 steps, done\n",
      "Run episode 3571 with rewards -130.74461897851347 with 82 steps, done\n",
      "Run episode 3572 with rewards -163.05229250360057 with 69 steps, done\n",
      "Run episode 3573 with rewards -316.2609405713632 with 94 steps, done\n",
      "Run episode 3574 with rewards -140.60501572226622 with 89 steps, done\n",
      "Run episode 3575 with rewards -267.1451295098999 with 94 steps, done\n",
      "Run episode 3576 with rewards -79.44944321191423 with 62 steps, done\n",
      "Run episode 3577 with rewards -601.3246327342372 with 81 steps, done\n",
      "Run episode 3578 with rewards -174.30722531214633 with 66 steps, done\n",
      "Run episode 3579 with rewards -723.5523671651792 with 93 steps, done\n",
      "Run episode 3580 with rewards -151.28350387484997 with 67 steps, done\n",
      "Run episode 3581 with rewards -816.5888413393295 with 97 steps, done\n",
      "Run episode 3582 with rewards -181.35330726390663 with 73 steps, done\n",
      "Run episode 3583 with rewards -730.9424064466202 with 90 steps, done\n",
      "Run episode 3584 with rewards -144.9114986237492 with 77 steps, done\n",
      "Run episode 3585 with rewards -572.7184644343635 with 103 steps, done\n",
      "Run episode 3586 with rewards -110.13114511237616 with 56 steps, done\n",
      "Run episode 3587 with rewards -636.7323637695071 with 99 steps, done\n",
      "Run episode 3588 with rewards -160.84183714676846 with 66 steps, done\n",
      "Run episode 3589 with rewards -646.3230177851076 with 102 steps, done\n",
      "Run episode 3590 with rewards -111.34198625627407 with 56 steps, done\n",
      "Run episode 3591 with rewards -626.6445008584815 with 97 steps, done\n",
      "Run episode 3592 with rewards -227.675859828695 with 81 steps, done\n",
      "Run episode 3593 with rewards -899.8690754218184 with 116 steps, done\n",
      "Run episode 3594 with rewards -155.6201452167159 with 66 steps, done\n",
      "Run episode 3595 with rewards -646.6516983474393 with 110 steps, done\n",
      "Run episode 3596 with rewards -169.0205898644506 with 94 steps, done\n",
      "Run episode 3597 with rewards -588.6125689647101 with 78 steps, done\n",
      "Run episode 3598 with rewards -147.7387379492709 with 61 steps, done\n",
      "Run episode 3599 with rewards -397.4708221702622 with 87 steps, done\n",
      "Run episode 3600 with rewards -153.2352078669552 with 104 steps, done\n",
      "Run episode 3601 with rewards -264.03693125239454 with 87 steps, done\n",
      "Run episode 3602 with rewards -354.7720256899404 with 133 steps, done\n",
      "Run episode 3603 with rewards -125.36794334570939 with 56 steps, done\n",
      "Run episode 3604 with rewards -138.28202781320954 with 85 steps, done\n",
      "Run episode 3605 with rewards -63.80732545410662 with 138 steps, done\n",
      "Run episode 3606 with rewards -814.4756032029313 with 112 steps, done\n",
      "Run episode 3607 with rewards -377.56301533706323 with 85 steps, done\n",
      "Run episode 3608 with rewards -109.62150644308737 with 65 steps, done\n",
      "Run episode 3609 with rewards -1021.1041502054719 with 170 steps, done\n",
      "Run episode 3610 with rewards -460.27669398590365 with 60 steps, done\n",
      "Run episode 3611 with rewards -333.3460299188582 with 78 steps, done\n",
      "Run episode 3612 with rewards -751.5975727608584 with 81 steps, done\n",
      "Run episode 3613 with rewards -130.00615100166715 with 50 steps, done\n",
      "Run episode 3614 with rewards -899.979713797466 with 81 steps, done\n",
      "Run episode 3615 with rewards -521.8342544634158 with 116 steps, done\n",
      "Run episode 3616 with rewards -477.0435125497031 with 54 steps, done\n",
      "Run episode 3617 with rewards -475.35156157366566 with 111 steps, done\n",
      "Run episode 3618 with rewards -508.30471581650767 with 66 steps, done\n",
      "Run episode 3619 with rewards -873.1384736396561 with 116 steps, done\n",
      "Run episode 3620 with rewards -134.25098457754058 with 76 steps, done\n",
      "Run episode 3621 with rewards -1333.173262509913 with 125 steps, done\n",
      "Run episode 3622 with rewards -738.0439573339844 with 84 steps, done\n",
      "Run episode 3623 with rewards -95.19201169543553 with 67 steps, done\n",
      "Run episode 3624 with rewards -1272.8227728248787 with 166 steps, done\n",
      "Run episode 3625 with rewards -157.67230803435336 with 72 steps, done\n",
      "Run episode 3626 with rewards -709.3049789687236 with 83 steps, done\n",
      "Run episode 3627 with rewards -564.9821187567031 with 101 steps, done\n",
      "Run episode 3628 with rewards -464.455276901957 with 71 steps, done\n",
      "Run episode 3629 with rewards -648.8108248418376 with 70 steps, done\n",
      "Run episode 3630 with rewards -604.2273573479788 with 122 steps, done\n",
      "Run episode 3631 with rewards -436.35028964719766 with 52 steps, done\n",
      "Run episode 3632 with rewards -460.9888840977329 with 74 steps, done\n",
      "Run episode 3633 with rewards -472.4185190501219 with 55 steps, done\n",
      "Run episode 3634 with rewards -398.16056210998124 with 161 steps, done\n",
      "Run episode 3635 with rewards -157.89489696099693 with 62 steps, done\n",
      "Run episode 3636 with rewards -311.2894206242557 with 51 steps, done\n",
      "Run episode 3637 with rewards -334.4748010702574 with 88 steps, done\n",
      "Run episode 3638 with rewards -423.6878085844146 with 56 steps, done\n",
      "Run episode 3639 with rewards -666.6235055652874 with 105 steps, done\n",
      "Run episode 3640 with rewards -390.58223216898546 with 52 steps, done\n",
      "Run episode 3641 with rewards -356.29701106028386 with 86 steps, done\n",
      "Run episode 3642 with rewards -531.2471648548692 with 59 steps, done\n",
      "Run episode 3643 with rewards -509.17260998066195 with 62 steps, done\n",
      "Run episode 3644 with rewards -581.6283429805246 with 113 steps, done\n",
      "Run episode 3645 with rewards -856.0717074195011 with 87 steps, done\n",
      "Run episode 3646 with rewards -314.48118434376283 with 72 steps, done\n",
      "Run episode 3647 with rewards -508.6541803738594 with 64 steps, done\n",
      "Run episode 3648 with rewards -800.8525060794309 with 82 steps, done\n",
      "Run episode 3649 with rewards -127.7959338358337 with 93 steps, done\n",
      "Run episode 3650 with rewards -499.2531035790086 with 91 steps, done\n",
      "Run episode 3651 with rewards -562.8624832631907 with 92 steps, done\n",
      "Run episode 3652 with rewards -584.1333209389411 with 63 steps, done\n",
      "Run episode 3653 with rewards -2047.392652930294 with 252 steps, done\n",
      "Run episode 3654 with rewards -737.5224430555585 with 75 steps, done\n",
      "Run episode 3655 with rewards -494.69728857793893 with 81 steps, done\n",
      "Run episode 3656 with rewards -127.97518818276704 with 58 steps, done\n",
      "Run episode 3657 with rewards -579.5980736285517 with 90 steps, done\n",
      "Run episode 3658 with rewards -151.84554007946048 with 52 steps, done\n",
      "Run episode 3659 with rewards -952.005916964081 with 140 steps, done\n",
      "Run episode 3660 with rewards -124.91739876203322 with 101 steps, done\n",
      "Run episode 3661 with rewards -144.70753580429246 with 88 steps, done\n",
      "Run episode 3662 with rewards -93.68565935045115 with 70 steps, done\n",
      "Run episode 3663 with rewards -243.4236256264356 with 126 steps, done\n",
      "Run episode 3664 with rewards -173.32126629130204 with 84 steps, done\n",
      "Run episode 3665 with rewards -143.96413328308813 with 59 steps, done\n",
      "Run episode 3666 with rewards -770.8456408201162 with 81 steps, done\n",
      "Run episode 3667 with rewards -490.93680905416204 with 76 steps, done\n",
      "Run episode 3668 with rewards -785.9036171312332 with 85 steps, done\n",
      "Run episode 3669 with rewards -302.1741044286352 with 86 steps, done\n",
      "Run episode 3670 with rewards -601.9374791926541 with 63 steps, done\n",
      "Run episode 3671 with rewards -487.3335895717698 with 110 steps, done\n",
      "Run episode 3672 with rewards -679.4303559950368 with 86 steps, done\n",
      "Run episode 3673 with rewards -300.1350022145481 with 127 steps, done\n",
      "Run episode 3674 with rewards -181.02553531429385 with 79 steps, done\n",
      "Run episode 3675 with rewards -302.3941198725733 with 83 steps, done\n",
      "Run episode 3676 with rewards -115.84277511265034 with 56 steps, done\n",
      "Run episode 3677 with rewards -282.12563740567873 with 111 steps, done\n",
      "Run episode 3678 with rewards -552.7705261036474 with 59 steps, done\n",
      "Run episode 3679 with rewards -182.54894905440526 with 87 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 3680 with rewards -1017.0130192061531 with 88 steps, done\n",
      "Run episode 3681 with rewards -513.3825207416969 with 84 steps, done\n",
      "Run episode 3682 with rewards -145.0425370666994 with 143 steps, done\n",
      "Run episode 3683 with rewards -1707.3053393027483 with 199 steps, done\n",
      "Run episode 3684 with rewards -323.3178282325383 with 85 steps, done\n",
      "Run episode 3685 with rewards -696.5770141974926 with 89 steps, done\n",
      "Run episode 3686 with rewards -143.08931427922766 with 60 steps, done\n",
      "Run episode 3687 with rewards -726.848387502138 with 99 steps, done\n",
      "Run episode 3688 with rewards -339.9351385034283 with 55 steps, done\n",
      "Run episode 3689 with rewards -473.9433775230989 with 63 steps, done\n",
      "Run episode 3690 with rewards -470.7030558564514 with 63 steps, done\n",
      "Run episode 3691 with rewards -492.64772797340765 with 65 steps, done\n",
      "Run episode 3692 with rewards -400.8798176875479 with 52 steps, done\n",
      "Run episode 3693 with rewards -632.0743549944879 with 98 steps, done\n",
      "Run episode 3694 with rewards -723.817374219427 with 81 steps, done\n",
      "Run episode 3695 with rewards -200.94999561172602 with 89 steps, done\n",
      "Run episode 3696 with rewards -500.3213592101862 with 69 steps, done\n",
      "Run episode 3697 with rewards -671.1510044578215 with 93 steps, done\n",
      "Run episode 3698 with rewards -500.6548810823455 with 55 steps, done\n",
      "Run episode 3699 with rewards -504.02534847010725 with 81 steps, done\n",
      "Run episode 3700 with rewards -420.95081692917535 with 53 steps, done\n",
      "Run episode 3701 with rewards -452.8298442085968 with 105 steps, done\n",
      "Run episode 3702 with rewards -199.39017617413077 with 61 steps, done\n",
      "Run episode 3703 with rewards -767.4669641986799 with 76 steps, done\n",
      "Run episode 3704 with rewards -450.7351265568149 with 86 steps, done\n",
      "Run episode 3705 with rewards -300.2793112501891 with 92 steps, done\n",
      "Run episode 3706 with rewards -178.835659699216 with 112 steps, done\n",
      "Run episode 3707 with rewards -3501.310960911556 with 347 steps, done\n",
      "Run episode 3708 with rewards -757.9280425427032 with 83 steps, done\n",
      "Run episode 3709 with rewards -251.59750175729056 with 78 steps, done\n",
      "Run episode 3710 with rewards -655.2298133933615 with 84 steps, done\n",
      "Run episode 3711 with rewards -174.03928433521338 with 71 steps, done\n",
      "Run episode 3712 with rewards -660.9847179295253 with 87 steps, done\n",
      "Run episode 3713 with rewards -680.4682190388546 with 102 steps, done\n",
      "Run episode 3714 with rewards -472.53277317607143 with 55 steps, done\n",
      "Run episode 3715 with rewards -641.7280262087055 with 65 steps, done\n",
      "Run episode 3716 with rewards -290.28193544205146 with 62 steps, done\n",
      "Run episode 3717 with rewards -798.7611644758117 with 83 steps, done\n",
      "Run episode 3718 with rewards -263.36113868381756 with 79 steps, done\n",
      "Run episode 3719 with rewards -561.0410943304387 with 108 steps, done\n",
      "Run episode 3720 with rewards -143.9068535037245 with 82 steps, done\n",
      "Run episode 3721 with rewards -772.4204443140655 with 103 steps, done\n",
      "Run episode 3722 with rewards -154.46658091783706 with 85 steps, done\n",
      "Run episode 3723 with rewards -524.6849563392229 with 60 steps, done\n",
      "Run episode 3724 with rewards -242.83349829281067 with 65 steps, done\n",
      "Run episode 3725 with rewards -427.78342476387945 with 59 steps, done\n",
      "Run episode 3726 with rewards -160.0994179598397 with 70 steps, done\n",
      "Run episode 3727 with rewards -987.5052450164469 with 178 steps, done\n",
      "Run episode 3728 with rewards -178.06261156385096 with 63 steps, done\n",
      "Run episode 3729 with rewards -379.7024245006978 with 52 steps, done\n",
      "Run episode 3730 with rewards -543.9605861076616 with 80 steps, done\n",
      "Run episode 3731 with rewards -520.6853820404208 with 69 steps, done\n",
      "Run episode 3732 with rewards -573.4363673020468 with 96 steps, done\n",
      "Run episode 3733 with rewards -512.8328602164329 with 59 steps, done\n",
      "Run episode 3734 with rewards -545.858612414338 with 91 steps, done\n",
      "Run episode 3735 with rewards -732.7434857726087 with 75 steps, done\n",
      "Run episode 3736 with rewards -480.1595648235105 with 84 steps, done\n",
      "Run episode 3737 with rewards -425.42111530961887 with 54 steps, done\n",
      "Run episode 3738 with rewards -369.12979099190693 with 109 steps, done\n",
      "Run episode 3739 with rewards -763.2898000024152 with 76 steps, done\n",
      "Run episode 3740 with rewards -126.70364413616126 with 65 steps, done\n",
      "Run episode 3741 with rewards -477.000023661226 with 63 steps, done\n",
      "Run episode 3742 with rewards -499.72544122651675 with 56 steps, done\n",
      "Run episode 3743 with rewards -1004.3097666694127 with 88 steps, done\n",
      "Run episode 3744 with rewards -205.026408855059 with 59 steps, done\n",
      "Run episode 3745 with rewards -1176.8905268411304 with 147 steps, done\n",
      "Run episode 3746 with rewards -502.2383969567989 with 54 steps, done\n",
      "Run episode 3747 with rewards -600.54491283996 with 115 steps, done\n",
      "Run episode 3748 with rewards -372.7361995340156 with 52 steps, done\n",
      "Run episode 3749 with rewards -329.9807691508651 with 74 steps, done\n",
      "Run episode 3750 with rewards -605.3731233557487 with 77 steps, done\n",
      "Run episode 3751 with rewards -488.7026787825893 with 73 steps, done\n",
      "Run episode 3752 with rewards -391.7787187671812 with 82 steps, done\n",
      "Run episode 3753 with rewards -672.402494335746 with 128 steps, done\n",
      "Run episode 3754 with rewards -515.205086376384 with 69 steps, done\n",
      "Run episode 3755 with rewards -534.5635158989794 with 116 steps, done\n",
      "Run episode 3756 with rewards -525.2178815308403 with 59 steps, done\n",
      "Run episode 3757 with rewards -116.96356898155983 with 73 steps, done\n",
      "Run episode 3758 with rewards -1600.8037069860197 with 209 steps, done\n",
      "Run episode 3759 with rewards -140.04953401807086 with 75 steps, done\n",
      "Run episode 3760 with rewards -778.6702510339043 with 83 steps, done\n",
      "Run episode 3761 with rewards -458.48438551207647 with 112 steps, done\n",
      "Run episode 3762 with rewards -553.9140435290298 with 61 steps, done\n",
      "Run episode 3763 with rewards -600.0483940169856 with 81 steps, done\n",
      "Run episode 3764 with rewards -555.4974908424458 with 77 steps, done\n",
      "Run episode 3765 with rewards -1436.6349433908438 with 185 steps, done\n",
      "Run episode 3766 with rewards -150.0146240524435 with 58 steps, done\n",
      "Run episode 3767 with rewards -688.4800838349809 with 109 steps, done\n",
      "Run episode 3768 with rewards -147.9302646210354 with 52 steps, done\n",
      "Run episode 3769 with rewards -530.1647396314482 with 76 steps, done\n",
      "Run episode 3770 with rewards -122.73712983088889 with 51 steps, done\n",
      "Run episode 3771 with rewards -497.4444101463755 with 91 steps, done\n",
      "Run episode 3772 with rewards -93.90460381022868 with 49 steps, done\n",
      "Run episode 3773 with rewards -644.6232847558028 with 79 steps, done\n",
      "Run episode 3774 with rewards -134.28780184567455 with 53 steps, done\n",
      "Run episode 3775 with rewards -1331.1257134240664 with 162 steps, done\n",
      "Run episode 3776 with rewards -172.6442315210169 with 62 steps, done\n",
      "Run episode 3777 with rewards -970.0759970194306 with 175 steps, done\n",
      "Run episode 3778 with rewards -116.86991272557208 with 82 steps, done\n",
      "Run episode 3779 with rewards -856.3250727934901 with 128 steps, done\n",
      "Run episode 3780 with rewards -131.76431085943506 with 66 steps, done\n",
      "Run episode 3781 with rewards -827.435503116404 with 136 steps, done\n",
      "Run episode 3782 with rewards -103.82347789541848 with 61 steps, done\n",
      "Run episode 3783 with rewards -529.5184861303719 with 87 steps, done\n",
      "Run episode 3784 with rewards -419.70130470062105 with 58 steps, done\n",
      "Run episode 3785 with rewards -174.61359555520374 with 81 steps, done\n",
      "Run episode 3786 with rewards -771.6248734227056 with 76 steps, done\n",
      "Run episode 3787 with rewards -26.057228397694686 with 78 steps, done\n",
      "Run episode 3788 with rewards -569.1597680788271 with 68 steps, done\n",
      "Run episode 3789 with rewards -610.2450162616339 with 90 steps, done\n",
      "Run episode 3790 with rewards -510.70300667452136 with 62 steps, done\n",
      "Run episode 3791 with rewards -508.037545201704 with 81 steps, done\n",
      "Run episode 3792 with rewards -426.15046811458393 with 55 steps, done\n",
      "Run episode 3793 with rewards -808.7333200638577 with 115 steps, done\n",
      "Run episode 3794 with rewards -508.48929617026334 with 59 steps, done\n",
      "Run episode 3795 with rewards -177.02106507204581 with 64 steps, done\n",
      "Run episode 3796 with rewards -71.69254599122041 with 73 steps, done\n",
      "Run episode 3797 with rewards -17.94420195181462 with 60 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 3798 with rewards -783.6348996956146 with 85 steps, done\n",
      "Run episode 3799 with rewards -165.54633448186235 with 75 steps, done\n",
      "Run episode 3800 with rewards -513.6639680845994 with 56 steps, done\n",
      "Run episode 3801 with rewards -342.9476987561409 with 67 steps, done\n",
      "Run episode 3802 with rewards -787.8211143909705 with 79 steps, done\n",
      "Run episode 3803 with rewards -367.2409457640123 with 80 steps, done\n",
      "Run episode 3804 with rewards -362.22159121957213 with 76 steps, done\n",
      "Run episode 3805 with rewards -478.3517422050429 with 90 steps, done\n",
      "Run episode 3806 with rewards -103.5073448169459 with 98 steps, done\n",
      "Run episode 3807 with rewards -75.01764352749069 with 99 steps, done\n",
      "Run episode 3808 with rewards -297.93920141928277 with 50 steps, done\n",
      "Run episode 3809 with rewards -857.4556991804768 with 79 steps, done\n",
      "Run episode 3810 with rewards -117.06053796625562 with 99 steps, done\n",
      "Run episode 3811 with rewards -57.09144432828979 with 84 steps, done\n",
      "Run episode 3812 with rewards -686.2337202218727 with 91 steps, done\n",
      "Run episode 3813 with rewards -740.2408393039261 with 77 steps, done\n",
      "Run episode 3814 with rewards -1240.1681425495663 with 166 steps, done\n",
      "Run episode 3815 with rewards -562.1140395635356 with 74 steps, done\n",
      "Run episode 3816 with rewards -634.737220830817 with 75 steps, done\n",
      "Run episode 3817 with rewards -133.75907219621098 with 64 steps, done\n",
      "Run episode 3818 with rewards -731.6686070564042 with 107 steps, done\n",
      "Run episode 3819 with rewards -147.50842515015592 with 84 steps, done\n",
      "Run episode 3820 with rewards -1850.6231372360269 with 371 steps, done\n",
      "Run episode 3821 with rewards -220.7393775150737 with 61 steps, done\n",
      "Run episode 3822 with rewards -157.67983112630304 with 66 steps, done\n",
      "Run episode 3823 with rewards -199.0257639782095 with 80 steps, done\n",
      "Run episode 3824 with rewards -204.7125196505396 with 95 steps, done\n",
      "Run episode 3825 with rewards -169.5771883014046 with 150 steps, done\n",
      "Run episode 3826 with rewards -156.84513008718648 with 77 steps, done\n",
      "Run episode 3827 with rewards -224.56880724817427 with 134 steps, done\n",
      "Run episode 3828 with rewards -441.5369728336393 with 79 steps, done\n",
      "Run episode 3829 with rewards -520.1718026639467 with 73 steps, done\n",
      "Run episode 3830 with rewards 11.775857037338312 with 95 steps, done\n",
      "Run episode 3831 with rewards -863.4704864994463 with 115 steps, done\n",
      "Run episode 3832 with rewards -113.5354679098876 with 69 steps, done\n",
      "Run episode 3833 with rewards -455.21611274799454 with 70 steps, done\n",
      "Run episode 3834 with rewards -578.4814996157116 with 116 steps, done\n",
      "Run episode 3835 with rewards -453.074526602949 with 64 steps, done\n",
      "Run episode 3836 with rewards -544.7267388255507 with 70 steps, done\n",
      "Run episode 3837 with rewards -732.4972987940605 with 76 steps, done\n",
      "Run episode 3838 with rewards -290.6207748666874 with 56 steps, done\n",
      "Run episode 3839 with rewards -471.54195288085833 with 54 steps, done\n",
      "Run episode 3840 with rewards -692.7738451823394 with 106 steps, done\n",
      "Run episode 3841 with rewards -906.2889932112712 with 86 steps, done\n",
      "Run episode 3842 with rewards -773.7097661909496 with 132 steps, done\n",
      "Run episode 3843 with rewards -432.6938703369114 with 54 steps, done\n",
      "Run episode 3844 with rewards -275.49838403686465 with 63 steps, done\n",
      "Run episode 3845 with rewards -271.37709618164195 with 123 steps, done\n",
      "Run episode 3846 with rewards -102.59829323608716 with 78 steps, done\n",
      "Run episode 3847 with rewards -152.72343451392894 with 109 steps, done\n",
      "Run episode 3848 with rewards -129.3140572510086 with 69 steps, done\n",
      "Run episode 3849 with rewards -645.7751271500547 with 67 steps, done\n",
      "Run episode 3850 with rewards -1108.448526570378 with 170 steps, done\n",
      "Run episode 3851 with rewards -530.8391703967148 with 86 steps, done\n",
      "Run episode 3852 with rewards -136.41290815324055 with 66 steps, done\n",
      "Run episode 3853 with rewards -91.68693975875989 with 97 steps, done\n",
      "Run episode 3854 with rewards -636.2887505096938 with 91 steps, done\n",
      "Run episode 3855 with rewards -514.8419355216711 with 58 steps, done\n",
      "Run episode 3856 with rewards -135.4706058049842 with 87 steps, done\n",
      "Run episode 3857 with rewards -2983.5530602013996 with 291 steps, done\n",
      "Run episode 3858 with rewards -889.0406573967812 with 86 steps, done\n",
      "Run episode 3859 with rewards -55.259454746701884 with 62 steps, done\n",
      "Run episode 3860 with rewards -476.68266334763746 with 81 steps, done\n",
      "Run episode 3861 with rewards -288.43478031037574 with 80 steps, done\n",
      "Run episode 3862 with rewards -2463.315709373914 with 287 steps, done\n",
      "Run episode 3863 with rewards -447.43003533435785 with 53 steps, done\n",
      "Run episode 3864 with rewards -567.5876749002803 with 119 steps, done\n",
      "Run episode 3865 with rewards -725.2192393680159 with 82 steps, done\n",
      "Run episode 3866 with rewards -673.5965523373268 with 101 steps, done\n",
      "Run episode 3867 with rewards -429.65829249275237 with 50 steps, done\n",
      "Run episode 3868 with rewards -557.1696490981864 with 92 steps, done\n",
      "Run episode 3869 with rewards -444.68473282444165 with 58 steps, done\n",
      "Run episode 3870 with rewards -348.9511058216991 with 81 steps, done\n",
      "Run episode 3871 with rewards -439.3847767766109 with 81 steps, done\n",
      "Run episode 3872 with rewards -676.6371327459613 with 75 steps, done\n",
      "Run episode 3873 with rewards -348.9926764716861 with 95 steps, done\n",
      "Run episode 3874 with rewards -734.2024877325414 with 77 steps, done\n",
      "Run episode 3875 with rewards -267.93805660495457 with 54 steps, done\n",
      "Run episode 3876 with rewards -856.4228362342634 with 81 steps, done\n",
      "Run episode 3877 with rewards -553.6767570837068 with 87 steps, done\n",
      "Run episode 3878 with rewards -691.4225038406162 with 68 steps, done\n",
      "Run episode 3879 with rewards -405.86712515005036 with 101 steps, done\n",
      "Run episode 3880 with rewards -620.9799617336625 with 71 steps, done\n",
      "Run episode 3881 with rewards -843.5163449527889 with 151 steps, done\n",
      "Run episode 3882 with rewards -433.2977578972782 with 59 steps, done\n",
      "Run episode 3883 with rewards -514.1780096666299 with 87 steps, done\n",
      "Run episode 3884 with rewards -715.6479240208442 with 79 steps, done\n",
      "Run episode 3885 with rewards -730.3978924898787 with 259 steps, done\n",
      "Run episode 3886 with rewards -441.6879956157336 with 59 steps, done\n",
      "Run episode 3887 with rewards -113.68216750562566 with 97 steps, done\n",
      "Run episode 3888 with rewards -723.7883771708775 with 81 steps, done\n",
      "Run episode 3889 with rewards -109.79722548889592 with 51 steps, done\n",
      "Run episode 3890 with rewards -206.53323681549836 with 92 steps, done\n",
      "Run episode 3891 with rewards -642.6366623793176 with 78 steps, done\n",
      "Run episode 3892 with rewards -748.7645761604742 with 113 steps, done\n",
      "Run episode 3893 with rewards -407.3663466559715 with 53 steps, done\n",
      "Run episode 3894 with rewards -464.31481113918466 with 53 steps, done\n",
      "Run episode 3895 with rewards -219.42717848788539 with 84 steps, done\n",
      "Run episode 3896 with rewards -467.5652780556352 with 69 steps, done\n",
      "Run episode 3897 with rewards -605.6143677410638 with 97 steps, done\n",
      "Run episode 3898 with rewards -359.40537109539184 with 54 steps, done\n",
      "Run episode 3899 with rewards -360.85917733364596 with 74 steps, done\n",
      "Run episode 3900 with rewards -635.1362473958197 with 65 steps, done\n",
      "Run episode 3901 with rewards -512.8697683105552 with 66 steps, done\n",
      "Run episode 3902 with rewards -1612.9845415593759 with 229 steps, done\n",
      "Run episode 3903 with rewards -369.36525642475834 with 85 steps, done\n",
      "Run episode 3904 with rewards -647.1248651905182 with 84 steps, done\n",
      "Run episode 3905 with rewards -757.6327440334774 with 75 steps, done\n",
      "Run episode 3906 with rewards -703.688966652968 with 99 steps, done\n",
      "Run episode 3907 with rewards -385.448990013356 with 49 steps, done\n",
      "Run episode 3908 with rewards -322.7373152242125 with 78 steps, done\n",
      "Run episode 3909 with rewards -580.8077266824853 with 65 steps, done\n",
      "Run episode 3910 with rewards -294.9966337107525 with 55 steps, done\n",
      "Run episode 3911 with rewards -111.53979066850599 with 53 steps, done\n",
      "Run episode 3912 with rewards -613.1850880670572 with 67 steps, done\n",
      "Run episode 3913 with rewards -400.91825855127206 with 75 steps, done\n",
      "Run episode 3914 with rewards -468.6887715703941 with 58 steps, done\n",
      "Run episode 3915 with rewards -491.65615077980715 with 105 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 3916 with rewards -530.5618055965012 with 58 steps, done\n",
      "Run episode 3917 with rewards -2438.5355588527705 with 260 steps, done\n",
      "Run episode 3918 with rewards -559.6415441673886 with 68 steps, done\n",
      "Run episode 3919 with rewards -460.34625788199304 with 78 steps, done\n",
      "Run episode 3920 with rewards -118.47194454021567 with 87 steps, done\n",
      "Run episode 3921 with rewards -561.8949731113942 with 77 steps, done\n",
      "Run episode 3922 with rewards -197.62520010830775 with 57 steps, done\n",
      "Run episode 3923 with rewards -136.0634027055283 with 72 steps, done\n",
      "Run episode 3924 with rewards -579.7081569046481 with 78 steps, done\n",
      "Run episode 3925 with rewards -460.8248553737645 with 61 steps, done\n",
      "Run episode 3926 with rewards -557.2132772934174 with 99 steps, done\n",
      "Run episode 3927 with rewards -788.0578232032083 with 83 steps, done\n",
      "Run episode 3928 with rewards -348.30338228101965 with 69 steps, done\n",
      "Run episode 3929 with rewards -699.9566262128013 with 80 steps, done\n",
      "Run episode 3930 with rewards -473.85712485928076 with 109 steps, done\n",
      "Run episode 3931 with rewards -353.4165987865647 with 95 steps, done\n",
      "Run episode 3932 with rewards -307.45678797188503 with 60 steps, done\n",
      "Run episode 3933 with rewards -388.4997851479151 with 53 steps, done\n",
      "Run episode 3934 with rewards -664.8857980276385 with 74 steps, done\n",
      "Run episode 3935 with rewards -395.7832861219933 with 94 steps, done\n",
      "Run episode 3936 with rewards -840.2702216311943 with 91 steps, done\n",
      "Run episode 3937 with rewards -397.8789104864699 with 108 steps, done\n",
      "Run episode 3938 with rewards -612.2222618198899 with 71 steps, done\n",
      "Run episode 3939 with rewards -160.15905762769407 with 85 steps, done\n",
      "Run episode 3940 with rewards -262.97039943388756 with 74 steps, done\n",
      "Run episode 3941 with rewards -107.60633801826216 with 58 steps, done\n",
      "Run episode 3942 with rewards -165.11492997859693 with 81 steps, done\n",
      "Run episode 3943 with rewards -394.86677971339975 with 58 steps, done\n",
      "Run episode 3944 with rewards -370.30544059526886 with 51 steps, done\n",
      "Run episode 3945 with rewards -579.3211409723893 with 103 steps, done\n",
      "Run episode 3946 with rewards -501.84755308935 with 55 steps, done\n",
      "Run episode 3947 with rewards -497.8361801657279 with 91 steps, done\n",
      "Run episode 3948 with rewards -719.22444684926 with 70 steps, done\n",
      "Run episode 3949 with rewards -305.65317757007045 with 98 steps, done\n",
      "Run episode 3950 with rewards -523.5921245538659 with 59 steps, done\n",
      "Run episode 3951 with rewards -559.7222590739968 with 107 steps, done\n",
      "Run episode 3952 with rewards -491.03113613706574 with 67 steps, done\n",
      "Run episode 3953 with rewards -586.7836026242344 with 92 steps, done\n",
      "Run episode 3954 with rewards -327.45840375186214 with 138 steps, done\n",
      "Run episode 3955 with rewards -282.89094524701636 with 51 steps, done\n",
      "Run episode 3956 with rewards -486.2996960104525 with 96 steps, done\n",
      "Run episode 3957 with rewards -116.53481845810427 with 64 steps, done\n",
      "Run episode 3958 with rewards -474.60576062772105 with 118 steps, done\n",
      "Run episode 3959 with rewards -587.4184506939132 with 65 steps, done\n",
      "Run episode 3960 with rewards -374.0113366066231 with 70 steps, done\n",
      "Run episode 3961 with rewards -646.4173201678598 with 71 steps, done\n",
      "Run episode 3962 with rewards -470.9900195809645 with 72 steps, done\n",
      "Run episode 3963 with rewards -275.0701529905897 with 115 steps, done\n",
      "Run episode 3964 with rewards -530.6819205939056 with 84 steps, done\n",
      "Run episode 3965 with rewards -145.61241129357225 with 60 steps, done\n",
      "Run episode 3966 with rewards -349.4733522057345 with 90 steps, done\n",
      "Run episode 3967 with rewards -367.8181083137049 with 63 steps, done\n",
      "Run episode 3968 with rewards -485.7747363371918 with 81 steps, done\n",
      "Run episode 3969 with rewards -631.6693609535732 with 97 steps, done\n",
      "Run episode 3970 with rewards -520.3255675235531 with 96 steps, done\n",
      "Run episode 3971 with rewards -738.5892904557919 with 71 steps, done\n",
      "Run episode 3972 with rewards -559.7706095560172 with 76 steps, done\n",
      "Run episode 3973 with rewards -886.8845432024984 with 82 steps, done\n",
      "Run episode 3974 with rewards -366.42200448626465 with 76 steps, done\n",
      "Run episode 3975 with rewards -599.5475154180712 with 63 steps, done\n",
      "Run episode 3976 with rewards -580.7760613066906 with 83 steps, done\n",
      "Run episode 3977 with rewards -373.0338901438507 with 54 steps, done\n",
      "Run episode 3978 with rewards -659.6222885022839 with 119 steps, done\n",
      "Run episode 3979 with rewards -352.7682020233839 with 55 steps, done\n",
      "Run episode 3980 with rewards -367.4905805433561 with 100 steps, done\n",
      "Run episode 3981 with rewards -679.7428408404071 with 111 steps, done\n",
      "Run episode 3982 with rewards -143.36139804858897 with 53 steps, done\n",
      "Run episode 3983 with rewards -821.618744802561 with 130 steps, done\n",
      "Run episode 3984 with rewards -133.17966953450298 with 59 steps, done\n",
      "Run episode 3985 with rewards -465.8271644194549 with 60 steps, done\n",
      "Run episode 3986 with rewards -919.712566178158 with 92 steps, done\n",
      "Run episode 3987 with rewards -786.3608015798596 with 76 steps, done\n",
      "Run episode 3988 with rewards -467.5763885019628 with 59 steps, done\n",
      "Run episode 3989 with rewards -456.5849699244085 with 86 steps, done\n",
      "Run episode 3990 with rewards -486.47546226184426 with 60 steps, done\n",
      "Run episode 3991 with rewards -684.8325983459607 with 103 steps, done\n",
      "Run episode 3992 with rewards -569.8156777284972 with 72 steps, done\n",
      "Run episode 3993 with rewards -569.1554860432004 with 72 steps, done\n",
      "Run episode 3994 with rewards -942.1590366822138 with 84 steps, done\n",
      "Run episode 3995 with rewards -405.2457190177929 with 58 steps, done\n",
      "Run episode 3996 with rewards -744.6344410973325 with 82 steps, done\n",
      "Run episode 3997 with rewards -630.7627011529645 with 93 steps, done\n",
      "Run episode 3998 with rewards -332.04909830088025 with 51 steps, done\n",
      "Run episode 3999 with rewards -641.1216166461974 with 100 steps, done\n",
      "Run episode 4000 with rewards -159.42603776061463 with 71 steps, done\n",
      "Run episode 4001 with rewards -659.4089699814081 with 98 steps, done\n",
      "Run episode 4002 with rewards -335.7364200881743 with 66 steps, done\n",
      "Run episode 4003 with rewards -638.8694448698569 with 125 steps, done\n",
      "Run episode 4004 with rewards -681.3145029880101 with 99 steps, done\n",
      "Run episode 4005 with rewards -128.29220357934747 with 66 steps, done\n",
      "Run episode 4006 with rewards -584.0140141865091 with 75 steps, done\n",
      "Run episode 4007 with rewards -216.4950267973107 with 74 steps, done\n",
      "Run episode 4008 with rewards -760.4247372605826 with 130 steps, done\n",
      "Run episode 4009 with rewards -161.60026869983878 with 66 steps, done\n",
      "Run episode 4010 with rewards -419.9048585043076 with 56 steps, done\n",
      "Run episode 4011 with rewards -398.199223947935 with 79 steps, done\n",
      "Run episode 4012 with rewards -608.5594664328931 with 65 steps, done\n",
      "Run episode 4013 with rewards -1712.5300915257465 with 230 steps, done\n",
      "Run episode 4014 with rewards -175.77917536105804 with 59 steps, done\n",
      "Run episode 4015 with rewards -743.3795572088004 with 109 steps, done\n",
      "Run episode 4016 with rewards -189.75108801295278 with 82 steps, done\n",
      "Run episode 4017 with rewards -476.5841680373789 with 184 steps, done\n",
      "Run episode 4018 with rewards -395.0133588238883 with 79 steps, done\n",
      "Run episode 4019 with rewards -101.48455558595654 with 52 steps, done\n",
      "Run episode 4020 with rewards -93.57272731152415 with 81 steps, done\n",
      "Run episode 4021 with rewards -123.32315945697903 with 69 steps, done\n",
      "Run episode 4022 with rewards -147.4527167989824 with 95 steps, done\n",
      "Run episode 4023 with rewards -429.2037523385066 with 67 steps, done\n",
      "Run episode 4024 with rewards -815.3695292523086 with 82 steps, done\n",
      "Run episode 4025 with rewards -486.0212385480155 with 72 steps, done\n",
      "Run episode 4026 with rewards -641.3764270025467 with 94 steps, done\n",
      "Run episode 4027 with rewards -654.7007784560242 with 71 steps, done\n",
      "Run episode 4028 with rewards -795.604950056678 with 126 steps, done\n",
      "Run episode 4029 with rewards -323.32708929636647 with 104 steps, done\n",
      "Run episode 4030 with rewards -348.73260684238994 with 63 steps, done\n",
      "Run episode 4031 with rewards -516.400445454464 with 57 steps, done\n",
      "Run episode 4032 with rewards -705.9998311679625 with 84 steps, done\n",
      "Run episode 4033 with rewards -727.9435968363046 with 109 steps, done\n",
      "Run episode 4034 with rewards -780.5341189910631 with 83 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 4035 with rewards -552.8435215030684 with 90 steps, done\n",
      "Run episode 4036 with rewards -504.30140988953235 with 57 steps, done\n",
      "Run episode 4037 with rewards -527.2783638180651 with 86 steps, done\n",
      "Run episode 4038 with rewards -773.4233619955711 with 77 steps, done\n",
      "Run episode 4039 with rewards -263.2490867459925 with 87 steps, done\n",
      "Run episode 4040 with rewards -445.6690403524623 with 60 steps, done\n",
      "Run episode 4041 with rewards -605.381801044894 with 80 steps, done\n",
      "Run episode 4042 with rewards -460.08866385428837 with 71 steps, done\n",
      "Run episode 4043 with rewards -549.9946844092284 with 59 steps, done\n",
      "Run episode 4044 with rewards -440.5901512394576 with 87 steps, done\n",
      "Run episode 4045 with rewards -650.6060420084542 with 67 steps, done\n",
      "Run episode 4046 with rewards -866.1549879840219 with 80 steps, done\n",
      "Run episode 4047 with rewards -396.3414693296449 with 108 steps, done\n",
      "Run episode 4048 with rewards -325.1344141816527 with 86 steps, done\n",
      "Run episode 4049 with rewards -592.0215940441534 with 151 steps, done\n",
      "Run episode 4050 with rewards -476.6525918864932 with 61 steps, done\n",
      "Run episode 4051 with rewards -576.5203165472606 with 123 steps, done\n",
      "Run episode 4052 with rewards -332.55056985427336 with 66 steps, done\n",
      "Run episode 4053 with rewards -288.05183018741235 with 69 steps, done\n",
      "Run episode 4054 with rewards -741.2908991736606 with 82 steps, done\n",
      "Run episode 4055 with rewards -367.4901708289906 with 61 steps, done\n",
      "Run episode 4056 with rewards -691.8404829508884 with 72 steps, done\n",
      "Run episode 4057 with rewards -520.0738746377223 with 100 steps, done\n",
      "Run episode 4058 with rewards -786.2845274157737 with 91 steps, done\n",
      "Run episode 4059 with rewards -655.1100452287757 with 83 steps, done\n",
      "Run episode 4060 with rewards -437.60757125517307 with 59 steps, done\n",
      "Run episode 4061 with rewards -503.1541845355746 with 83 steps, done\n",
      "Run episode 4062 with rewards -163.63232630194085 with 64 steps, done\n",
      "Run episode 4063 with rewards -479.26643541240253 with 56 steps, done\n",
      "Run episode 4064 with rewards -462.2958805875502 with 99 steps, done\n",
      "Run episode 4065 with rewards -604.2731452097797 with 83 steps, done\n",
      "Run episode 4066 with rewards -1893.6575967749438 with 250 steps, done\n",
      "Run episode 4067 with rewards -488.5050326478657 with 63 steps, done\n",
      "Run episode 4068 with rewards -531.5857115910044 with 77 steps, done\n",
      "Run episode 4069 with rewards -545.0907477783203 with 59 steps, done\n",
      "Run episode 4070 with rewards -484.81337336470534 with 72 steps, done\n",
      "Run episode 4071 with rewards -516.8061600722331 with 63 steps, done\n",
      "Run episode 4072 with rewards -624.4883962736229 with 88 steps, done\n",
      "Run episode 4073 with rewards -372.70381509468524 with 54 steps, done\n",
      "Run episode 4074 with rewards -536.5744616083214 with 76 steps, done\n",
      "Run episode 4075 with rewards -145.5798666289634 with 68 steps, done\n",
      "Run episode 4076 with rewards -1262.4990070601057 with 168 steps, done\n",
      "Run episode 4077 with rewards -216.46691933015546 with 67 steps, done\n",
      "Run episode 4078 with rewards -440.14648679085207 with 74 steps, done\n",
      "Run episode 4079 with rewards -883.8464954374278 with 84 steps, done\n",
      "Run episode 4080 with rewards -565.5771879104509 with 80 steps, done\n",
      "Run episode 4081 with rewards -427.97249970684436 with 58 steps, done\n",
      "Run episode 4082 with rewards -263.2887988769864 with 86 steps, done\n",
      "Run episode 4083 with rewards -666.1952696899766 with 104 steps, done\n",
      "Run episode 4084 with rewards -558.2132610289162 with 67 steps, done\n",
      "Run episode 4085 with rewards -459.88687443324727 with 67 steps, done\n",
      "Run episode 4086 with rewards -469.2438100895072 with 75 steps, done\n",
      "Run episode 4087 with rewards -507.3590738890696 with 69 steps, done\n",
      "Run episode 4088 with rewards -528.35124756408 with 107 steps, done\n",
      "Run episode 4089 with rewards -411.666738305957 with 57 steps, done\n",
      "Run episode 4090 with rewards -80.0428462028245 with 52 steps, done\n",
      "Run episode 4091 with rewards -284.0366241555498 with 187 steps, done\n",
      "Run episode 4092 with rewards -90.98541581163283 with 56 steps, done\n",
      "Run episode 4093 with rewards -191.79894470223002 with 116 steps, done\n",
      "Run episode 4094 with rewards -391.3176095124397 with 56 steps, done\n",
      "Run episode 4095 with rewards -411.35664183548687 with 56 steps, done\n",
      "Run episode 4096 with rewards -648.2867362521326 with 102 steps, done\n",
      "Run episode 4097 with rewards -968.4126672539295 with 88 steps, done\n",
      "Run episode 4098 with rewards -210.6683343950755 with 64 steps, done\n",
      "Run episode 4099 with rewards -432.7392718451931 with 55 steps, done\n",
      "Run episode 4100 with rewards -588.147657232792 with 103 steps, done\n",
      "Run episode 4101 with rewards -404.39880445050443 with 53 steps, done\n",
      "Run episode 4102 with rewards -835.97606024691 with 80 steps, done\n",
      "Run episode 4103 with rewards -379.2606751440207 with 105 steps, done\n",
      "Run episode 4104 with rewards -497.64699562665334 with 59 steps, done\n",
      "Run episode 4105 with rewards -382.99806968718354 with 57 steps, done\n",
      "Run episode 4106 with rewards -506.9856847714485 with 77 steps, done\n",
      "Run episode 4107 with rewards -782.6237891715251 with 78 steps, done\n",
      "Run episode 4108 with rewards -257.72362385792644 with 98 steps, done\n",
      "Run episode 4109 with rewards -450.0393345042053 with 54 steps, done\n",
      "Run episode 4110 with rewards -501.9802988506446 with 66 steps, done\n",
      "Run episode 4111 with rewards -638.7745268647017 with 96 steps, done\n",
      "Run episode 4112 with rewards -411.7824257684153 with 56 steps, done\n",
      "Run episode 4113 with rewards -612.9841022303387 with 102 steps, done\n",
      "Run episode 4114 with rewards -502.33937377708594 with 64 steps, done\n",
      "Run episode 4115 with rewards -668.4957321714996 with 118 steps, done\n",
      "Run episode 4116 with rewards -672.9766157883834 with 69 steps, done\n",
      "Run episode 4117 with rewards -360.70753626709944 with 69 steps, done\n",
      "Run episode 4118 with rewards -730.1307063625214 with 80 steps, done\n",
      "Run episode 4119 with rewards -342.13288899233294 with 70 steps, done\n",
      "Run episode 4120 with rewards -649.1747851804586 with 100 steps, done\n",
      "Run episode 4121 with rewards -99.33854259263931 with 108 steps, done\n",
      "Run episode 4122 with rewards -1037.7560610144606 with 87 steps, done\n",
      "Run episode 4123 with rewards -871.6708782773205 with 91 steps, done\n",
      "Run episode 4124 with rewards -146.63310155276216 with 102 steps, done\n",
      "Run episode 4125 with rewards -607.1740621735712 with 102 steps, done\n",
      "Run episode 4126 with rewards -315.70268365058365 with 83 steps, done\n",
      "Run episode 4127 with rewards -505.4963965624093 with 88 steps, done\n",
      "Run episode 4128 with rewards -124.39480306478637 with 88 steps, done\n",
      "Run episode 4129 with rewards -716.3995694106454 with 102 steps, done\n",
      "Run episode 4130 with rewards -125.64520097086451 with 52 steps, done\n",
      "Run episode 4131 with rewards -3376.223904307151 with 347 steps, done\n",
      "Run episode 4132 with rewards -173.45801297333963 with 72 steps, done\n",
      "Run episode 4133 with rewards -3566.534521105006 with 342 steps, done\n",
      "Run episode 4134 with rewards -148.82625779011562 with 77 steps, done\n",
      "Run episode 4135 with rewards -742.0910983345847 with 101 steps, done\n",
      "Run episode 4136 with rewards -109.32394010812216 with 55 steps, done\n",
      "Run episode 4137 with rewards -801.580392377381 with 111 steps, done\n",
      "Run episode 4138 with rewards -139.30768793380412 with 84 steps, done\n",
      "Run episode 4139 with rewards -705.3003303425165 with 95 steps, done\n",
      "Run episode 4140 with rewards -491.83263369039264 with 55 steps, done\n",
      "Run episode 4141 with rewards -256.28479854865213 with 73 steps, done\n",
      "Run episode 4142 with rewards -1095.8799175903964 with 89 steps, done\n",
      "Run episode 4143 with rewards -685.3167846009663 with 97 steps, done\n",
      "Run episode 4144 with rewards -326.93132904284874 with 51 steps, done\n",
      "Run episode 4145 with rewards -220.37397355867284 with 110 steps, done\n",
      "Run episode 4146 with rewards -826.0201411380945 with 94 steps, done\n",
      "Run episode 4147 with rewards -553.6577625445256 with 92 steps, done\n",
      "Run episode 4148 with rewards -160.68217624224408 with 72 steps, done\n",
      "Run episode 4149 with rewards -79.26570741995013 with 75 steps, done\n",
      "Run episode 4150 with rewards -450.71515422319106 with 75 steps, done\n",
      "Run episode 4151 with rewards -135.0733146110634 with 76 steps, done\n",
      "Run episode 4152 with rewards -100.93434153616666 with 71 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 4153 with rewards -392.38514026809986 with 53 steps, done\n",
      "Run episode 4154 with rewards -603.4440373821565 with 80 steps, done\n",
      "Run episode 4155 with rewards -550.6976144096052 with 67 steps, done\n",
      "Run episode 4156 with rewards -653.7474509821193 with 99 steps, done\n",
      "Run episode 4157 with rewards -579.6234828357601 with 71 steps, done\n",
      "Run episode 4158 with rewards -763.8812378994063 with 73 steps, done\n",
      "Run episode 4159 with rewards -509.83954939969084 with 89 steps, done\n",
      "Run episode 4160 with rewards -520.5497282139119 with 67 steps, done\n",
      "Run episode 4161 with rewards -291.65734840691493 with 67 steps, done\n",
      "Run episode 4162 with rewards -445.6728626246833 with 52 steps, done\n",
      "Run episode 4163 with rewards -577.8381049947563 with 128 steps, done\n",
      "Run episode 4164 with rewards -548.6924067697067 with 70 steps, done\n",
      "Run episode 4165 with rewards -745.4756950144117 with 133 steps, done\n",
      "Run episode 4166 with rewards -253.1757036688397 with 82 steps, done\n",
      "Run episode 4167 with rewards -1123.4868886632764 with 155 steps, done\n",
      "Run episode 4168 with rewards -168.42427013124325 with 56 steps, done\n",
      "Run episode 4169 with rewards -1781.5295552078967 with 225 steps, done\n",
      "Run episode 4170 with rewards -197.13550591397234 with 71 steps, done\n",
      "Run episode 4171 with rewards -454.7567858319028 with 73 steps, done\n",
      "Run episode 4172 with rewards -94.96044033370559 with 101 steps, done\n",
      "Run episode 4173 with rewards -548.1501960998482 with 62 steps, done\n",
      "Run episode 4174 with rewards -169.55770226106347 with 95 steps, done\n",
      "Run episode 4175 with rewards -430.7269725758958 with 78 steps, done\n",
      "Run episode 4176 with rewards -152.10720998044343 with 63 steps, done\n",
      "Run episode 4177 with rewards -889.3987259149584 with 115 steps, done\n",
      "Run episode 4178 with rewards -127.93578938706878 with 85 steps, done\n",
      "Run episode 4179 with rewards -540.6168825366398 with 72 steps, done\n",
      "Run episode 4180 with rewards -32.44448339960445 with 83 steps, done\n",
      "Run episode 4181 with rewards -1345.2857639061433 with 183 steps, done\n",
      "Run episode 4182 with rewards -123.37424091610778 with 56 steps, done\n",
      "Run episode 4183 with rewards -543.557484146545 with 100 steps, done\n",
      "Run episode 4184 with rewards -151.05305075477162 with 83 steps, done\n",
      "Run episode 4185 with rewards -1850.1089429397186 with 235 steps, done\n",
      "Run episode 4186 with rewards -105.47153108320195 with 56 steps, done\n",
      "Run episode 4187 with rewards -527.4180972822028 with 90 steps, done\n",
      "Run episode 4188 with rewards -118.02473664541003 with 65 steps, done\n",
      "Run episode 4189 with rewards -572.2224941983917 with 88 steps, done\n",
      "Run episode 4190 with rewards -110.0461605490271 with 67 steps, done\n",
      "Run episode 4191 with rewards -1551.530325488559 with 209 steps, done\n",
      "Run episode 4192 with rewards -154.93657164003545 with 61 steps, done\n",
      "Run episode 4193 with rewards -579.6436741029697 with 79 steps, done\n",
      "Run episode 4194 with rewards -128.2723001814575 with 72 steps, done\n",
      "Run episode 4195 with rewards -757.9473703288663 with 125 steps, done\n",
      "Run episode 4196 with rewards -195.42490025678433 with 56 steps, done\n",
      "Run episode 4197 with rewards -575.0862630685021 with 79 steps, done\n",
      "Run episode 4198 with rewards -181.68790578361597 with 81 steps, done\n",
      "Run episode 4199 with rewards -625.4306747239665 with 98 steps, done\n",
      "Run episode 4200 with rewards -92.47154683224764 with 54 steps, done\n",
      "Run episode 4201 with rewards -160.0552976626794 with 63 steps, done\n",
      "Run episode 4202 with rewards -624.3099057674308 with 73 steps, done\n",
      "Run episode 4203 with rewards -576.2734960479124 with 88 steps, done\n",
      "Run episode 4204 with rewards -447.9689709136548 with 53 steps, done\n",
      "Run episode 4205 with rewards -273.26582751034607 with 114 steps, done\n",
      "Run episode 4206 with rewards -455.0889800434292 with 51 steps, done\n",
      "Run episode 4207 with rewards -333.14775626965775 with 61 steps, done\n",
      "Run episode 4208 with rewards -361.1218138006075 with 53 steps, done\n",
      "Run episode 4209 with rewards -648.3061677089639 with 117 steps, done\n",
      "Run episode 4210 with rewards -324.39990383827217 with 51 steps, done\n",
      "Run episode 4211 with rewards -207.88211060099945 with 73 steps, done\n",
      "Run episode 4212 with rewards -548.0077615232727 with 60 steps, done\n",
      "Run episode 4213 with rewards -232.4144428024954 with 75 steps, done\n",
      "Run episode 4214 with rewards -451.5572982992758 with 53 steps, done\n",
      "Run episode 4215 with rewards -194.54767247628797 with 63 steps, done\n",
      "Run episode 4216 with rewards -522.5420224559966 with 58 steps, done\n",
      "Run episode 4217 with rewards -124.96393950548932 with 53 steps, done\n",
      "Run episode 4218 with rewards -521.7558543637731 with 56 steps, done\n",
      "Run episode 4219 with rewards -576.2998042585693 with 87 steps, done\n",
      "Run episode 4220 with rewards -503.81512776112965 with 64 steps, done\n",
      "Run episode 4221 with rewards -316.1058398318238 with 89 steps, done\n",
      "Run episode 4222 with rewards -534.6977767834048 with 62 steps, done\n",
      "Run episode 4223 with rewards -566.7601746830981 with 95 steps, done\n",
      "Run episode 4224 with rewards -742.4466969789763 with 75 steps, done\n",
      "Run episode 4225 with rewards -812.5379286399675 with 77 steps, done\n",
      "Run episode 4226 with rewards -254.42429794703682 with 69 steps, done\n",
      "Run episode 4227 with rewards -866.9213631382993 with 84 steps, done\n",
      "Run episode 4228 with rewards -226.48452795241678 with 72 steps, done\n",
      "Run episode 4229 with rewards -442.6322721482623 with 57 steps, done\n",
      "Run episode 4230 with rewards -182.5504871056696 with 89 steps, done\n",
      "Run episode 4231 with rewards -320.25566145943196 with 51 steps, done\n",
      "Run episode 4232 with rewards -480.76615651572655 with 61 steps, done\n",
      "Run episode 4233 with rewards -492.94864420368094 with 112 steps, done\n",
      "Run episode 4234 with rewards -467.15544834310873 with 54 steps, done\n",
      "Run episode 4235 with rewards -481.5316155736354 with 91 steps, done\n",
      "Run episode 4236 with rewards -606.2494524897622 with 73 steps, done\n",
      "Run episode 4237 with rewards -762.1518235815639 with 74 steps, done\n",
      "Run episode 4238 with rewards -214.5922933494159 with 71 steps, done\n",
      "Run episode 4239 with rewards -480.9534223798947 with 55 steps, done\n",
      "Run episode 4240 with rewards -820.860995668752 with 126 steps, done\n",
      "Run episode 4241 with rewards -492.49055466625026 with 61 steps, done\n",
      "Run episode 4242 with rewards -572.213104623065 with 86 steps, done\n",
      "Run episode 4243 with rewards -596.4147540806198 with 70 steps, done\n",
      "Run episode 4244 with rewards -622.7922309375067 with 90 steps, done\n",
      "Run episode 4245 with rewards -546.770415658402 with 70 steps, done\n",
      "Run episode 4246 with rewards -90.42651827098365 with 54 steps, done\n",
      "Run episode 4247 with rewards -161.3208039279955 with 84 steps, done\n",
      "Run episode 4248 with rewards -974.1666800648852 with 86 steps, done\n",
      "Run episode 4249 with rewards -93.6884148127555 with 56 steps, done\n",
      "Run episode 4250 with rewards -300.1735947049706 with 88 steps, done\n",
      "Run episode 4251 with rewards -516.1994844264157 with 130 steps, done\n",
      "Run episode 4252 with rewards -157.37678102972532 with 86 steps, done\n",
      "Run episode 4253 with rewards -86.77451529724222 with 96 steps, done\n",
      "Run episode 4254 with rewards -369.92289792284197 with 57 steps, done\n",
      "Run episode 4255 with rewards -630.2242960423146 with 92 steps, done\n",
      "Run episode 4256 with rewards -770.0285623211621 with 85 steps, done\n",
      "Run episode 4257 with rewards -495.5410035106504 with 103 steps, done\n",
      "Run episode 4258 with rewards -325.76852789389665 with 52 steps, done\n",
      "Run episode 4259 with rewards -284.0048569981582 with 69 steps, done\n",
      "Run episode 4260 with rewards -552.6745046750026 with 96 steps, done\n",
      "Run episode 4261 with rewards -25.363420903990388 with 91 steps, done\n",
      "Run episode 4262 with rewards -668.9514802030307 with 73 steps, done\n",
      "Run episode 4263 with rewards -170.10334290480927 with 68 steps, done\n",
      "Run episode 4264 with rewards -563.7395634015788 with 70 steps, done\n",
      "Run episode 4265 with rewards -456.13268209039984 with 79 steps, done\n",
      "Run episode 4266 with rewards -476.5006473082172 with 53 steps, done\n",
      "Run episode 4267 with rewards -560.0258595357168 with 86 steps, done\n",
      "Run episode 4268 with rewards -1042.3337360755377 with 86 steps, done\n",
      "Run episode 4269 with rewards -530.0604354932984 with 67 steps, done\n",
      "Run episode 4270 with rewards -743.6223939588901 with 116 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 4271 with rewards -435.5982691564133 with 58 steps, done\n",
      "Run episode 4272 with rewards -106.04413548654657 with 61 steps, done\n",
      "Run episode 4273 with rewards -745.0049794019055 with 144 steps, done\n",
      "Run episode 4274 with rewards -117.77738281483332 with 57 steps, done\n",
      "Run episode 4275 with rewards -2544.113342086967 with 272 steps, done\n",
      "Run episode 4276 with rewards -170.71948324044854 with 77 steps, done\n",
      "Run episode 4277 with rewards -434.3078706503481 with 82 steps, done\n",
      "Run episode 4278 with rewards -113.15085990528377 with 79 steps, done\n",
      "Run episode 4279 with rewards -822.0289596198262 with 111 steps, done\n",
      "Run episode 4280 with rewards -124.97473712311061 with 84 steps, done\n",
      "Run episode 4281 with rewards -102.03558609935462 with 80 steps, done\n",
      "Run episode 4282 with rewards -766.2741002026605 with 75 steps, done\n",
      "Run episode 4283 with rewards -241.43328123353504 with 86 steps, done\n",
      "Run episode 4284 with rewards -536.015856067076 with 68 steps, done\n",
      "Run episode 4285 with rewards -611.3022527782065 with 101 steps, done\n",
      "Run episode 4286 with rewards -428.72310167100585 with 49 steps, done\n",
      "Run episode 4287 with rewards -432.9581158154957 with 60 steps, done\n",
      "Run episode 4288 with rewards -523.3844644509106 with 84 steps, done\n",
      "Run episode 4289 with rewards -801.811078144051 with 84 steps, done\n",
      "Run episode 4290 with rewards -1589.0701905200985 with 208 steps, done\n",
      "Run episode 4291 with rewards 2.056768580511587 with 87 steps, done\n",
      "Run episode 4292 with rewards -387.0834097887294 with 114 steps, done\n",
      "Run episode 4293 with rewards -495.6028321336038 with 70 steps, done\n",
      "Run episode 4294 with rewards -737.8743709933404 with 94 steps, done\n",
      "Run episode 4295 with rewards -188.87306145832827 with 60 steps, done\n",
      "Run episode 4296 with rewards -2137.7528526213273 with 291 steps, done\n",
      "Run episode 4297 with rewards -207.12923786239045 with 72 steps, done\n",
      "Run episode 4298 with rewards -701.6567460842233 with 128 steps, done\n",
      "Run episode 4299 with rewards -159.424770604248 with 78 steps, done\n",
      "Run episode 4300 with rewards -522.7168806349587 with 78 steps, done\n",
      "Run episode 4301 with rewards -252.1269947335117 with 90 steps, done\n",
      "Run episode 4302 with rewards -578.4272335308985 with 118 steps, done\n",
      "Run episode 4303 with rewards -188.92893326054633 with 61 steps, done\n",
      "Run episode 4304 with rewards -1048.1840846893738 with 169 steps, done\n",
      "Run episode 4305 with rewards -110.74315957280638 with 62 steps, done\n",
      "Run episode 4306 with rewards -1151.0291195812456 with 227 steps, done\n",
      "Run episode 4307 with rewards -529.3086243837195 with 59 steps, done\n",
      "Run episode 4308 with rewards -121.54636170081174 with 79 steps, done\n",
      "Run episode 4309 with rewards -462.6189338514771 with 76 steps, done\n",
      "Run episode 4310 with rewards -143.1507783034155 with 77 steps, done\n",
      "Run episode 4311 with rewards -1715.0361180919053 with 207 steps, done\n",
      "Run episode 4312 with rewards -1077.7129320470817 with 140 steps, done\n",
      "Run episode 4313 with rewards -112.16496215138298 with 54 steps, done\n",
      "Run episode 4314 with rewards -560.6155672022635 with 101 steps, done\n",
      "Run episode 4315 with rewards -3.2544022316763517 with 65 steps, done\n",
      "Run episode 4316 with rewards -516.2563165179102 with 65 steps, done\n",
      "Run episode 4317 with rewards -2611.424844334769 with 234 steps, done\n",
      "Run episode 4318 with rewards -674.132865932992 with 92 steps, done\n",
      "Run episode 4319 with rewards -2.2246937488395275 with 100 steps, done\n",
      "Run episode 4320 with rewards -1082.3239422320646 with 182 steps, done\n",
      "Run episode 4321 with rewards -123.34190908554538 with 52 steps, done\n",
      "Run episode 4322 with rewards -193.01928891246706 with 107 steps, done\n",
      "Run episode 4323 with rewards -81.52749947938858 with 53 steps, done\n",
      "Run episode 4324 with rewards -3728.939302547168 with 323 steps, done\n",
      "Run episode 4325 with rewards -529.5333363504211 with 68 steps, done\n",
      "Run episode 4326 with rewards -267.6660503506125 with 90 steps, done\n",
      "Run episode 4327 with rewards -386.5696567452504 with 52 steps, done\n",
      "Run episode 4328 with rewards -554.5275932904875 with 109 steps, done\n",
      "Run episode 4329 with rewards -1245.2900164318876 with 187 steps, done\n",
      "Run episode 4330 with rewards -363.76293156488197 with 53 steps, done\n",
      "Run episode 4331 with rewards -320.0715922391014 with 72 steps, done\n",
      "Run episode 4332 with rewards -536.846073825042 with 65 steps, done\n",
      "Run episode 4333 with rewards -762.5570955709434 with 111 steps, done\n",
      "Run episode 4334 with rewards -279.77706054765804 with 69 steps, done\n",
      "Run episode 4335 with rewards -161.09743007344485 with 67 steps, done\n",
      "Run episode 4336 with rewards -125.81745787816111 with 104 steps, done\n",
      "Run episode 4337 with rewards -177.81511142907829 with 72 steps, done\n",
      "Run episode 4338 with rewards -487.5242528148207 with 125 steps, done\n",
      "Run episode 4339 with rewards -172.7789736383796 with 75 steps, done\n",
      "Run episode 4340 with rewards -386.73167100339197 with 57 steps, done\n",
      "Run episode 4341 with rewards -36.813276589473645 with 112 steps, done\n",
      "Run episode 4342 with rewards -341.19051372774294 with 54 steps, done\n",
      "Run episode 4343 with rewards -251.9758937402473 with 73 steps, done\n",
      "Run episode 4344 with rewards -841.2853890721715 with 82 steps, done\n",
      "Run episode 4345 with rewards -562.077129030764 with 76 steps, done\n",
      "Run episode 4346 with rewards -390.8497829108477 with 103 steps, done\n",
      "Run episode 4347 with rewards -328.08378909119585 with 52 steps, done\n",
      "Run episode 4348 with rewards -109.60201052325111 with 84 steps, done\n",
      "Run episode 4349 with rewards -1222.7091160079933 with 168 steps, done\n",
      "Run episode 4350 with rewards -387.6403222198866 with 68 steps, done\n",
      "Run episode 4351 with rewards -290.20290180438235 with 110 steps, done\n",
      "Run episode 4352 with rewards -79.82900619782316 with 67 steps, done\n",
      "Run episode 4353 with rewards -384.75007539169525 with 86 steps, done\n",
      "Run episode 4354 with rewards -88.38296959897221 with 54 steps, done\n",
      "Run episode 4355 with rewards -128.24189265485268 with 104 steps, done\n",
      "Run episode 4356 with rewards -9.182918792411655 with 86 steps, done\n",
      "Run episode 4357 with rewards -417.5639880967736 with 82 steps, done\n",
      "Run episode 4358 with rewards -164.88163422123026 with 60 steps, done\n",
      "Run episode 4359 with rewards -637.730078873532 with 84 steps, done\n",
      "Run episode 4360 with rewards -128.6592891370694 with 88 steps, done\n",
      "Run episode 4361 with rewards -458.8764396778987 with 83 steps, done\n",
      "Run episode 4362 with rewards -118.55577426534991 with 72 steps, done\n",
      "Run episode 4363 with rewards -730.1508135627744 with 111 steps, done\n",
      "Run episode 4364 with rewards -469.7200929946159 with 53 steps, done\n",
      "Run episode 4365 with rewards -287.60794093174 with 97 steps, done\n",
      "Run episode 4366 with rewards -225.00613902875762 with 60 steps, done\n",
      "Run episode 4367 with rewards -630.9940124241607 with 75 steps, done\n",
      "Run episode 4368 with rewards -130.43236837659583 with 55 steps, done\n",
      "Run episode 4369 with rewards -809.2357467669223 with 114 steps, done\n",
      "Run episode 4370 with rewards -469.7641797664065 with 55 steps, done\n",
      "Run episode 4371 with rewards -383.82392032638165 with 126 steps, done\n",
      "Run episode 4372 with rewards -415.73935794117114 with 55 steps, done\n",
      "Run episode 4373 with rewards -531.96589679664 with 82 steps, done\n",
      "Run episode 4374 with rewards -534.6534255771817 with 56 steps, done\n",
      "Run episode 4375 with rewards -318.04298503940686 with 74 steps, done\n",
      "Run episode 4376 with rewards -653.5129754898268 with 70 steps, done\n",
      "Run episode 4377 with rewards -590.0239285011961 with 116 steps, done\n",
      "Run episode 4378 with rewards -782.8680566803231 with 82 steps, done\n",
      "Run episode 4379 with rewards -586.504909970671 with 63 steps, done\n",
      "Run episode 4380 with rewards -597.3126779246473 with 120 steps, done\n",
      "Run episode 4381 with rewards -534.1347759116891 with 58 steps, done\n",
      "Run episode 4382 with rewards -667.7505076282812 with 117 steps, done\n",
      "Run episode 4383 with rewards -434.86799541131234 with 71 steps, done\n",
      "Run episode 4384 with rewards -660.5878360846499 with 103 steps, done\n",
      "Run episode 4385 with rewards -550.927568231811 with 74 steps, done\n",
      "Run episode 4386 with rewards -678.8204084975437 with 96 steps, done\n",
      "Run episode 4387 with rewards -254.84490219504954 with 77 steps, done\n",
      "Run episode 4388 with rewards -920.0450835521018 with 140 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 4389 with rewards -112.60823761616246 with 69 steps, done\n",
      "Run episode 4390 with rewards -652.3242019285866 with 83 steps, done\n",
      "Run episode 4391 with rewards -150.44194870969446 with 64 steps, done\n",
      "Run episode 4392 with rewards -31.6570623914823 with 84 steps, done\n",
      "Run episode 4393 with rewards -152.03791663649508 with 74 steps, done\n",
      "Run episode 4394 with rewards -141.37133700570627 with 123 steps, done\n",
      "Run episode 4395 with rewards -392.90348043808683 with 202 steps, done\n",
      "Run episode 4396 with rewards -411.87005424730137 with 89 steps, done\n",
      "Run episode 4397 with rewards -110.24126818553475 with 51 steps, done\n",
      "Run episode 4398 with rewards -455.8202392873597 with 51 steps, done\n",
      "Run episode 4399 with rewards -582.6865596313968 with 92 steps, done\n",
      "Run episode 4400 with rewards -901.2617423184622 with 83 steps, done\n",
      "Run episode 4401 with rewards -506.15006245745155 with 63 steps, done\n",
      "Run episode 4402 with rewards -328.86666981347344 with 53 steps, done\n",
      "Run episode 4403 with rewards -623.0206176341941 with 91 steps, done\n",
      "Run episode 4404 with rewards -130.65380606727243 with 54 steps, done\n",
      "Run episode 4405 with rewards -569.5507442820962 with 60 steps, done\n",
      "Run episode 4406 with rewards -469.9545828245216 with 77 steps, done\n",
      "Run episode 4407 with rewards -410.7093522397156 with 54 steps, done\n",
      "Run episode 4408 with rewards -1633.3719160568103 with 202 steps, done\n",
      "Run episode 4409 with rewards -133.85936525071014 with 62 steps, done\n",
      "Run episode 4410 with rewards -434.95346082920014 with 77 steps, done\n",
      "Run episode 4411 with rewards -155.15164300282714 with 69 steps, done\n",
      "Run episode 4412 with rewards -639.4949478779737 with 76 steps, done\n",
      "Run episode 4413 with rewards -177.17621034254046 with 55 steps, done\n",
      "Run episode 4414 with rewards -705.8748944508976 with 117 steps, done\n",
      "Run episode 4415 with rewards -178.23523570783925 with 65 steps, done\n",
      "Run episode 4416 with rewards -89.17170443603425 with 84 steps, done\n",
      "Run episode 4417 with rewards -164.22096452212355 with 77 steps, done\n",
      "Run episode 4418 with rewards -149.46124612461182 with 95 steps, done\n",
      "Run episode 4419 with rewards -280.65842854230107 with 85 steps, done\n",
      "Run episode 4420 with rewards -376.908280444918 with 53 steps, done\n",
      "Run episode 4421 with rewards -119.80640873961136 with 60 steps, done\n",
      "Run episode 4422 with rewards -233.85686848906053 with 121 steps, done\n",
      "Run episode 4423 with rewards -133.88282304008297 with 74 steps, done\n",
      "Run episode 4424 with rewards -106.67188731594855 with 65 steps, done\n",
      "Run episode 4425 with rewards -125.42909658619641 with 68 steps, done\n",
      "Run episode 4426 with rewards -152.35053070580145 with 136 steps, done\n",
      "Run episode 4427 with rewards -155.99151344777957 with 83 steps, done\n",
      "Run episode 4428 with rewards -496.8686851516552 with 69 steps, done\n",
      "Run episode 4429 with rewards -567.6365035050711 with 95 steps, done\n",
      "Run episode 4430 with rewards -448.0451998804889 with 55 steps, done\n",
      "Run episode 4431 with rewards -197.30847689249427 with 90 steps, done\n",
      "Run episode 4432 with rewards -692.1252078670764 with 69 steps, done\n",
      "Run episode 4433 with rewards -97.9719676239643 with 57 steps, done\n",
      "Run episode 4434 with rewards -616.3748048098095 with 72 steps, done\n",
      "Run episode 4435 with rewards -588.8353788384762 with 84 steps, done\n",
      "Run episode 4436 with rewards -504.0871912090294 with 55 steps, done\n",
      "Run episode 4437 with rewards -311.9834411362083 with 80 steps, done\n",
      "Run episode 4438 with rewards -519.4243609836948 with 64 steps, done\n",
      "Run episode 4439 with rewards -559.9746735932692 with 108 steps, done\n",
      "Run episode 4440 with rewards -124.92095139388431 with 74 steps, done\n",
      "Run episode 4441 with rewards -302.26110449499095 with 80 steps, done\n",
      "Run episode 4442 with rewards -93.58305922335032 with 85 steps, done\n",
      "Run episode 4443 with rewards -406.8685482227528 with 113 steps, done\n",
      "Run episode 4444 with rewards -155.28609240180964 with 81 steps, done\n",
      "Run episode 4445 with rewards -221.98612400203035 with 111 steps, done\n",
      "Run episode 4446 with rewards -121.47834064745187 with 71 steps, done\n",
      "Run episode 4447 with rewards -167.83175584913573 with 75 steps, done\n",
      "Run episode 4448 with rewards -426.2478143508368 with 79 steps, done\n",
      "Run episode 4449 with rewards -192.9466460361182 with 79 steps, done\n",
      "Run episode 4450 with rewards -90.62476183406558 with 90 steps, done\n",
      "Run episode 4451 with rewards -160.19504782953805 with 89 steps, done\n",
      "Run episode 4452 with rewards -107.48558432976951 with 82 steps, done\n",
      "Run episode 4453 with rewards -181.4430950881669 with 64 steps, done\n",
      "Run episode 4454 with rewards -734.3061224593772 with 93 steps, done\n",
      "Run episode 4455 with rewards -203.0624770241569 with 79 steps, done\n",
      "Run episode 4456 with rewards -65.7194194476902 with 95 steps, done\n",
      "Run episode 4457 with rewards 3.0884757656139072 with 94 steps, done\n",
      "Run episode 4458 with rewards -547.5996901522403 with 119 steps, done\n",
      "Run episode 4459 with rewards -777.9185905924859 with 79 steps, done\n",
      "Run episode 4460 with rewards -481.30593367672105 with 97 steps, done\n",
      "Run episode 4461 with rewards -827.6644562972925 with 78 steps, done\n",
      "Run episode 4462 with rewards -1163.1163836253913 with 105 steps, done\n",
      "Run episode 4463 with rewards -542.0565191293045 with 71 steps, done\n",
      "Run episode 4464 with rewards -573.5761383921342 with 112 steps, done\n",
      "Run episode 4465 with rewards -526.1493458165269 with 64 steps, done\n",
      "Run episode 4466 with rewards -667.7653334431417 with 103 steps, done\n",
      "Run episode 4467 with rewards -401.66423141264676 with 52 steps, done\n",
      "Run episode 4468 with rewards -361.23103019163625 with 89 steps, done\n",
      "Run episode 4469 with rewards -730.8705440643539 with 74 steps, done\n",
      "Run episode 4470 with rewards -507.889534149227 with 96 steps, done\n",
      "Run episode 4471 with rewards -436.8642837071636 with 52 steps, done\n",
      "Run episode 4472 with rewards -553.6222882510374 with 83 steps, done\n",
      "Run episode 4473 with rewards -557.0569603113589 with 61 steps, done\n",
      "Run episode 4474 with rewards -522.7705189227744 with 84 steps, done\n",
      "Run episode 4475 with rewards -457.4548992267368 with 60 steps, done\n",
      "Run episode 4476 with rewards -323.64527380422567 with 80 steps, done\n",
      "Run episode 4477 with rewards -640.2957724188243 with 83 steps, done\n",
      "Run episode 4478 with rewards -385.4826787551791 with 73 steps, done\n",
      "Run episode 4479 with rewards -124.2622134486628 with 60 steps, done\n",
      "Run episode 4480 with rewards -879.8577426454642 with 90 steps, done\n",
      "Run episode 4481 with rewards -160.90294923374643 with 91 steps, done\n",
      "Run episode 4482 with rewards -296.9509160157976 with 76 steps, done\n",
      "Run episode 4483 with rewards -194.50130718955566 with 169 steps, done\n",
      "Run episode 4484 with rewards -664.4435092439055 with 72 steps, done\n",
      "Run episode 4485 with rewards -330.8193157389717 with 76 steps, done\n",
      "Run episode 4486 with rewards -539.7703221153611 with 61 steps, done\n",
      "Run episode 4487 with rewards -271.0124890472649 with 55 steps, done\n",
      "Run episode 4488 with rewards -373.2273628680462 with 50 steps, done\n",
      "Run episode 4489 with rewards -447.5070185749847 with 71 steps, done\n",
      "Run episode 4490 with rewards -494.6454126232893 with 59 steps, done\n",
      "Run episode 4491 with rewards -613.5798690940101 with 77 steps, done\n",
      "Run episode 4492 with rewards -444.67518687176425 with 59 steps, done\n",
      "Run episode 4493 with rewards -223.12587171124787 with 73 steps, done\n",
      "Run episode 4494 with rewards -819.5609238758321 with 86 steps, done\n",
      "Run episode 4495 with rewards -669.8705177085649 with 117 steps, done\n",
      "Run episode 4496 with rewards -174.98829359904238 with 64 steps, done\n",
      "Run episode 4497 with rewards -1803.198670341363 with 208 steps, done\n",
      "Run episode 4498 with rewards -141.53943021086863 with 89 steps, done\n",
      "Run episode 4499 with rewards -468.2323074755792 with 72 steps, done\n",
      "Run episode 4500 with rewards -17.186087463039996 with 115 steps, done\n",
      "Run episode 4501 with rewards -623.3085370133301 with 71 steps, done\n",
      "Run episode 4502 with rewards -630.9155657364114 with 67 steps, done\n",
      "Run episode 4503 with rewards -188.30765656868158 with 67 steps, done\n",
      "Run episode 4504 with rewards -434.7475831519437 with 69 steps, done\n",
      "Run episode 4505 with rewards -625.9398378647454 with 86 steps, done\n",
      "Run episode 4506 with rewards -457.63344942577515 with 72 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 4507 with rewards -135.9399866101057 with 63 steps, done\n",
      "Run episode 4508 with rewards -19.17260949175764 with 80 steps, done\n",
      "Run episode 4509 with rewards -2446.3161113039196 with 296 steps, done\n",
      "Run episode 4510 with rewards -134.62954178870115 with 68 steps, done\n",
      "Run episode 4511 with rewards -485.7701093517168 with 84 steps, done\n",
      "Run episode 4512 with rewards -307.52100664069724 with 86 steps, done\n",
      "Run episode 4513 with rewards -581.1595205694073 with 90 steps, done\n",
      "Run episode 4514 with rewards -357.1144197738736 with 89 steps, done\n",
      "Run episode 4515 with rewards -462.28985851693943 with 121 steps, done\n",
      "Run episode 4516 with rewards -124.81848198885962 with 62 steps, done\n",
      "Run episode 4517 with rewards -519.7232606945078 with 76 steps, done\n",
      "Run episode 4518 with rewards -516.5840113540966 with 70 steps, done\n",
      "Run episode 4519 with rewards -436.8487745116047 with 81 steps, done\n",
      "Run episode 4520 with rewards -588.5598859161507 with 71 steps, done\n",
      "Run episode 4521 with rewards -430.44996148788294 with 78 steps, done\n",
      "Run episode 4522 with rewards -1057.0968602366456 with 91 steps, done\n",
      "Run episode 4523 with rewards -601.8914463281073 with 97 steps, done\n",
      "Run episode 4524 with rewards -654.2500581440896 with 74 steps, done\n",
      "Run episode 4525 with rewards -547.2453040769026 with 90 steps, done\n",
      "Run episode 4526 with rewards -764.7858422557923 with 75 steps, done\n",
      "Run episode 4527 with rewards -518.6948317332158 with 93 steps, done\n",
      "Run episode 4528 with rewards -496.8635796053904 with 57 steps, done\n",
      "Run episode 4529 with rewards -534.898335734699 with 58 steps, done\n",
      "Run episode 4530 with rewards -356.94094671253606 with 94 steps, done\n",
      "Run episode 4531 with rewards -475.4167990130355 with 56 steps, done\n",
      "Run episode 4532 with rewards -530.2809862369368 with 78 steps, done\n",
      "Run episode 4533 with rewards -518.7170761593225 with 66 steps, done\n",
      "Run episode 4534 with rewards -658.1579281713313 with 123 steps, done\n",
      "Run episode 4535 with rewards -478.93659611399414 with 70 steps, done\n",
      "Run episode 4536 with rewards -595.7895440610721 with 91 steps, done\n",
      "Run episode 4537 with rewards -300.47718011377424 with 74 steps, done\n",
      "Run episode 4538 with rewards -837.3218530619956 with 88 steps, done\n",
      "Run episode 4539 with rewards -569.0717554366037 with 59 steps, done\n",
      "Run episode 4540 with rewards -448.2442300413541 with 54 steps, done\n",
      "Run episode 4541 with rewards -619.7002601780201 with 67 steps, done\n",
      "Run episode 4542 with rewards -570.0016450611813 with 79 steps, done\n",
      "Run episode 4543 with rewards -476.4320745752318 with 55 steps, done\n",
      "Run episode 4544 with rewards -549.617623292519 with 84 steps, done\n",
      "Run episode 4545 with rewards -449.19885696052916 with 85 steps, done\n",
      "Run episode 4546 with rewards -468.8996208071845 with 96 steps, done\n",
      "Run episode 4547 with rewards -712.9251388474461 with 87 steps, done\n",
      "Run episode 4548 with rewards -566.1399372152846 with 82 steps, done\n",
      "Run episode 4549 with rewards -308.08656322157003 with 88 steps, done\n",
      "Run episode 4550 with rewards -186.03107882972654 with 59 steps, done\n",
      "Run episode 4551 with rewards -142.2405730971368 with 62 steps, done\n",
      "Run episode 4552 with rewards -495.2968346251099 with 71 steps, done\n",
      "Run episode 4553 with rewards -626.4633782268523 with 102 steps, done\n",
      "Run episode 4554 with rewards -739.8144772477576 with 74 steps, done\n",
      "Run episode 4555 with rewards -174.5798806482885 with 73 steps, done\n",
      "Run episode 4556 with rewards -426.21731890431346 with 56 steps, done\n",
      "Run episode 4557 with rewards -277.4844293462358 with 76 steps, done\n",
      "Run episode 4558 with rewards -713.2796588856278 with 70 steps, done\n",
      "Run episode 4559 with rewards -566.2399697124097 with 63 steps, done\n",
      "Run episode 4560 with rewards -464.52764550686 with 70 steps, done\n",
      "Run episode 4561 with rewards -459.81068375107895 with 61 steps, done\n",
      "Run episode 4562 with rewards -809.5266730645922 with 114 steps, done\n",
      "Run episode 4563 with rewards -832.4159346272418 with 86 steps, done\n",
      "Run episode 4564 with rewards -383.7836277361933 with 76 steps, done\n",
      "Run episode 4565 with rewards -969.4159157179157 with 89 steps, done\n",
      "Run episode 4566 with rewards -311.0925674588839 with 85 steps, done\n",
      "Run episode 4567 with rewards -885.1480656622883 with 81 steps, done\n",
      "Run episode 4568 with rewards -603.3084611415403 with 85 steps, done\n",
      "Run episode 4569 with rewards -509.44995227530984 with 64 steps, done\n",
      "Run episode 4570 with rewards -459.5042836541791 with 55 steps, done\n",
      "Run episode 4571 with rewards -387.61384741308063 with 74 steps, done\n",
      "Run episode 4572 with rewards -482.4268933762623 with 58 steps, done\n",
      "Run episode 4573 with rewards -117.97029760068537 with 63 steps, done\n",
      "Run episode 4574 with rewards -449.0975410892984 with 52 steps, done\n",
      "Run episode 4575 with rewards -350.82856513039155 with 63 steps, done\n",
      "Run episode 4576 with rewards -329.7317418594214 with 97 steps, done\n",
      "Run episode 4577 with rewards -503.3221281289588 with 56 steps, done\n",
      "Run episode 4578 with rewards -1301.393984335805 with 212 steps, done\n",
      "Run episode 4579 with rewards -745.5698971426712 with 88 steps, done\n",
      "Run episode 4580 with rewards -151.93510560355236 with 91 steps, done\n",
      "Run episode 4581 with rewards -325.6985254505594 with 51 steps, done\n",
      "Run episode 4582 with rewards -399.47506387493524 with 86 steps, done\n",
      "Run episode 4583 with rewards -490.7555093435675 with 54 steps, done\n",
      "Run episode 4584 with rewards -149.32886106075205 with 58 steps, done\n",
      "Run episode 4585 with rewards -230.7708986912455 with 115 steps, done\n",
      "Run episode 4586 with rewards -26.269167550870833 with 61 steps, done\n",
      "Run episode 4587 with rewards -524.8968148737113 with 91 steps, done\n",
      "Run episode 4588 with rewards -395.98469852495316 with 55 steps, done\n",
      "Run episode 4589 with rewards -497.8505351564753 with 125 steps, done\n",
      "Run episode 4590 with rewards -114.57247449557781 with 60 steps, done\n",
      "Run episode 4591 with rewards -156.90059787139074 with 71 steps, done\n",
      "Run episode 4592 with rewards -348.591840905667 with 90 steps, done\n",
      "Run episode 4593 with rewards -637.9974995134917 with 65 steps, done\n",
      "Run episode 4594 with rewards -291.6114866559451 with 82 steps, done\n",
      "Run episode 4595 with rewards -527.1480719845349 with 61 steps, done\n",
      "Run episode 4596 with rewards -733.2087283690732 with 116 steps, done\n",
      "Run episode 4597 with rewards -349.38917580146665 with 53 steps, done\n",
      "Run episode 4598 with rewards -710.6259517574371 with 103 steps, done\n",
      "Run episode 4599 with rewards -446.8569375460987 with 76 steps, done\n",
      "Run episode 4600 with rewards -462.31788296117384 with 60 steps, done\n",
      "Run episode 4601 with rewards -470.44440423240343 with 71 steps, done\n",
      "Run episode 4602 with rewards -552.092342038992 with 68 steps, done\n",
      "Run episode 4603 with rewards -263.0168031361692 with 86 steps, done\n",
      "Run episode 4604 with rewards -693.6399068194071 with 103 steps, done\n",
      "Run episode 4605 with rewards -351.3690041931246 with 59 steps, done\n",
      "Run episode 4606 with rewards -523.6888932626732 with 67 steps, done\n",
      "Run episode 4607 with rewards -338.5745493444382 with 84 steps, done\n",
      "Run episode 4608 with rewards -550.3336541307526 with 70 steps, done\n",
      "Run episode 4609 with rewards -598.6059330855848 with 101 steps, done\n",
      "Run episode 4610 with rewards -600.3074919555854 with 65 steps, done\n",
      "Run episode 4611 with rewards -886.6970570065566 with 135 steps, done\n",
      "Run episode 4612 with rewards -95.33903372811935 with 51 steps, done\n",
      "Run episode 4613 with rewards -735.7537594463437 with 105 steps, done\n",
      "Run episode 4614 with rewards -93.53635021781986 with 90 steps, done\n",
      "Run episode 4615 with rewards -877.0255374732321 with 120 steps, done\n",
      "Run episode 4616 with rewards -133.33589278889673 with 55 steps, done\n",
      "Run episode 4617 with rewards -345.14637901877325 with 84 steps, done\n",
      "Run episode 4618 with rewards -147.49038325339492 with 64 steps, done\n",
      "Run episode 4619 with rewards -458.9614827294253 with 78 steps, done\n",
      "Run episode 4620 with rewards -114.6682408945201 with 54 steps, done\n",
      "Run episode 4621 with rewards -596.4180523774025 with 120 steps, done\n",
      "Run episode 4622 with rewards -183.84726256083997 with 83 steps, done\n",
      "Run episode 4623 with rewards -504.44052165594917 with 81 steps, done\n",
      "Run episode 4624 with rewards -87.51920901268701 with 91 steps, done\n",
      "Run episode 4625 with rewards -616.2944287825287 with 80 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 4626 with rewards -424.06127668836416 with 94 steps, done\n",
      "Run episode 4627 with rewards -52.47427646117082 with 162 steps, done\n",
      "Run episode 4628 with rewards -441.33176040625887 with 79 steps, done\n",
      "Run episode 4629 with rewards -805.4557248166315 with 84 steps, done\n",
      "Run episode 4630 with rewards -248.27221515514506 with 57 steps, done\n",
      "Run episode 4631 with rewards -551.5249265215195 with 84 steps, done\n",
      "Run episode 4632 with rewards -155.97745774460407 with 76 steps, done\n",
      "Run episode 4633 with rewards -475.2964164849338 with 59 steps, done\n",
      "Run episode 4634 with rewards -365.71490966623185 with 61 steps, done\n",
      "Run episode 4635 with rewards -751.1344572136198 with 85 steps, done\n",
      "Run episode 4636 with rewards -429.96087274429215 with 90 steps, done\n",
      "Run episode 4637 with rewards -1071.7360944542247 with 142 steps, done\n",
      "Run episode 4638 with rewards -547.9413960507516 with 67 steps, done\n",
      "Run episode 4639 with rewards -329.5218052381912 with 50 steps, done\n",
      "Run episode 4640 with rewards -161.58876361799696 with 72 steps, done\n",
      "Run episode 4641 with rewards -476.66968656954896 with 56 steps, done\n",
      "Run episode 4642 with rewards -139.4817046655826 with 66 steps, done\n",
      "Run episode 4643 with rewards -1362.2250796825533 with 175 steps, done\n",
      "Run episode 4644 with rewards -141.12592794519756 with 73 steps, done\n",
      "Run episode 4645 with rewards -556.0673514810126 with 75 steps, done\n",
      "Run episode 4646 with rewards -106.62098327406883 with 60 steps, done\n",
      "Run episode 4647 with rewards -529.5541381964099 with 72 steps, done\n",
      "Run episode 4648 with rewards -200.51490729574573 with 77 steps, done\n",
      "Run episode 4649 with rewards -789.072635027664 with 131 steps, done\n",
      "Run episode 4650 with rewards -131.81033356959924 with 75 steps, done\n",
      "Run episode 4651 with rewards -730.3157031873491 with 130 steps, done\n",
      "Run episode 4652 with rewards -142.33222054677327 with 76 steps, done\n",
      "Run episode 4653 with rewards -771.7919582410408 with 113 steps, done\n",
      "Run episode 4654 with rewards -141.40676952367534 with 61 steps, done\n",
      "Run episode 4655 with rewards -1028.4030031835396 with 148 steps, done\n",
      "Run episode 4656 with rewards -204.4395953970533 with 98 steps, done\n",
      "Run episode 4657 with rewards -115.36283300929993 with 60 steps, done\n",
      "Run episode 4658 with rewards -94.37839349462584 with 59 steps, done\n",
      "Run episode 4659 with rewards -638.87895167907 with 67 steps, done\n",
      "Run episode 4660 with rewards -639.9839257348041 with 97 steps, done\n",
      "Run episode 4661 with rewards -531.642528379255 with 68 steps, done\n",
      "Run episode 4662 with rewards -426.3420712475801 with 94 steps, done\n",
      "Run episode 4663 with rewards -767.5625261933977 with 84 steps, done\n",
      "Run episode 4664 with rewards -541.2506850218225 with 73 steps, done\n",
      "Run episode 4665 with rewards -567.9989446247935 with 90 steps, done\n",
      "Run episode 4666 with rewards -204.91613942436405 with 54 steps, done\n",
      "Run episode 4667 with rewards -468.0353209779217 with 77 steps, done\n",
      "Run episode 4668 with rewards -603.2856961730265 with 72 steps, done\n",
      "Run episode 4669 with rewards -542.4796730491287 with 60 steps, done\n",
      "Run episode 4670 with rewards -625.935224661989 with 89 steps, done\n",
      "Run episode 4671 with rewards -512.984594904953 with 62 steps, done\n",
      "Run episode 4672 with rewards -119.26250101080348 with 66 steps, done\n",
      "Run episode 4673 with rewards -424.5509465761171 with 109 steps, done\n",
      "Run episode 4674 with rewards -100.95394073238197 with 59 steps, done\n",
      "Run episode 4675 with rewards -98.49680722910146 with 113 steps, done\n",
      "Run episode 4676 with rewards -46.853584955605115 with 78 steps, done\n",
      "Run episode 4677 with rewards -450.06999092142075 with 60 steps, done\n",
      "Run episode 4678 with rewards -119.05136198085555 with 59 steps, done\n",
      "Run episode 4679 with rewards -232.28947050820437 with 88 steps, done\n",
      "Run episode 4680 with rewards -125.0728175158325 with 73 steps, done\n",
      "Run episode 4681 with rewards -89.4687076474207 with 71 steps, done\n",
      "Run episode 4682 with rewards -118.34432170922435 with 58 steps, done\n",
      "Run episode 4683 with rewards -455.9654903306037 with 82 steps, done\n",
      "Run episode 4684 with rewards -309.3916548295206 with 88 steps, done\n",
      "Run episode 4685 with rewards -1408.134033542214 with 179 steps, done\n",
      "Run episode 4686 with rewards -126.94717636258098 with 81 steps, done\n",
      "Run episode 4687 with rewards -419.8621857377624 with 94 steps, done\n",
      "Run episode 4688 with rewards -303.3609322096687 with 97 steps, done\n",
      "Run episode 4689 with rewards -418.014769679185 with 76 steps, done\n",
      "Run episode 4690 with rewards -136.07067613759557 with 71 steps, done\n",
      "Run episode 4691 with rewards -470.28927619813373 with 82 steps, done\n",
      "Run episode 4692 with rewards -138.52783728025668 with 65 steps, done\n",
      "Run episode 4693 with rewards -646.7631384812565 with 134 steps, done\n",
      "Run episode 4694 with rewards -726.6270935354294 with 79 steps, done\n",
      "Run episode 4695 with rewards -126.04799005013459 with 79 steps, done\n",
      "Run episode 4696 with rewards -22.555180069516553 with 133 steps, done\n",
      "Run episode 4697 with rewards -56.0292307819492 with 202 steps, done\n",
      "Run episode 4698 with rewards -2154.4949125961093 with 231 steps, done\n",
      "Run episode 4699 with rewards -112.2695493237635 with 68 steps, done\n",
      "Run episode 4700 with rewards -1294.6804191579367 with 167 steps, done\n",
      "Run episode 4701 with rewards -139.58656321422018 with 53 steps, done\n",
      "Run episode 4702 with rewards -732.7409104040295 with 107 steps, done\n",
      "Run episode 4703 with rewards -147.31733757439656 with 67 steps, done\n",
      "Run episode 4704 with rewards -466.3534667671179 with 85 steps, done\n",
      "Run episode 4705 with rewards -126.40689522838487 with 74 steps, done\n",
      "Run episode 4706 with rewards -902.9968994865291 with 168 steps, done\n",
      "Run episode 4707 with rewards -123.31581947119473 with 70 steps, done\n",
      "Run episode 4708 with rewards -505.6534753553987 with 57 steps, done\n",
      "Run episode 4709 with rewards -353.38185645286313 with 110 steps, done\n",
      "Run episode 4710 with rewards -502.9694227685253 with 58 steps, done\n",
      "Run episode 4711 with rewards -387.7439855517168 with 105 steps, done\n",
      "Run episode 4712 with rewards -531.6456138520222 with 71 steps, done\n",
      "Run episode 4713 with rewards -491.6637012875379 with 60 steps, done\n",
      "Run episode 4714 with rewards -498.1375557284515 with 85 steps, done\n",
      "Run episode 4715 with rewards -476.1474425218289 with 68 steps, done\n",
      "Run episode 4716 with rewards -764.7179741833017 with 75 steps, done\n",
      "Run episode 4717 with rewards -194.27471044626193 with 70 steps, done\n",
      "Run episode 4718 with rewards -511.5759813211985 with 65 steps, done\n",
      "Run episode 4719 with rewards -406.42432454023765 with 74 steps, done\n",
      "Run episode 4720 with rewards -513.5686112856497 with 57 steps, done\n",
      "Run episode 4721 with rewards -351.64490435863723 with 71 steps, done\n",
      "Run episode 4722 with rewards -383.3809221650499 with 55 steps, done\n",
      "Run episode 4723 with rewards -464.5063104701341 with 82 steps, done\n",
      "Run episode 4724 with rewards -383.8550660342013 with 53 steps, done\n",
      "Run episode 4725 with rewards -280.07340503463587 with 99 steps, done\n",
      "Run episode 4726 with rewards -685.5291727114105 with 76 steps, done\n",
      "Run episode 4727 with rewards -154.44996908431207 with 70 steps, done\n",
      "Run episode 4728 with rewards -387.7725177534992 with 50 steps, done\n",
      "Run episode 4729 with rewards -631.8349731599848 with 101 steps, done\n",
      "Run episode 4730 with rewards -1238.0416165451797 with 132 steps, done\n",
      "Run episode 4731 with rewards -836.4430279959598 with 86 steps, done\n",
      "Run episode 4732 with rewards -316.92575430726663 with 92 steps, done\n",
      "Run episode 4733 with rewards -367.776307932991 with 81 steps, done\n",
      "Run episode 4734 with rewards -206.09739944801487 with 124 steps, done\n",
      "Run episode 4735 with rewards -474.5854617719388 with 81 steps, done\n",
      "Run episode 4736 with rewards -280.4302206970535 with 80 steps, done\n",
      "Run episode 4737 with rewards -431.6937322328691 with 82 steps, done\n",
      "Run episode 4738 with rewards -618.2209504647255 with 73 steps, done\n",
      "Run episode 4739 with rewards -110.92701560537205 with 79 steps, done\n",
      "Run episode 4740 with rewards -593.4226175408558 with 103 steps, done\n",
      "Run episode 4741 with rewards -400.3169047814544 with 54 steps, done\n",
      "Run episode 4742 with rewards -494.9563161279662 with 84 steps, done\n",
      "Run episode 4743 with rewards -651.5377352413345 with 66 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 4744 with rewards -478.572403698442 with 88 steps, done\n",
      "Run episode 4745 with rewards -553.9000190491461 with 61 steps, done\n",
      "Run episode 4746 with rewards -293.471136535229 with 63 steps, done\n",
      "Run episode 4747 with rewards -412.7950197348316 with 49 steps, done\n",
      "Run episode 4748 with rewards -619.3261380195825 with 88 steps, done\n",
      "Run episode 4749 with rewards -563.6590146576784 with 71 steps, done\n",
      "Run episode 4750 with rewards -665.942566338734 with 99 steps, done\n",
      "Run episode 4751 with rewards -412.438893593443 with 58 steps, done\n",
      "Run episode 4752 with rewards -270.9196618634128 with 107 steps, done\n",
      "Run episode 4753 with rewards -606.8203574052473 with 81 steps, done\n",
      "Run episode 4754 with rewards -706.8313248530769 with 73 steps, done\n",
      "Run episode 4755 with rewards -229.60356389196176 with 93 steps, done\n",
      "Run episode 4756 with rewards -564.8102375492865 with 61 steps, done\n",
      "Run episode 4757 with rewards -418.750260129112 with 70 steps, done\n",
      "Run episode 4758 with rewards -792.4018016491301 with 77 steps, done\n",
      "Run episode 4759 with rewards -408.4274115533507 with 91 steps, done\n",
      "Run episode 4760 with rewards -773.6864949972437 with 80 steps, done\n",
      "Run episode 4761 with rewards -510.0797755951701 with 76 steps, done\n",
      "Run episode 4762 with rewards -379.3379549108971 with 52 steps, done\n",
      "Run episode 4763 with rewards -521.5712267743527 with 88 steps, done\n",
      "Run episode 4764 with rewards -666.8444016196129 with 87 steps, done\n",
      "Run episode 4765 with rewards -381.3007589998946 with 92 steps, done\n",
      "Run episode 4766 with rewards -1023.1190075776143 with 115 steps, done\n",
      "Run episode 4767 with rewards -572.2734050224759 with 62 steps, done\n",
      "Run episode 4768 with rewards -246.03930193369786 with 73 steps, done\n",
      "Run episode 4769 with rewards -954.1313311823282 with 103 steps, done\n",
      "Run episode 4770 with rewards -26.87627482513544 with 91 steps, done\n",
      "Run episode 4771 with rewards -132.39585530933948 with 54 steps, done\n",
      "Run episode 4772 with rewards -145.50341742945614 with 68 steps, done\n",
      "Run episode 4773 with rewards -200.62635397215791 with 72 steps, done\n",
      "Run episode 4774 with rewards -81.56312267899546 with 84 steps, done\n",
      "Run episode 4775 with rewards -993.9371748656316 with 87 steps, done\n",
      "Run episode 4776 with rewards -1014.8455601637047 with 87 steps, done\n",
      "Run episode 4777 with rewards -793.612032909617 with 84 steps, done\n",
      "Run episode 4778 with rewards -495.940196438227 with 62 steps, done\n",
      "Run episode 4779 with rewards -285.8058407763818 with 85 steps, done\n",
      "Run episode 4780 with rewards -528.3686509032041 with 66 steps, done\n",
      "Run episode 4781 with rewards -622.8760431259836 with 96 steps, done\n",
      "Run episode 4782 with rewards -670.9441272487176 with 73 steps, done\n",
      "Run episode 4783 with rewards -507.7882586239645 with 91 steps, done\n",
      "Run episode 4784 with rewards -691.7032955462624 with 79 steps, done\n",
      "Run episode 4785 with rewards -227.80422937874812 with 81 steps, done\n",
      "Run episode 4786 with rewards -147.10023471190868 with 57 steps, done\n",
      "Run episode 4787 with rewards -48.54851351014537 with 70 steps, done\n",
      "Run episode 4788 with rewards -361.29582916170995 with 87 steps, done\n",
      "Run episode 4789 with rewards -724.7885573714849 with 82 steps, done\n",
      "Run episode 4790 with rewards -131.38301142031693 with 53 steps, done\n",
      "Run episode 4791 with rewards -76.34295870187175 with 59 steps, done\n",
      "Run episode 4792 with rewards -773.655742325633 with 80 steps, done\n",
      "Run episode 4793 with rewards -20.29028532009093 with 71 steps, done\n",
      "Run episode 4794 with rewards -3619.9811045593115 with 365 steps, done\n",
      "Run episode 4795 with rewards -135.87283673973656 with 57 steps, done\n",
      "Run episode 4796 with rewards -728.163094326627 with 165 steps, done\n",
      "Run episode 4797 with rewards -747.005310740725 with 78 steps, done\n",
      "Run episode 4798 with rewards -108.22251030002569 with 89 steps, done\n",
      "Run episode 4799 with rewards -605.5115490864009 with 68 steps, done\n",
      "Run episode 4800 with rewards -150.9918591234857 with 68 steps, done\n",
      "Run episode 4801 with rewards -3.1953444994763913 with 62 steps, done\n",
      "Run episode 4802 with rewards -664.9084299358984 with 83 steps, done\n",
      "Run episode 4803 with rewards -228.97569040344445 with 67 steps, done\n",
      "Run episode 4804 with rewards -787.6820072799746 with 80 steps, done\n",
      "Run episode 4805 with rewards -610.7927101403917 with 129 steps, done\n",
      "Run episode 4806 with rewards -897.1963801351919 with 82 steps, done\n",
      "Run episode 4807 with rewards -78.49670001102363 with 60 steps, done\n",
      "Run episode 4808 with rewards -689.6330921391475 with 117 steps, done\n",
      "Run episode 4809 with rewards -513.4484209423917 with 90 steps, done\n",
      "Run episode 4810 with rewards -484.84780349335614 with 103 steps, done\n",
      "Run episode 4811 with rewards -159.1744706660919 with 85 steps, done\n",
      "Run episode 4812 with rewards -457.04909438004546 with 86 steps, done\n",
      "Run episode 4813 with rewards -261.01830328034043 with 87 steps, done\n",
      "Run episode 4814 with rewards -444.82396486655347 with 61 steps, done\n",
      "Run episode 4815 with rewards -607.6251719942937 with 95 steps, done\n",
      "Run episode 4816 with rewards -567.415808093607 with 64 steps, done\n",
      "Run episode 4817 with rewards -409.3359885670515 with 67 steps, done\n",
      "Run episode 4818 with rewards -548.0371539118603 with 61 steps, done\n",
      "Run episode 4819 with rewards -671.8586767189016 with 119 steps, done\n",
      "Run episode 4820 with rewards -372.44864166099126 with 70 steps, done\n",
      "Run episode 4821 with rewards -855.0979753231637 with 130 steps, done\n",
      "Run episode 4822 with rewards -440.2202059626657 with 57 steps, done\n",
      "Run episode 4823 with rewards -259.9575983656431 with 87 steps, done\n",
      "Run episode 4824 with rewards -711.802306489622 with 73 steps, done\n",
      "Run episode 4825 with rewards -346.6051895116833 with 77 steps, done\n",
      "Run episode 4826 with rewards -693.9190688892633 with 75 steps, done\n",
      "Run episode 4827 with rewards -578.5051843100822 with 71 steps, done\n",
      "Run episode 4828 with rewards -658.5791002666265 with 85 steps, done\n",
      "Run episode 4829 with rewards -485.15710567375436 with 69 steps, done\n",
      "Run episode 4830 with rewards -551.2634062121142 with 60 steps, done\n",
      "Run episode 4831 with rewards -230.76133071530842 with 79 steps, done\n",
      "Run episode 4832 with rewards -570.203437046599 with 66 steps, done\n",
      "Run episode 4833 with rewards -556.9173903129841 with 92 steps, done\n",
      "Run episode 4834 with rewards -874.5114385961659 with 81 steps, done\n",
      "Run episode 4835 with rewards -682.9684848376005 with 84 steps, done\n",
      "Run episode 4836 with rewards -437.4315965109116 with 58 steps, done\n",
      "Run episode 4837 with rewards -793.9325550672063 with 78 steps, done\n",
      "Run episode 4838 with rewards -479.3967039335208 with 101 steps, done\n",
      "Run episode 4839 with rewards -436.38898420271585 with 52 steps, done\n",
      "Run episode 4840 with rewards -619.5802348419088 with 96 steps, done\n",
      "Run episode 4841 with rewards -397.6558476425179 with 99 steps, done\n",
      "Run episode 4842 with rewards -470.5441835228922 with 53 steps, done\n",
      "Run episode 4843 with rewards -391.5344469396218 with 47 steps, done\n",
      "Run episode 4844 with rewards -778.7282472099217 with 83 steps, done\n",
      "Run episode 4845 with rewards -721.6510649239067 with 72 steps, done\n",
      "Run episode 4846 with rewards -545.4310393164067 with 64 steps, done\n",
      "Run episode 4847 with rewards -544.9016242857433 with 61 steps, done\n",
      "Run episode 4848 with rewards -706.3675565875751 with 132 steps, done\n",
      "Run episode 4849 with rewards -495.5292221152923 with 71 steps, done\n",
      "Run episode 4850 with rewards -193.62742104371608 with 97 steps, done\n",
      "Run episode 4851 with rewards -1636.2218357438057 with 230 steps, done\n",
      "Run episode 4852 with rewards -157.24534462529482 with 78 steps, done\n",
      "Run episode 4853 with rewards -436.98337383193535 with 57 steps, done\n",
      "Run episode 4854 with rewards -241.32212416740106 with 76 steps, done\n",
      "Run episode 4855 with rewards -509.41638126438306 with 58 steps, done\n",
      "Run episode 4856 with rewards -195.3571682072946 with 76 steps, done\n",
      "Run episode 4857 with rewards -492.3324009364652 with 72 steps, done\n",
      "Run episode 4858 with rewards -507.00560287915323 with 93 steps, done\n",
      "Run episode 4859 with rewards -151.57084198950815 with 50 steps, done\n",
      "Run episode 4860 with rewards -373.9300997663239 with 74 steps, done\n",
      "Run episode 4861 with rewards -164.80057517208698 with 74 steps, done\n",
      "Run episode 4862 with rewards -670.3586017535706 with 125 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 4863 with rewards -131.22276026324818 with 53 steps, done\n",
      "Run episode 4864 with rewards -994.2854970102733 with 162 steps, done\n",
      "Run episode 4865 with rewards -102.58246375932413 with 56 steps, done\n",
      "Run episode 4866 with rewards -137.69575981787096 with 54 steps, done\n",
      "Run episode 4867 with rewards -759.4197434273528 with 78 steps, done\n",
      "Run episode 4868 with rewards -161.71249786809955 with 75 steps, done\n",
      "Run episode 4869 with rewards -128.18213330484775 with 159 steps, done\n",
      "Run episode 4870 with rewards -130.62254087869584 with 71 steps, done\n",
      "Run episode 4871 with rewards -501.9806132917637 with 79 steps, done\n",
      "Run episode 4872 with rewards -154.21272775446727 with 111 steps, done\n",
      "Run episode 4873 with rewards -475.5186647078661 with 54 steps, done\n",
      "Run episode 4874 with rewards -605.4645956696278 with 88 steps, done\n",
      "Run episode 4875 with rewards -190.5202720799993 with 52 steps, done\n",
      "Run episode 4876 with rewards -0.8300350613756109 with 86 steps, done\n",
      "Run episode 4877 with rewards -347.06169492582757 with 54 steps, done\n",
      "Run episode 4878 with rewards -206.76493177227627 with 66 steps, done\n",
      "Run episode 4879 with rewards -529.2478236305899 with 59 steps, done\n",
      "Run episode 4880 with rewards -269.58893364109997 with 76 steps, done\n",
      "Run episode 4881 with rewards -421.4229928494657 with 70 steps, done\n",
      "Run episode 4882 with rewards -470.0184060023386 with 94 steps, done\n",
      "Run episode 4883 with rewards -736.0835305217136 with 71 steps, done\n",
      "Run episode 4884 with rewards -512.2878677240567 with 75 steps, done\n",
      "Run episode 4885 with rewards -472.5144343314488 with 68 steps, done\n",
      "Run episode 4886 with rewards -521.603815900546 with 83 steps, done\n",
      "Run episode 4887 with rewards -520.9752465433623 with 56 steps, done\n",
      "Run episode 4888 with rewards -528.7535659274859 with 82 steps, done\n",
      "Run episode 4889 with rewards -127.89851313759237 with 52 steps, done\n",
      "Run episode 4890 with rewards -168.64181673774578 with 69 steps, done\n",
      "Run episode 4891 with rewards -157.01539403036492 with 70 steps, done\n",
      "Run episode 4892 with rewards -146.8383197919619 with 63 steps, done\n",
      "Run episode 4893 with rewards -664.645907599661 with 75 steps, done\n",
      "Run episode 4894 with rewards -555.4173577521831 with 76 steps, done\n",
      "Run episode 4895 with rewards -508.2856555725309 with 63 steps, done\n",
      "Run episode 4896 with rewards -304.61331813407867 with 93 steps, done\n",
      "Run episode 4897 with rewards -531.4451109646748 with 65 steps, done\n",
      "Run episode 4898 with rewards -434.78619596986545 with 51 steps, done\n",
      "Run episode 4899 with rewards -473.95401976985386 with 71 steps, done\n",
      "Run episode 4900 with rewards -272.63358269914517 with 52 steps, done\n",
      "Run episode 4901 with rewards -558.981189925222 with 61 steps, done\n",
      "Run episode 4902 with rewards -342.2024294700518 with 85 steps, done\n",
      "Run episode 4903 with rewards -462.6681557929209 with 63 steps, done\n",
      "Run episode 4904 with rewards -365.69291143522474 with 95 steps, done\n",
      "Run episode 4905 with rewards -529.3371041354931 with 132 steps, done\n",
      "Run episode 4906 with rewards -150.35971271608298 with 56 steps, done\n",
      "Run episode 4907 with rewards -768.983792474523 with 74 steps, done\n",
      "Run episode 4908 with rewards -564.259488391417 with 95 steps, done\n",
      "Run episode 4909 with rewards -391.17477484887536 with 96 steps, done\n",
      "Run episode 4910 with rewards -190.53959243768458 with 72 steps, done\n",
      "Run episode 4911 with rewards -134.2982597720813 with 71 steps, done\n",
      "Run episode 4912 with rewards -265.3849629239339 with 108 steps, done\n",
      "Run episode 4913 with rewards -1264.981758112043 with 196 steps, done\n",
      "Run episode 4914 with rewards -273.84056537773824 with 86 steps, done\n",
      "Run episode 4915 with rewards -183.55200713354287 with 70 steps, done\n",
      "Run episode 4916 with rewards -554.7311045941894 with 68 steps, done\n",
      "Run episode 4917 with rewards -466.43587575605216 with 52 steps, done\n",
      "Run episode 4918 with rewards -600.5251097487778 with 93 steps, done\n",
      "Run episode 4919 with rewards -407.7530331886734 with 53 steps, done\n",
      "Run episode 4920 with rewards -412.82714368412536 with 123 steps, done\n",
      "Run episode 4921 with rewards -773.069495198257 with 91 steps, done\n",
      "Run episode 4922 with rewards 41.291130809368724 with 73 steps, done\n",
      "best\n",
      "Run episode 4923 with rewards -1629.9074496271637 with 220 steps, done\n",
      "Run episode 4924 with rewards -201.58643469139747 with 71 steps, done\n",
      "Run episode 4925 with rewards -889.7091603093944 with 129 steps, done\n",
      "Run episode 4926 with rewards -256.39345036293025 with 66 steps, done\n",
      "Run episode 4927 with rewards -459.88927871429524 with 76 steps, done\n",
      "Run episode 4928 with rewards -118.77862028344629 with 54 steps, done\n",
      "Run episode 4929 with rewards -244.3149725057585 with 109 steps, done\n",
      "Run episode 4930 with rewards -459.2354581966889 with 68 steps, done\n",
      "Run episode 4931 with rewards -590.9089089850314 with 62 steps, done\n",
      "Run episode 4932 with rewards -682.3872563659164 with 107 steps, done\n",
      "Run episode 4933 with rewards -462.83501733180117 with 55 steps, done\n",
      "Run episode 4934 with rewards -309.793201403322 with 82 steps, done\n",
      "Run episode 4935 with rewards -621.3319183463318 with 76 steps, done\n",
      "Run episode 4936 with rewards -322.7948085464236 with 79 steps, done\n",
      "Run episode 4937 with rewards -591.4799292962184 with 86 steps, done\n",
      "Run episode 4938 with rewards -283.9713467272624 with 52 steps, done\n",
      "Run episode 4939 with rewards -537.111964595214 with 60 steps, done\n",
      "Run episode 4940 with rewards -525.6892735328806 with 111 steps, done\n",
      "Run episode 4941 with rewards -804.8649429733437 with 76 steps, done\n",
      "Run episode 4942 with rewards -149.10534231447576 with 74 steps, done\n",
      "Run episode 4943 with rewards -122.63360915763116 with 75 steps, done\n",
      "Run episode 4944 with rewards -554.0802035692582 with 99 steps, done\n",
      "Run episode 4945 with rewards -241.5229871294416 with 51 steps, done\n",
      "Run episode 4946 with rewards -235.89594579120472 with 112 steps, done\n",
      "Run episode 4947 with rewards -345.545553178506 with 50 steps, done\n",
      "Run episode 4948 with rewards -492.6878222749533 with 82 steps, done\n",
      "Run episode 4949 with rewards -630.153136892436 with 69 steps, done\n",
      "Run episode 4950 with rewards -619.9807773756523 with 96 steps, done\n",
      "Run episode 4951 with rewards -744.3072083261281 with 78 steps, done\n",
      "Run episode 4952 with rewards -714.9242201066975 with 74 steps, done\n",
      "Run episode 4953 with rewards -157.86076809930847 with 77 steps, done\n",
      "Run episode 4954 with rewards -797.8496661822039 with 79 steps, done\n",
      "Run episode 4955 with rewards -233.95833711157943 with 78 steps, done\n",
      "Run episode 4956 with rewards -659.1485633109901 with 95 steps, done\n",
      "Run episode 4957 with rewards -625.1384891886291 with 67 steps, done\n",
      "Run episode 4958 with rewards -519.6468209582863 with 116 steps, done\n",
      "Run episode 4959 with rewards -807.3664548119433 with 83 steps, done\n",
      "Run episode 4960 with rewards -2886.68305280577 with 294 steps, done\n",
      "Run episode 4961 with rewards -8.947215989223224 with 88 steps, done\n",
      "Run episode 4962 with rewards -798.6495104486107 with 154 steps, done\n",
      "Run episode 4963 with rewards -588.1961495214707 with 62 steps, done\n",
      "Run episode 4964 with rewards -159.17044573536063 with 70 steps, done\n",
      "Run episode 4965 with rewards -355.3224856033564 with 51 steps, done\n",
      "Run episode 4966 with rewards -140.4581536611033 with 67 steps, done\n",
      "Run episode 4967 with rewards -765.9859830119931 with 76 steps, done\n",
      "Run episode 4968 with rewards -290.07587682845866 with 89 steps, done\n",
      "Run episode 4969 with rewards -495.6886962443084 with 55 steps, done\n",
      "Run episode 4970 with rewards -201.82168285381425 with 74 steps, done\n",
      "Run episode 4971 with rewards -686.1863916074088 with 77 steps, done\n",
      "Run episode 4972 with rewards -600.0610656558122 with 90 steps, done\n",
      "Run episode 4973 with rewards -453.8110193986222 with 61 steps, done\n",
      "Run episode 4974 with rewards -184.93343352561226 with 90 steps, done\n",
      "Run episode 4975 with rewards -551.349407100483 with 67 steps, done\n",
      "Run episode 4976 with rewards -482.92623549089575 with 56 steps, done\n",
      "Run episode 4977 with rewards -703.9375856982437 with 71 steps, done\n",
      "Run episode 4978 with rewards -564.4953024745464 with 109 steps, done\n",
      "Run episode 4979 with rewards -577.0380748043617 with 114 steps, done\n",
      "Run episode 4980 with rewards -542.3041341231525 with 87 steps, done\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 4981 with rewards -464.3961547778753 with 55 steps, done\n",
      "Run episode 4982 with rewards -581.431817755688 with 89 steps, done\n",
      "Run episode 4983 with rewards -524.3411099580967 with 69 steps, done\n",
      "Run episode 4984 with rewards -366.34660717241155 with 66 steps, done\n",
      "Run episode 4985 with rewards -541.6526821436084 with 75 steps, done\n",
      "Run episode 4986 with rewards -497.6557105029059 with 58 steps, done\n",
      "Run episode 4987 with rewards -805.7433298357546 with 119 steps, done\n",
      "Run episode 4988 with rewards -808.5149305374982 with 80 steps, done\n",
      "Run episode 4989 with rewards -1840.3871953379085 with 217 steps, done\n",
      "Run episode 4990 with rewards -457.9073352484284 with 61 steps, done\n",
      "Run episode 4991 with rewards -395.74960416730147 with 89 steps, done\n",
      "Run episode 4992 with rewards -497.08449095419655 with 71 steps, done\n",
      "Run episode 4993 with rewards -160.86735608479884 with 71 steps, done\n",
      "Run episode 4994 with rewards -531.300104504832 with 91 steps, done\n",
      "Run episode 4995 with rewards -688.9686596222989 with 88 steps, done\n",
      "Run episode 4996 with rewards -607.9356222776717 with 83 steps, done\n",
      "Run episode 4997 with rewards -136.95631249179146 with 56 steps, done\n",
      "Run episode 4998 with rewards -1569.7542604659268 with 202 steps, done\n",
      "Run episode 4999 with rewards -124.94418332993783 with 68 steps, done\n",
      "\n",
      "Done\n"
     ]
    }
   ],
   "source": [
    "rewards = train()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "id": "3d20e8e0",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "--------------\n",
      "  +89.2950 if obs_1>=2.0 & obs_3<=15.0 & obs_6<=22.70100908279419 & obs_6<=22.998740005493165\n",
      "  +13.5386 if obs_1<=12.0 & obs_1>=2.0 & obs_3<=-2.480000019073482 & obs_5<=26.0 & obs_6<=22.177796268463133\n",
      "   +3.2217 if obs_1<=29.0 & obs_1>=10.0 & obs_2<=4.0 & obs_2<=6.0 & obs_3<=-1.0 & obs_3<=0.5 & obs_3>=-7.300000190734863 & obs_3>=-8.399999618530273 & obs_4<=21.0 & obs_4>=16.0 & obs_5>=25.0 & obs_5>=26.0 & obs_6<=21.000030326843262 & obs_7<=56.14059104919433 & obs_8<=17991.406152343752 & obs_8>=568.9686584472656\n",
      "  +36.9233 if obs_1>=4.0 & obs_2>=4.0 & obs_4<=18.0 & obs_6<=19.74883813858032 & obs_6<=20.592261409759523 & obs_7<=36.43242073059082 & obs_7<=36.80724649429321 & obs_8>=2935.4127197265625\n",
      "  +16.7580 if obs_1<=15.0 & obs_2>=3.0 & obs_3<=-6.699999809265137 & obs_3>=-11.707499814033508 & obs_4<=20.0 & obs_6<=19.74883813858032 & obs_8>=3257.3261230468747\n",
      "  +16.3780 if obs_2<=2.0 & obs_6<=18.97082986831665 & obs_8>=3000.8402465820313\n",
      "  +56.3921 if obs_1>=2.0 & obs_3<=-5.0 & obs_6<=21.459081649780277 & obs_7<=61.74348316192627 & obs_7>=22.529983043670654 & obs_8>=1762.7387084960938\n",
      "  +58.4708 if obs_2<=6.0 & obs_4>=17.0 & obs_6<=19.887684488296507 & obs_6<=22.83117961883545 & obs_8>=2708.7663696289064\n",
      "  +55.7605 if obs_1>=2.0 & obs_3<=15.0 & obs_3>=-11.707499814033508 & obs_6<=21.841278553009033\n",
      "  +48.4805 if obs_1>=3.0 & obs_2<=6.0 & obs_3<=-5.599999904632568 & obs_8>=5741.618798828125\n",
      "  +13.8765 if obs_1>=2.0 & obs_3<=-1.2000000476837158 & obs_3>=-11.707499814033508 & obs_4<=15.0 & obs_6<=22.9116003036499 & obs_7<=63.92743215560914\n",
      "  +18.9247 if obs_1>=26.0 & obs_2>=1.0 & obs_3<=-2.0 & obs_4<=18.0 & obs_4<=20.0 & obs_5>=24.0 & obs_6<=22.515908813476564\n",
      "   +6.2941 if obs_1<=25.0 & obs_1>=4.0 & obs_3<=15.0 & obs_3>=-11.707499814033508 & obs_5<=24.0 & obs_6<=21.999748325347902\n",
      "   +5.6774 if obs_1<=26.0 & obs_1>=5.0 & obs_2<=0.0 & obs_3<=11.0 & obs_3>=-11.707499814033508 & obs_5<=28.0 & obs_6<=20.83740234375\n",
      "  +54.6676 if obs_1>=2.0 & obs_2<=21.0 & obs_3<=-5.0 & obs_6<=20.73638858795166 & obs_7>=24.441575813293458 & obs_8>=1738.9174713134767\n",
      "   +0.9462 if obs_2>=3.0 & obs_3<=-2.480000019073482 & obs_3>=-8.399999618530273 & obs_4>=22.0 & obs_6<=22.006057357788087 & obs_6>=21.450941181182863\n",
      "   +1.3375 if obs_2<=0.0 & obs_3<=-11.707499814033508\n",
      "   +0.6414 if obs_2<=1.0 & obs_6<=19.1446174621582 & obs_7>=59.65270099639892\n",
      "   +0.9549 if obs_4<=15.0 & obs_6<=19.112470388412476 & obs_8>=2780.427294921876\n",
      "   +8.2876 if obs_1<=26.0 & obs_3<=-7.300000190734863 & obs_4<=18.0 & obs_6<=22.938304519653318 & obs_6>=17.667845153808592 & obs_7>=25.293832969665527 & obs_8>=2412.479943847656\n",
      "--------------\n",
      " +100.6794 if obs_0<=2.0 & obs_3<=15.0 & obs_3>=-11.707499814033508 & obs_4<=21.0 & obs_6<=22.177796268463133 & obs_6<=22.70100908279419\n",
      "  +29.4817 if obs_2<=7.0 & obs_2>=2.0 & obs_3<=-4.0 & obs_3>=-11.707499814033508 & obs_6<=19.009052515029907 & obs_8<=9683.068164062503 & obs_8>=5646.802624511719\n",
      "  +52.9785 if obs_1<=24.0 & obs_2<=6.0 & obs_3<=0.5 & obs_3>=-11.707499814033508 & obs_4<=21.0 & obs_5<=29.0 & obs_6<=21.000030326843262 & obs_8>=568.9686584472656\n",
      "   +6.6761 if obs_1<=17.0 & obs_6<=20.592261409759523 & obs_7>=60.26889057159424\n",
      "  +58.3098 if obs_2>=1.0 & obs_3>=-11.707499814033508 & obs_6<=18.433651208877563 & obs_7>=22.757880306243898 & obs_8>=895.5278167724608\n",
      "  +69.2359 if obs_2<=6.0 & obs_3>=-11.707499814033508 & obs_6<=19.355116844177246 & obs_8>=492.0159454345703\n",
      "  +73.6616 if obs_3<=0.5 & obs_3>=-11.707499814033508 & obs_4<=20.0 & obs_6<=19.71504259109497 & obs_7>=22.529983043670654 & obs_8>=3032.436499023438\n",
      "  +32.3504 if obs_1<=25.0 & obs_1<=27.0 & obs_3<=-4.5 & obs_3<=-6.199999809265137 & obs_3>=-11.707499814033508 & obs_6<=19.57283444404602 & obs_6>=17.389590978622437 & obs_7>=22.9129599571228 & obs_7>=25.29561471939087 & obs_8>=6366.16953125\n",
      "   +4.6725 if obs_2>=21.0 & obs_3<=-1.0 & obs_3>=-11.707499814033508 & obs_6<=21.33929481506348 & obs_8>=1702.5115631103513\n",
      "  +19.0625 if obs_1<=27.0 & obs_3<=0.5 & obs_3>=-6.699999809265137 & obs_3>=-8.399999618530273 & obs_6<=19.217973518371583 & obs_6<=19.359976482391357 & obs_7<=61.80542621612549 & obs_7>=22.353507852554323 & obs_8>=1861.2105255126953 & obs_8>=2004.447509765625\n",
      "   +6.3846 if obs_1>=3.0 & obs_2<=2.0 & obs_3<=0.5 & obs_3>=-11.707499814033508 & obs_3>=-8.399999618530273 & obs_6<=19.54636526107788 & obs_6>=18.000740575790406 & obs_7<=64.12795448303223 & obs_7>=27.235195350646972 & obs_8>=3133.002301025391\n",
      "   +1.4869 if obs_3<=-8.399999618530273 & obs_3>=-11.707499814033508 & obs_4<=16.0 & obs_7>=21.751472330093385\n",
      "   +1.9827 if obs_1>=26.0 & obs_2<=3.0 & obs_2<=5.0 & obs_2>=1.0 & obs_2>=2.0 & obs_3>=-7.300000190734863 & obs_6<=19.456950902938843 & obs_8<=8161.607934570311 & obs_8>=854.5063720703125\n",
      "  +18.9273 if obs_2<=17.0 & obs_2>=11.0 & obs_3<=0.5 & obs_3>=-2.480000019073482 & obs_4<=18.0 & obs_5<=26.0 & obs_6>=20.665931510925294 & obs_6>=22.891964530944822 & obs_7<=60.45632057189942 & obs_8<=2261.5205078125\n",
      "  +22.3504 if obs_1>=26.0 & obs_2<=8.0 & obs_4<=21.0 & obs_5<=28.0 & obs_6<=20.904061365127564\n",
      "   +4.1862 if obs_2<=6.0 & obs_3<=0.5 & obs_3>=-11.707499814033508 & obs_5<=23.0\n",
      "   +2.7555 if obs_1>=2.0 & obs_3<=15.0 & obs_5<=29.0 & obs_6<=21.73469276428223 & obs_8<=928.4181945800782\n",
      "   +5.5446 if obs_2<=6.0 & obs_3<=-2.0 & obs_3>=-11.707499814033508 & obs_4<=16.0 & obs_7>=38.10074806213379 & obs_8>=1558.3621337890627\n",
      "   +1.3116 if obs_1<=26.0 & obs_3>=-11.707499814033508 & obs_5<=24.0 & obs_6<=22.000308990478516 & obs_7<=59.65270099639892 & obs_8>=869.6932250976564 & obs_8>=969.1310348510742\n",
      "  +10.5605 if obs_2<=6.0 & obs_3<=-7.300000190734863 & obs_3>=-11.707499814033508\n",
      "--------------\n",
      "  -16.9519 if obs_3<=-2.480000019073482 & obs_3>=-8.399999618530273 & obs_6<=22.177796268463133 & obs_8<=17991.406152343752\n",
      "   -4.7764 if obs_1<=30.0 & obs_1>=2.0 & obs_3>=-6.699999809265137 & obs_4<=18.0 & obs_6<=20.592261409759523 & obs_8<=1975.9460571289071\n",
      "   -3.8022 if obs_0>=2.0 & obs_1<=27.0 & obs_1>=2.0 & obs_3<=8.800000190734863 & obs_3>=-7.300000190734863 & obs_6<=22.998740005493165 & obs_8<=14654.500781249997 & obs_8>=380.8040405273438\n",
      "  -16.1714 if obs_0<=2.0 & obs_1<=28.0 & obs_3<=15.0 & obs_3>=-6.699999809265137 & obs_6<=22.000615882873536\n",
      "   -2.0705 if obs_2>=2.0 & obs_3<=-3.0 & obs_3>=-8.399999618530273 & obs_6<=21.989394187927246 & obs_8>=3635.091381835938\n",
      "   -0.7458 if obs_1<=28.0 & obs_2>=1.0 & obs_3<=-1.0 & obs_3>=-6.0 & obs_4<=17.0 & obs_6<=19.713508510589598 & obs_6>=17.494304513931276 & obs_7<=62.17353744506836 & obs_8>=792.7148559570313 & obs_8>=965.7166198730467\n",
      "   -7.3763 if obs_1<=27.0 & obs_2<=4.0 & obs_3>=-6.699999809265137 & obs_4<=18.0 & obs_7<=66.3616907119751 & obs_8>=1106.592529296875 & obs_8>=2045.947299194336\n",
      "   -1.2242 if obs_1<=27.0 & obs_1>=24.0 & obs_3<=2.0 & obs_5<=28.0 & obs_6<=21.7190043926239 & obs_8<=9706.131835937505\n",
      "   -5.1958 if obs_0<=2.0 & obs_1<=30.0 & obs_3>=-6.699999809265137 & obs_6<=20.751729726791382 & obs_6<=21.027472686767577 & obs_6>=18.435271501541138 & obs_8<=2057.523193359375\n",
      "   -7.0424 if obs_2<=22.0 & obs_3<=-1.0 & obs_3>=-8.399999618530273 & obs_6<=19.594702196121215 & obs_7>=23.042034149169922 & obs_8>=3124.2736938476583\n",
      "   -4.5610 if obs_3<=-5.0 & obs_3>=-8.399999618530273 & obs_6<=19.77602367401123 & obs_6<=19.989752674102782\n",
      "   -9.8319 if obs_0<=2.0 & obs_3<=15.0 & obs_3>=-2.480000019073482 & obs_3>=-8.399999618530273 & obs_6<=21.807869911193848 & obs_7>=22.339631414413454\n",
      "   -8.2208 if obs_1>=26.0 & obs_6<=19.999998092651367 & obs_7>=20.41123585700989 & obs_8<=5933.542053222656 & obs_8>=1137.6973724365234\n",
      "   -9.5157 if obs_2<=6.0 & obs_3>=-8.399999618530273 & obs_6<=19.603502464294433 & obs_8>=642.4375732421877 & obs_8>=737.6930572509766\n",
      "   -4.4893 if obs_2<=6.0 & obs_3<=-1.0 & obs_3<=0.5 & obs_3>=-8.399999618530273 & obs_6<=19.264748096466064 & obs_6<=20.520594024658205 & obs_7<=64.75711250305176 & obs_8>=2130.8052246093753 & obs_8>=2266.0539428710936\n",
      "   -0.9318 if obs_1<=28.0 & obs_2<=12.0 & obs_2<=21.0 & obs_3<=-2.480000019073482 & obs_3<=2.0 & obs_3>=-7.300000190734863 & obs_6<=21.76917266845703 & obs_7<=39.342803192138675 & obs_8<=3409.1862976074226 & obs_8<=3716.27294921875 & obs_8<=5073.7230224609375 & obs_8>=1266.370394897461\n",
      "   -2.0504 if obs_3<=-1.0 & obs_3>=-8.399999618530273 & obs_6>=20.815040826797485 & obs_8>=9904.482861328124\n",
      "   -0.3166 if obs_3>=-8.399999618530273 & obs_5>=28.0 & obs_6<=19.288299131393433 & obs_6>=18.103337574005128 & obs_7>=22.587212085723877 & obs_8>=2048.057849121094\n",
      "   -0.3166 if obs_2<=2.0 & obs_5<=25.0 & obs_6>=20.30489401817322\n",
      "   +1.0000 if obs_3<=4.320000171661381 & obs_3>=-8.399999618530273 & obs_4<=17.0 & obs_6<=18.320459938049318 & obs_8>=2080.554931640625\n",
      "--------------\n",
      " +124.5486 if obs_0<=2.0 & obs_1<=28.0 & obs_2>=3.0 & obs_3<=15.0 & obs_4<=21.0 & obs_6<=21.999842405319214 & obs_7>=30.120348739624024 & obs_8<=14654.500781249997\n",
      "  +32.0964 if obs_2>=2.0 & obs_3<=-8.399999618530273 & obs_6<=19.355116844177246 & obs_7>=40.868707275390626 & obs_8<=10144.1078125 & obs_8>=6151.636474609375\n",
      " +105.7383 if obs_0<=1.0 & obs_1<=29.0 & obs_2>=2.0 & obs_3<=8.800000190734863 & obs_4>=17.0 & obs_6<=19.453564262390138 & obs_7<=64.25104618072511 & obs_7>=30.506654977798462\n",
      "  +14.2700 if obs_3<=-2.480000019073482 & obs_4>=16.0 & obs_5<=29.0 & obs_6<=25.189791679382324 & obs_6>=22.73059253692627 & obs_6>=22.999444484710693 & obs_8>=1242.8953430175782\n",
      "  +15.8421 if obs_1<=3.0 & obs_2>=3.0 & obs_3>=-9.5 & obs_6<=20.759230756759642 & obs_7>=32.07972869873047\n",
      "  +63.3521 if obs_1<=29.0 & obs_2<=6.0 & obs_2>=3.0 & obs_6<=18.562196016311646 & obs_7>=29.883917236328124 & obs_8>=6365.397119140634\n",
      "   +0.8762 if obs_2>=3.0 & obs_3<=15.0 & obs_3>=4.320000171661381 & obs_6<=21.999615907669067 & obs_7>=33.92039680480957 & obs_8<=2360.1209594726565\n",
      " +107.8809 if obs_1>=2.0 & obs_2>=2.0 & obs_3<=0.5 & obs_4<=18.0 & obs_5<=29.0 & obs_5>=25.0 & obs_6<=21.574360132217407 & obs_7>=31.110543155670165 & obs_7>=32.62192287445068 & obs_8>=3686.024060058594\n",
      "   +5.6527 if obs_3<=-3.4000000953674316 & obs_3>=-9.5 & obs_4>=17.0 & obs_5<=29.0 & obs_6<=25.44772434234619 & obs_6>=23.058403062820435 & obs_8>=2405.3298339843755\n",
      "  +16.5432 if obs_1<=27.0 & obs_1>=26.0 & obs_2>=2.0 & obs_6<=18.404147386550903 & obs_8>=4192.727551269531\n",
      "  +24.5741 if obs_1>=26.0 & obs_2>=2.0 & obs_3<=-2.0 & obs_5<=28.0 & obs_6<=19.456950902938843 & obs_7>=29.95218391418457\n",
      "   +1.4249 if obs_1<=3.0 & obs_2>=5.0 & obs_7>=44.40178031921387 & obs_8>=9604.691406250004\n",
      "   +1.3357 if obs_3<=-3.4000000953674316 & obs_3>=-9.5 & obs_6<=25.151752710342407 & obs_6>=24.209823989868163 & obs_7<=50.07842845916748\n",
      "   +7.9327 if obs_2<=6.0 & obs_2>=2.0 & obs_3<=-2.480000019073482 & obs_6<=18.25954704284668 & obs_7>=30.449059677124023 & obs_8<=9467.85437011719 & obs_8>=7888.431005859376\n",
      "   +0.6714 if obs_3<=-3.0 & obs_3>=-9.5 & obs_4>=22.0 & obs_6>=23.12006611824036\n",
      "   +1.3955 if obs_2<=14.0 & obs_3<=-9.5 & obs_6>=23.006806898117066\n",
      "   +1.0926 if obs_1<=28.0 & obs_1>=27.0 & obs_3<=-2.0 & obs_3>=-3.4000000953674316 & obs_7>=32.880251216888425\n",
      "   +1.7730 if obs_0<=1.0 & obs_3<=-2.480000019073482 & obs_3>=-6.699999809265137 & obs_4>=21.0 & obs_6<=25.40608005523682\n",
      "   +2.8931 if obs_1<=2.0 & obs_2<=6.0 & obs_6<=18.18353614807129 & obs_6<=18.684878158569337\n",
      "  +44.6132 if obs_1<=29.0 & obs_1>=2.0 & obs_2>=2.0 & obs_3<=-7.300000190734863 & obs_5>=26.0 & obs_6<=21.895850944519044 & obs_7>=34.7031551361084\n"
     ]
    }
   ],
   "source": [
    "for i in range(4):\n",
    "    print(\"--------------\\n{}\".format(actor.model[i].rules_))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "id": "0b443f87",
   "metadata": {},
   "outputs": [],
   "source": [
    "def test(num_test_episodes=100):\n",
    "    \"\"\"\n",
    "    Test the learned policy using the trained actor model.\n",
    "\n",
    "    Args:\n",
    "        num_test_episodes (int): Number of episodes to test the model.\n",
    "\n",
    "    Returns:\n",
    "        float: Average reward over the test episodes.\n",
    "    \"\"\"\n",
    "    total_reward = 0\n",
    "\n",
    "    for episode in range(num_test_episodes):\n",
    "        state = env.reset()[0]  # Reset the environment and get the initial state\n",
    "        episode_reward = 0\n",
    "        state=position_to_index(state)\n",
    "        for t in range(1, 100):  # Limit the number of time steps\n",
    "            # Convert state to tensor and predict action probabilities\n",
    "            #             state_tensor = torch.tensor(state, dtype=torch.float32).to(device)\n",
    "            action_probs = actor.predict(pd.DataFrame(np.array([state]), columns=column_names))\n",
    "            # Select action based on the highest probability\n",
    "            action = np.argmax(action_probs)\n",
    "            # Take the chosen action\n",
    "            next_state, reward, done, trunc, _ = env.step(action)\n",
    "            # Accumulate reward\n",
    "            episode_reward += reward\n",
    "            if done or trunc:\n",
    "                break\n",
    "            # Update state\n",
    "            state = next_state\n",
    "            state=position_to_index(state)\n",
    "        total_reward += episode_reward\n",
    "        print(f\"Test Episode {episode + 1}, Reward: {episode_reward}\")\n",
    "    avg_reward = total_reward / num_test_episodes\n",
    "    print(f\"\\nAverage Reward over {num_test_episodes} Test Episodes: {avg_reward}\")\n",
    "    return avg_reward"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "id": "ef9e3e26",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Starting a new episode.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 252: demo-v1\u001b[0m\n",
      "#----------------------------------------------------------------------------------------------#\n",
      "\u001b[38;20m[MODEL] (INFO) : Episode directory created.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Weather file USA_PA_Pittsburgh-Allegheny.County.AP.725205_TMY3.epw used.\u001b[0m\n",
      "\u001b[38;20m[MODEL] (INFO) : Adapting weather to building model.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Saving episode output path.\u001b[0m\n",
      "\u001b[38;20m[ENVIRONMENT] (INFO) : Episode 252 started.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : handlers are ready.\u001b[0m\n",
      "\u001b[38;20m[SIMULATOR] (INFO) : System is ready.\u001b[0m\n"
     ]
    },
    {
     "ename": "ValueError",
     "evalue": "Must pass 2-d input. shape=(1, 2, 9)",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mValueError\u001b[0m                                Traceback (most recent call last)",
      "Cell \u001b[0;32mIn[36], line 1\u001b[0m\n\u001b[0;32m----> 1\u001b[0m avg_test_reward \u001b[38;5;241m=\u001b[39m test(num_test_episodes\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m100\u001b[39m)\n",
      "Cell \u001b[0;32mIn[35], line 20\u001b[0m, in \u001b[0;36mtest\u001b[0;34m(num_test_episodes)\u001b[0m\n\u001b[1;32m     16\u001b[0m state\u001b[38;5;241m=\u001b[39mposition_to_index(state)\n\u001b[1;32m     17\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m t \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mrange\u001b[39m(\u001b[38;5;241m1\u001b[39m, \u001b[38;5;241m100\u001b[39m):  \u001b[38;5;66;03m# Limit the number of time steps\u001b[39;00m\n\u001b[1;32m     18\u001b[0m     \u001b[38;5;66;03m# Convert state to tensor and predict action probabilities\u001b[39;00m\n\u001b[1;32m     19\u001b[0m     \u001b[38;5;66;03m#             state_tensor = torch.tensor(state, dtype=torch.float32).to(device)\u001b[39;00m\n\u001b[0;32m---> 20\u001b[0m     action_probs \u001b[38;5;241m=\u001b[39m actor\u001b[38;5;241m.\u001b[39mpredict(pd\u001b[38;5;241m.\u001b[39mDataFrame(np\u001b[38;5;241m.\u001b[39marray([state]), columns\u001b[38;5;241m=\u001b[39mcolumn_names))\n\u001b[1;32m     21\u001b[0m     \u001b[38;5;66;03m# Select action based on the highest probability\u001b[39;00m\n\u001b[1;32m     22\u001b[0m     action \u001b[38;5;241m=\u001b[39m np\u001b[38;5;241m.\u001b[39margmax(action_probs)\n",
      "File \u001b[0;32m/opt/anaconda3/envs/sinergym/lib/python3.12/site-packages/pandas/core/frame.py:827\u001b[0m, in \u001b[0;36mDataFrame.__init__\u001b[0;34m(self, data, index, columns, dtype, copy)\u001b[0m\n\u001b[1;32m    816\u001b[0m         mgr \u001b[38;5;241m=\u001b[39m dict_to_mgr(\n\u001b[1;32m    817\u001b[0m             \u001b[38;5;66;03m# error: Item \"ndarray\" of \"Union[ndarray, Series, Index]\" has no\u001b[39;00m\n\u001b[1;32m    818\u001b[0m             \u001b[38;5;66;03m# attribute \"name\"\u001b[39;00m\n\u001b[0;32m   (...)\u001b[0m\n\u001b[1;32m    824\u001b[0m             copy\u001b[38;5;241m=\u001b[39m_copy,\n\u001b[1;32m    825\u001b[0m         )\n\u001b[1;32m    826\u001b[0m     \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m--> 827\u001b[0m         mgr \u001b[38;5;241m=\u001b[39m ndarray_to_mgr(\n\u001b[1;32m    828\u001b[0m             data,\n\u001b[1;32m    829\u001b[0m             index,\n\u001b[1;32m    830\u001b[0m             columns,\n\u001b[1;32m    831\u001b[0m             dtype\u001b[38;5;241m=\u001b[39mdtype,\n\u001b[1;32m    832\u001b[0m             copy\u001b[38;5;241m=\u001b[39mcopy,\n\u001b[1;32m    833\u001b[0m             typ\u001b[38;5;241m=\u001b[39mmanager,\n\u001b[1;32m    834\u001b[0m         )\n\u001b[1;32m    836\u001b[0m \u001b[38;5;66;03m# For data is list-like, or Iterable (will consume into list)\u001b[39;00m\n\u001b[1;32m    837\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m is_list_like(data):\n",
      "File \u001b[0;32m/opt/anaconda3/envs/sinergym/lib/python3.12/site-packages/pandas/core/internals/construction.py:314\u001b[0m, in \u001b[0;36mndarray_to_mgr\u001b[0;34m(values, index, columns, dtype, copy, typ)\u001b[0m\n\u001b[1;32m    308\u001b[0m     _copy \u001b[38;5;241m=\u001b[39m (\n\u001b[1;32m    309\u001b[0m         copy_on_sanitize\n\u001b[1;32m    310\u001b[0m         \u001b[38;5;28;01mif\u001b[39;00m (dtype \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m \u001b[38;5;129;01mor\u001b[39;00m astype_is_view(values\u001b[38;5;241m.\u001b[39mdtype, dtype))\n\u001b[1;32m    311\u001b[0m         \u001b[38;5;28;01melse\u001b[39;00m \u001b[38;5;28;01mFalse\u001b[39;00m\n\u001b[1;32m    312\u001b[0m     )\n\u001b[1;32m    313\u001b[0m     values \u001b[38;5;241m=\u001b[39m np\u001b[38;5;241m.\u001b[39marray(values, copy\u001b[38;5;241m=\u001b[39m_copy)\n\u001b[0;32m--> 314\u001b[0m     values \u001b[38;5;241m=\u001b[39m _ensure_2d(values)\n\u001b[1;32m    316\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m    317\u001b[0m     \u001b[38;5;66;03m# by definition an array here\u001b[39;00m\n\u001b[1;32m    318\u001b[0m     \u001b[38;5;66;03m# the dtypes will be coerced to a single dtype\u001b[39;00m\n\u001b[1;32m    319\u001b[0m     values \u001b[38;5;241m=\u001b[39m _prep_ndarraylike(values, copy\u001b[38;5;241m=\u001b[39mcopy_on_sanitize)\n",
      "File \u001b[0;32m/opt/anaconda3/envs/sinergym/lib/python3.12/site-packages/pandas/core/internals/construction.py:592\u001b[0m, in \u001b[0;36m_ensure_2d\u001b[0;34m(values)\u001b[0m\n\u001b[1;32m    590\u001b[0m     values \u001b[38;5;241m=\u001b[39m values\u001b[38;5;241m.\u001b[39mreshape((values\u001b[38;5;241m.\u001b[39mshape[\u001b[38;5;241m0\u001b[39m], \u001b[38;5;241m1\u001b[39m))\n\u001b[1;32m    591\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m values\u001b[38;5;241m.\u001b[39mndim \u001b[38;5;241m!=\u001b[39m \u001b[38;5;241m2\u001b[39m:\n\u001b[0;32m--> 592\u001b[0m     \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mValueError\u001b[39;00m(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mMust pass 2-d input. shape=\u001b[39m\u001b[38;5;132;01m{\u001b[39;00mvalues\u001b[38;5;241m.\u001b[39mshape\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m    593\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m values\n",
      "\u001b[0;31mValueError\u001b[0m: Must pass 2-d input. shape=(1, 2, 9)"
     ]
    }
   ],
   "source": [
    "# Run the greedy evaluation from test() for 100 episodes and keep the average reward.\n",
    "# NOTE(review): the output saved with this cell is a ValueError traceback, so this run never produced a value.\n",
    "avg_test_reward = test(num_test_episodes=100)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "31340922",
   "metadata": {},
   "outputs": [],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "# Generate recent 50 interval average\n",
    "average_reward = []\n",
    "for idx in range(len(rewards)):\n",
    "    avg_list = np.empty(shape=(1,), dtype=int)\n",
    "    if idx < 5:\n",
    "        avg_list = rewards[:idx+1]\n",
    "    else:\n",
    "        avg_list = rewards[idx-4:idx+1]\n",
    "    average_reward.append(np.average(avg_list))\n",
    "plt.plot(rewards)\n",
    "plt.plot(average_reward)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9f18bae5",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "44b0354e",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "58e2db1b",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8385f8b3",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c1d27da3",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "fb4df6e4",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.9"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
