{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "406b6b96",
   "metadata": {},
   "outputs": [],
   "source": [
    "import math\n",
    "import sys\n",
    "import random\n",
    "from dataclasses import dataclass\n",
    "import time\n",
    "import argparse\n",
    "import matplotlib\n",
    "import matplotlib.pyplot as plt\n",
    "from collections import namedtuple, deque\n",
    "from itertools import count\n",
    "# from sklearn.preprocessing import StandardScaler\n",
    "import copy\n",
    "# from hybrid_q_gp_cost import HybridQWithGPCost\n",
    " # adjust if needed\n",
    "from cpo_agent_safepo_style import CPOConfig, CPOAgent\n",
    "from ActSafeAgent import ActSafeAgent, ActSafeConfig\n",
    "from safe_fqi import SafeFQI,collect_epoch_safe_fqi\n",
    "from torch.distributions.kl import kl_divergence\n",
    "\n",
    "from dataclasses import dataclass\n",
    "from typing import Tuple, Dict, Deque\n",
    "import json\n",
    "import numpy as np\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.optim as optim\n",
    "import torch.nn.functional as F\n",
    "\n",
    "# import gymnasium as gym\n",
    "import safety_gymnasium as sg\n",
    "from tqdm import trange\n",
    "# from schedules import AnnealScheduler, Anneal\n",
    "# import gpytorch\n",
    "from scipy.linalg import solve\n",
    "# from gpytorch.kernels import RBFKernel,ScaleKernel,LinearKernel\n",
    "# from sklearn.gaussian_process import GaussianProcessRegressor\n",
    "# from sklearn.gaussian_process.kernels import RBF, WhiteKernel\n",
    "from collections import namedtuple, deque\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "6cd93241",
   "metadata": {},
   "outputs": [],
   "source": [
    "safety_bound=0.3\n",
    "epsilon_start = 1.0\n",
    "epsilon_end = 0.02\n",
    "epsilon_decay_rate = 0.9985\n",
    "max_steps_per_test_episode=200\n",
    "num_episodes = 2000\n",
    "max_steps_per_episode = 200\n",
    "test_episodes = 100\n",
    "gamma = 0.99\n",
    "lr = 0.0025\n",
    "buffer_size = 50000\n",
    "buffer = deque(maxlen=buffer_size)\n",
    "batch_size = 100\n",
    "penalty=60"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "6ddfd797",
   "metadata": {},
   "outputs": [],
   "source": [
    "def combined_shape(n, shape):\n",
    "    if np.isscalar(shape):\n",
    "        return (n, shape)\n",
    "    return (n, *shape)\n",
    "\n",
    "def to_tensor(x, device):\n",
    "    if isinstance(x, np.ndarray):\n",
    "        return torch.as_tensor(x, dtype=torch.float32, device=device)\n",
    "    return torch.tensor(x, dtype=torch.float32, device=device)\n",
    "\n",
    "def flat_params(model):\n",
    "    return torch.cat([p.data.view(-1) for p in model.parameters()])\n",
    "\n",
    "def flat_grad(grads):\n",
    "    return torch.cat([g.contiguous().view(-1) for g in grads])\n",
    "\n",
    "def set_params_from_flat(model, flat):\n",
    "    idx = 0\n",
    "    for p in model.parameters():\n",
    "        n = p.numel()\n",
    "        p.data.copy_(flat[idx:idx+n].view_as(p))\n",
    "        idx += n\n",
    "\n",
    "def count_parameters(module):\n",
    "    return sum(p.numel() for p in module.parameters() if p.requires_grad)\n",
    "\n",
    "class RunningNorm:\n",
    "    \"\"\"Keeps running mean/var for feature normalization.\"\"\"\n",
    "    def __init__(self, dim, eps=1e-8):\n",
    "        self.dim = dim\n",
    "        self.mean = np.zeros(dim, dtype=np.float64)\n",
    "        self.var = np.ones(dim, dtype=np.float64)\n",
    "        self.count = eps\n",
    "        self.eps = eps\n",
    "\n",
    "    def update(self, x_np: np.ndarray):\n",
    "        x = x_np.reshape(-1, self.dim).astype(np.float64)\n",
    "        batch_mean = x.mean(axis=0)\n",
    "        batch_var = x.var(axis=0)\n",
    "        batch_count = x.shape[0]\n",
    "\n",
    "        delta = batch_mean - self.mean\n",
    "        tot_count = self.count + batch_count\n",
    "\n",
    "        new_mean = self.mean + delta * batch_count / tot_count\n",
    "        m_a = self.var * self.count\n",
    "        m_b = batch_var * batch_count\n",
    "        M2 = m_a + m_b + delta**2 * self.count * batch_count / tot_count\n",
    "        new_var = M2 / (tot_count)\n",
    "\n",
    "        self.mean = new_mean\n",
    "        self.var = np.maximum(new_var, self.eps)\n",
    "        self.count = tot_count\n",
    "\n",
    "    def normalize_torch(self, x: torch.Tensor):\n",
    "        m = torch.as_tensor(self.mean, dtype=x.dtype, device=x.device)\n",
    "        s = torch.as_tensor(self.var, dtype=x.dtype, device=x.device).sqrt()\n",
    "        return (x - m) / (s + 1e-8)\n",
    "    \n",
    "class MLP(nn.Module):\n",
    "    def __init__(self, in_dim, out_dim, hidden=(64, 64), act=nn.Tanh, out_act=None):\n",
    "        super().__init__()\n",
    "        layers = []\n",
    "        last = in_dim\n",
    "        for h in hidden:\n",
    "            layers += [nn.Linear(last, h), act()]\n",
    "            last = h\n",
    "        layers.append(nn.Linear(last, out_dim))\n",
    "        if out_act:\n",
    "            layers.append(out_act())\n",
    "        self.net = nn.Sequential(*layers)\n",
    "    def forward(self, x):\n",
    "        return self.net(x)\n",
    "\n",
    "class GaussianPolicy(nn.Module):\n",
    "    \"\"\"\n",
    "    Tanh-squashed diagonal Gaussian policy for continuous actions.\n",
    "    KL is computed in pre-tanh Gaussian space.\n",
    "    \"\"\"\n",
    "    def __init__(self, obs_dim, act_dim, hidden=(64,64), log_std_init=-1):\n",
    "        super().__init__()\n",
    "        self.mu_net = MLP(obs_dim, act_dim, hidden, act=nn.Tanh)\n",
    "        self.log_std = nn.Parameter(torch.ones(act_dim) * log_std_init)\n",
    "        with torch.no_grad():\n",
    "            self.log_std.clamp_(-5.0, 2.0)\n",
    "    def _dist(self, obs):\n",
    "        mu  = self.mu_net(obs)\n",
    "        std = torch.exp(self.log_std)\n",
    "        return mu, std\n",
    "\n",
    "    @staticmethod\n",
    "    def atanh(x, eps=1e-6):\n",
    "        return 0.5 * (torch.log1p(x + eps) - torch.log1p(-x + eps))\n",
    "\n",
    "    def log_prob_from_u(self, u, mu, std, a):\n",
    "        pre_sum = -0.5 * (((u - mu) / (std + 1e-8)) ** 2 + 2 * torch.log(std + 1e-8) + math.log(2 * math.pi))\n",
    "        logp_u = pre_sum.sum(dim=-1)\n",
    "        logdet_jac = torch.log(1 - a.pow(2) + 1e-8).sum(dim=-1)\n",
    "        return logp_u - logdet_jac\n",
    "\n",
    "    def sample(self, obs):\n",
    "        mu, std = self._dist(obs)\n",
    "        eps = torch.randn_like(mu)\n",
    "        u = mu + std * eps\n",
    "        a = torch.tanh(u)\n",
    "        logp = self.log_prob_from_u(u, mu, std, a)\n",
    "        return a, logp, u, mu, std\n",
    "\n",
    "    def log_prob(self, obs, a):\n",
    "        mu, std = self._dist(obs)\n",
    "        u = self.atanh(a)\n",
    "        return self.log_prob_from_u(u, mu, std, a)\n",
    "\n",
    "    def kl_with(self, other, obs):\n",
    "        mu0, std0 = other._dist(obs)\n",
    "        mu1, std1 = self._dist(obs)\n",
    "        kl = (torch.log(std1 + 1e-8) - torch.log(std0 + 1e-8)\n",
    "              + (std0**2 + (mu0 - mu1)**2) / (2 * (std1**2) + 1e-8) - 0.5).sum(dim=-1)\n",
    "        return kl.mean()\n",
    "\n",
    "\n",
    "    def forward(self, obs):\n",
    "        # return a Normal in pre-tanh space\n",
    "        mu, std = self._dist(obs)     # your existing helper\n",
    "        return torch.distributions.Normal(mu, std)\n",
    "    def mean_kl(self, other, obs) -> torch.Tensor:\n",
    "    # KL(self || other) averaged over batch\n",
    "    # (our kl_with computes KL(other || self), so flip the order)\n",
    "        return other.kl_with(self, obs)\n",
    "\n",
    "class ValueNet(nn.Module):\n",
    "    def __init__(self, obs_dim, hidden=(64, 64)):\n",
    "        super().__init__()\n",
    "        self.v = MLP(obs_dim, 1, hidden, act=nn.Tanh)\n",
    "    def forward(self, obs):\n",
    "        return self.v(obs).squeeze(-1)\n",
    "\n",
    "# ============================================================\n",
    "# Buffer with reward & cost GAE\n",
    "# ============================================================\n",
    "\n",
    "class GAEBuffer:\n",
    "    def __init__(self, obs_space, act_space, size, gamma=0.99, lam=0.95, gamma_c=1, lam_c=0.95, device='cpu'):\n",
    "        self.obs_buf  = np.zeros(combined_shape(size, obs_space.shape), dtype=np.float32)\n",
    "        self.act_buf  = np.zeros(combined_shape(size, act_space.shape), dtype=np.float32)\n",
    "        self.rew_buf  = np.zeros(size, dtype=np.float32)\n",
    "        self.cost_buf = np.zeros(size, dtype=np.float32)\n",
    "        self.val_buf  = np.zeros(size, dtype=np.float32)\n",
    "        self.cval_buf = np.zeros(size, dtype=np.float32)\n",
    "        self.logp_buf = np.zeros(size, dtype=np.float32)\n",
    "        self.done_buf = np.zeros(size, dtype=np.float32)\n",
    "\n",
    "        self.gamma, self.lam = gamma, lam\n",
    "        self.gamma_c, self.lam_c = gamma_c, lam_c\n",
    "        self.ptr, self.path_start_idx, self.max_size = 0, 0, size\n",
    "        self.device = device\n",
    "\n",
    "    def reset(self):\n",
    "        self.ptr = 0\n",
    "        self.path_start_idx = 0\n",
    "\n",
    "    def store(self, obs, act, rew, cost, val, cval, logp, done):\n",
    "        assert self.ptr < self.max_size\n",
    "        self.obs_buf[self.ptr]  = obs\n",
    "        self.act_buf[self.ptr]  = act\n",
    "        self.rew_buf[self.ptr]  = rew\n",
    "        self.cost_buf[self.ptr] = cost\n",
    "        self.val_buf[self.ptr]  = val\n",
    "        self.cval_buf[self.ptr] = cval\n",
    "        self.logp_buf[self.ptr] = logp\n",
    "        self.done_buf[self.ptr] = done\n",
    "        self.ptr += 1\n",
    "\n",
    "    def _gae_like(self, deltas, gamma, lam):\n",
    "        adv = np.zeros_like(deltas, dtype=np.float32)\n",
    "        gae = 0.0\n",
    "        for t in reversed(range(len(deltas))):\n",
    "            gae = deltas[t] + gamma * lam * gae\n",
    "            adv[t] = gae\n",
    "        return adv\n",
    "\n",
    "    def finish_path(self, last_val, last_cval):\n",
    "        path_slice = slice(self.path_start_idx, self.ptr)\n",
    "\n",
    "        rews  = np.append(self.rew_buf[path_slice],  last_val)\n",
    "        costs = np.append(self.cost_buf[path_slice], last_cval)\n",
    "        vals  = self.val_buf[path_slice]\n",
    "        cvals = self.cval_buf[path_slice]\n",
    "\n",
    "        deltas  = rews[:-1]  + self.gamma   * np.append(vals[1:],  last_val)  - vals\n",
    "        cdelta  = costs[:-1] + self.gamma_c * np.append(cvals[1:], last_cval) - cvals\n",
    "\n",
    "        adv_r = self._gae_like(deltas, self.gamma, self.lam)\n",
    "        adv_c = self._gae_like(cdelta,  self.gamma_c, self.lam_c)\n",
    "\n",
    "        ret_r = adv_r + vals\n",
    "        ret_c = adv_c + cvals\n",
    "\n",
    "        self.adv_r_buf = getattr(self, \"adv_r_buf\", np.zeros_like(self.rew_buf))\n",
    "        self.adv_c_buf = getattr(self, \"adv_c_buf\", np.zeros_like(self.cost_buf))\n",
    "        self.ret_r_buf = getattr(self, \"ret_r_buf\", np.zeros_like(self.rew_buf))\n",
    "        self.ret_c_buf = getattr(self, \"ret_c_buf\", np.zeros_like(self.cost_buf))\n",
    "\n",
    "        self.adv_r_buf[path_slice] = adv_r\n",
    "        self.adv_c_buf[path_slice] = adv_c\n",
    "        self.ret_r_buf[path_slice] = ret_r\n",
    "        self.ret_c_buf[path_slice] = ret_c\n",
    "\n",
    "        self.path_start_idx = self.ptr\n",
    "\n",
    "    def get(self):\n",
    "        assert self.ptr == self.max_size\n",
    "\n",
    "        adv_r = self.adv_r_buf\n",
    "        adv_r = (adv_r - adv_r.mean()) / (adv_r.std() + 1e-8)\n",
    "        adv_c = self.adv_c_buf\n",
    "        adv_c = adv_c / (adv_c.std() + 1e-8)\n",
    "        # adv_c = (adv_c - adv_c.mean()) / (adv_c.std() + 1e-8)\n",
    "        data = dict(\n",
    "            obs   = to_tensor(self.obs_buf,   self.device),\n",
    "            act   = to_tensor(self.act_buf,   self.device),\n",
    "            logp  = to_tensor(self.logp_buf,  self.device),\n",
    "            adv_r = to_tensor(adv_r,          self.device),\n",
    "            adv_c = to_tensor(adv_c,          self.device),\n",
    "            # adv_c = to_tensor(self.adv_c_buf, self.device),\n",
    "            ret_r = to_tensor(self.ret_r_buf, self.device),\n",
    "            ret_c = to_tensor(self.ret_c_buf, self.device),\n",
    "        )\n",
    "        return data\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "0a9d7dda",
   "metadata": {},
   "outputs": [],
   "source": [
    "# class hybridBuffer:\n",
    "#     def __init__(self, obs_dim, act_dim, capacity=1_000_000, seed=0):\n",
    "#         self.n = capacity\n",
    "#         rng = np.random.default_rng(seed)\n",
    "#         self.rng = rng\n",
    "#         self.ptr = 0\n",
    "#         self.size = 0\n",
    "#         self.obs      = np.zeros((capacity, obs_dim), dtype=np.float32)\n",
    "#         self.next_obs = np.zeros((capacity, obs_dim), dtype=np.float32)\n",
    "#         self.act      = np.zeros((capacity, act_dim), dtype=np.float32)\n",
    "#         self.rew      = np.zeros((capacity, 1), dtype=np.float32)\n",
    "#         self.cost     = np.zeros((capacity, 1), dtype=np.float32)\n",
    "#         self.done     = np.zeros((capacity, 1), dtype=np.float32)\n",
    "\n",
    "#     def add(self, obs, act, rew, cost, next_obs, done):\n",
    "#         i = self.ptr\n",
    "#         self.obs[i]      = obs\n",
    "#         self.act[i]      = act\n",
    "#         self.rew[i, 0]   = rew\n",
    "#         self.cost[i, 0]  = cost\n",
    "#         self.next_obs[i] = next_obs\n",
    "#         self.done[i, 0]  = float(done)\n",
    "#         self.ptr = (self.ptr + 1) % self.n\n",
    "#         self.size = min(self.size + 1, self.n)\n",
    "\n",
    "#     def get(self, batch_size=256, bias_cost_frac=0.0, cost_threshold=1e-6):\n",
    "#         if bias_cost_frac <= 0.0 or (self.cost[:self.size] <= cost_threshold).all():\n",
    "#             idx = self.rng.integers(0, self.size, size=batch_size)\n",
    "#         else:\n",
    "#             # cost-aware: draw a fraction from cost>0 and the rest uniform\n",
    "#             cost_idx = np.flatnonzero(self.cost[:self.size, 0] > cost_threshold)\n",
    "#             k = int(batch_size * bias_cost_frac)\n",
    "#             if len(cost_idx) > 0 and k > 0:\n",
    "#                 k = min(k, len(cost_idx))\n",
    "#                 idx1 = self.rng.choice(cost_idx, size=k, replace=len(cost_idx) < k)\n",
    "#                 idx2 = self.rng.integers(0, self.size, size=batch_size - k)\n",
    "#                 idx = np.concatenate([idx1, idx2])\n",
    "#             else:\n",
    "#                 idx = self.rng.integers(0, self.size, size=batch_size)\n",
    "\n",
    "#         return {\n",
    "#             \"obs\":      self.obs[idx],\n",
    "#             \"act\":      self.act[idx],\n",
    "#             \"rew\":      self.rew[idx].squeeze(-1),\n",
    "#             \"cost\":     self.cost[idx].squeeze(-1),\n",
    "#             \"next_obs\": self.next_obs[idx],\n",
    "#             \"done\":     self.done[idx].squeeze(-1),\n",
    "#         }"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "ca52589a",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "# ---------- tiny utils (self-contained; do not rely on globals) ----------\n",
    "\n",
    "def _flat_params(module: nn.Module) -> torch.Tensor:\n",
    "    return torch.cat([p.data.view(-1) for p in module.parameters()])\n",
    "\n",
    "def _set_flat_params(module: nn.Module, flat: torch.Tensor) -> None:\n",
    "    idx = 0\n",
    "    for p in module.parameters():\n",
    "        n = p.numel()\n",
    "        p.data.copy_(flat[idx:idx+n].view_as(p))\n",
    "        idx += n\n",
    "\n",
    "def _flat_grad(loss: torch.Tensor, params, retain_graph=False, create_graph=False) -> torch.Tensor:\n",
    "    grads = torch.autograd.grad(loss, params, retain_graph=retain_graph, create_graph=create_graph)\n",
    "    return torch.cat([g.contiguous().view(-1) for g in grads])\n",
    "\n",
    "def _to_tensor(x, device):\n",
    "    if isinstance(x, torch.Tensor):\n",
    "        return x.to(device)\n",
    "    x = np.asarray(x)\n",
    "    return torch.as_tensor(x, dtype=torch.float32, device=device)\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "id": "6166a393",
   "metadata": {},
   "outputs": [],
   "source": [
    "device = (\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "device = \"cpu\"\n",
    "class QNetwork(nn.Module):\n",
    "    def __init__(self, state_size, action_size, seed, fc1_units=128, fc2_units=64):\n",
    "        super(QNetwork, self).__init__()\n",
    "        self.seed = torch.manual_seed(seed)\n",
    "        self.fc1 = nn.Linear(state_size, fc1_units)\n",
    "        self.fc2 = nn.Linear(fc1_units, fc2_units)\n",
    "        self.fc3 = nn.Linear(fc2_units, action_size)\n",
    "        self.to(device)\n",
    "\n",
    "    def forward(self, state):\n",
    "        x = F.relu(self.fc1(state))\n",
    "        x = F.relu(self.fc2(x))\n",
    "        return self.fc3(x)\n",
    "    \n",
    "class ReplayBuffer:\n",
    "    def __init__(self, action_size, buffer_size, batch_size, seed):\n",
    "        self.action_size = action_size\n",
    "        self.memory = deque(maxlen=buffer_size)\n",
    "        self.batch_size = batch_size\n",
    "        self.experience = namedtuple(\"Experience\", field_names=[\"state\", \"action\", \"reward\", \"next_state\", \"done\"])\n",
    "        self.seed = random.seed(seed)\n",
    "\n",
    "    def add(self, state, action, reward, next_state, done):\n",
    "        e = self.experience(state, action, reward, next_state, done)\n",
    "        self.memory.append(e)\n",
    "\n",
    "    # def sample(self):\n",
    "    #     experiences = random.sample(self.memory, k=self.batch_size)\n",
    "\n",
    "    #     states = torch.from_numpy(np.vstack([e.state for e in experiences if e is not None])).float().to(device)\n",
    "    #     actions = torch.from_numpy(np.vstack([e.action for e in experiences if e is not None])).long().to(device)\n",
    "    #     rewards = torch.from_numpy(np.vstack([e.reward for e in experiences if e is not None])).float().to(device)\n",
    "    #     next_states = torch.from_numpy(np.vstack([e.next_state for e in experiences if e is not None])).float().to(device)\n",
    "    #     dones = torch.from_numpy(np.vstack([e.done for e in experiences if e is not None]).astype(np.uint8)).float().to(device)\n",
    "\n",
    "    #     return (states, actions, rewards, next_states, dones)\n",
    "    def sample(self, batch_size, device=\"cpu\"):\n",
    "        n = len(self.experience)\n",
    "        idx = np.random.randint(0, n, size=batch_size)\n",
    "\n",
    "        # assume storage[i] is a dict with keys below\n",
    "        def cat(key, dtype=None):\n",
    "            arr = np.stack([self.experience[i][key] for i in idx], axis=0)\n",
    "            t = torch.from_numpy(arr)\n",
    "            if dtype is not None: t = t.to(dtype)\n",
    "            # pin + non_blocking helps GPU transfer\n",
    "            if device.type == \"cuda\":\n",
    "                t = t.pin_memory().to(device, non_blocking=True)\n",
    "            else:\n",
    "                t = t.to(device)\n",
    "            return t\n",
    "\n",
    "        S  = cat(\"obs\",       torch.float32)\n",
    "        A  = cat(\"act\",       torch.float32)\n",
    "        R  = cat(\"rew\",       torch.float32).squeeze(-1)\n",
    "        # C  = cat(\"cost\",      torch.float32).squeeze(-1)\n",
    "        S2 = cat(\"next_obs\",  torch.float32)\n",
    "        D  = cat(\"done\",      torch.float32).squeeze(-1)\n",
    "\n",
    "        return S, A, R,  S2, D\n",
    "\n",
    "    def __len__(self):\n",
    "        return len(self.memory)\n",
    "    \n",
    "class DQNAgent:\n",
    "    # Initialize the DQN agent\n",
    "    def __init__(self, state_size, action_size, seed, lr):\n",
    "        self.state_size = state_size\n",
    "        self.action_size = action_size\n",
    "        self.seed = random.seed(seed)\n",
    "\n",
    "        self.qnetwork_local = QNetwork(state_size, action_size, seed).to(device)\n",
    "        self.qnetwork_target = QNetwork(state_size, action_size, seed).to(device)\n",
    "        self.optimizer = optim.Adam(self.qnetwork_local.parameters(), lr)\n",
    "\n",
    "        self.memory = ReplayBuffer(action_size, buffer_size=int(1e5), batch_size=64, seed=seed)\n",
    "        self.t_step = 0\n",
    "\n",
    "    def step(self, state, action, reward, next_state, done):\n",
    "        self.memory.add(state, action, reward, next_state, done)\n",
    "\n",
    "        self.t_step = (self.t_step + 1) % 4\n",
    "        if self.t_step == 0:\n",
    "            if len(self.memory) > 64:\n",
    "                experiences = self.memory.sample()\n",
    "                self.learn(experiences, gamma=0.99)\n",
    "\n",
    "    # Choose an action based on the current state\n",
    "    def act(self, state, eps=0.):\n",
    "        state_tensor = torch.from_numpy(state).float().unsqueeze(0).to(device)\n",
    "        \n",
    "        self.qnetwork_local.eval()\n",
    "        with torch.no_grad():\n",
    "            action_values = self.qnetwork_local(state_tensor)\n",
    "        self.qnetwork_local.train()\n",
    "\n",
    "        if np.random.random() > eps:\n",
    "            return action_values.argmax(dim=1).item()\n",
    "        else:\n",
    "            return np.random.randint(self.action_size)\n",
    "        \n",
    "    # Choose an safe action based on the current state and prediction\n",
    "    def act_safe(self, state, model, CI_para, eps=0):\n",
    "        state_tensor = torch.from_numpy(state).float().unsqueeze(0).to(device)\n",
    "        \n",
    "        self.qnetwork_local.eval()\n",
    "        with torch.no_grad():\n",
    "            action_values = self.qnetwork_local(state_tensor)\n",
    "        self.qnetwork_local.train()\n",
    "        \n",
    "        possible_action=np.ones(self.action_size)\n",
    "        for i in range(self.action_size):\n",
    "            X=np.concatenate((state, np.array(i).reshape(1, )), axis=0)\n",
    "            X_tensor=torch.from_numpy(X).float().unsqueeze(0).to(device)\n",
    "            mean, log_var = model(X_tensor)\n",
    "            ub= mean.item()+CI_para*np.sqrt(np.exp(log_var.item()))\n",
    "            if ub>=safety_bound:\n",
    "                possible_action[i]=0 \n",
    "                # action_values[0][i]=-1\n",
    "               \n",
    "        if np.random.random() > eps:\n",
    "            return action_values.argmax(dim=1).item()\n",
    "        else:\n",
    "\n",
    "            if np.sum(possible_action)==0:\n",
    "                return action_values.argmax(dim=1).item()\n",
    "            else:\n",
    "                a=np.random.choice(self.action_size,size=1,p=possible_action/np.sum(possible_action))[0]\n",
    "                return int(a)\n",
    "            # return np.random.randint(self.action_size)\n",
    "    # Learn from batch of experiences\n",
    "    def learn(self, experiences, gamma):\n",
    "        states, actions, rewards, next_states, dones = zip(*experiences)\n",
    "        states = torch.from_numpy(np.vstack(states)).float().to(device)\n",
    "        actions = torch.from_numpy(np.vstack(actions)).long().to(device)\n",
    "        rewards = torch.from_numpy(np.vstack(rewards)).float().to(device)\n",
    "        next_states = torch.from_numpy(np.vstack(next_states)).float().to(device)\n",
    "        dones = torch.from_numpy(np.vstack(dones).astype(np.uint8)).float().to(device)\n",
    "\n",
    "        Q_targets_next = self.qnetwork_target(next_states).detach().max(1)[0].unsqueeze(1)\n",
    "        Q_targets = rewards + (gamma * Q_targets_next * (1 - dones))\n",
    "\n",
    "        Q_expected = self.qnetwork_local(states).gather(1, actions)\n",
    "\n",
    "        loss = F.mse_loss(Q_expected, Q_targets)\n",
    "        self.optimizer.zero_grad()\n",
    "        loss.backward()\n",
    "        self.optimizer.step()\n",
    "\n",
    "        self.soft_update(self.qnetwork_local, self.qnetwork_target, tau=1e-3)\n",
    "\n",
    "    def soft_update(self, local_model, target_model, tau):\n",
    "        for target_param, local_param in zip(target_model.parameters(), local_model.parameters()):\n",
    "            target_param.data.copy_(tau * local_param.data + (1.0 - tau) * target_param.data)\n",
    "    \n",
    "class ProbabilisticRegressor(nn.Module):\n",
    "    def __init__(self, input_dim, hidden_dim=128,init_log_var=0.0):\n",
    "        super().__init__()\n",
    "        self.shared = nn.Sequential(\n",
    "            nn.Linear(input_dim, hidden_dim),\n",
    "            nn.ReLU()\n",
    "        )\n",
    "        self.mean_head = nn.Linear(hidden_dim, 1)\n",
    "        self.log_var_head = nn.Linear(hidden_dim, 1)  # log variance for stability\n",
    "        nn.init.constant_(self.log_var_head.bias, init_log_var)# start with σ^2 ~ e^{init_log_var}\n",
    "\n",
    "    def forward(self, x):\n",
    "        h = self.shared(x)\n",
    "        mean = self.mean_head(h)\n",
    "        log_var = self.log_var_head(h)\n",
    "        return mean, log_var  # we return log variance to keep it numerically stable\n",
    "    \n",
    "\n",
    "def gaussian_nll_loss(mean, log_var, y, weight=None):\n",
    "    # per-sample loss:\n",
    "    loss_per = 0.5 * (log_var + (y - mean) ** 2 / torch.exp(log_var))\n",
    "    if weight is not None:\n",
    "        w = weight\n",
    "        loss = (loss_per * w).sum() / (w.sum() + 1e-8)\n",
    "    else:\n",
    "        loss = loss_per.mean()\n",
    "    return loss\n",
    "\n",
    "class CostReplay:\n",
    "    def __init__(self, maxlen=200_000, device='cpu'):\n",
    "        self.mem: Deque[tuple] = deque(maxlen=maxlen)\n",
    "        self.device = device\n",
    "    def add(self, s: np.ndarray, a: np.ndarray, c: float):\n",
    "        self.mem.append( (np.asarray(s, dtype=np.float32),\n",
    "                          np.asarray(a, dtype=np.float32),\n",
    "                          float(c)) )\n",
    "    def sample(self, batch_size: int):\n",
    "        if len(self.mem) == 0: return None\n",
    "        batch = random.sample(self.mem, k=min(batch_size, len(self.mem)))\n",
    "        S = torch.as_tensor(np.stack([b[0] for b in batch]), dtype=torch.float32, device=self.device)\n",
    "        A = torch.as_tensor(np.stack([b[1] for b in batch]), dtype=torch.float32, device=self.device)\n",
    "        C = torch.as_tensor(np.stack([b[2] for b in batch]), dtype=torch.float32, device=self.device).unsqueeze(1)\n",
    "        return S, A, C\n",
    "    def __len__(self): return len(self.mem)  "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "id": "87ad6373",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "\n",
    "# class HybridAgent:\n",
    "#     def __init__(self, obs_space, act_space, device=\"cpu\"):\n",
    "#         self.device = device\n",
    "#         self.core = HybridQWithGPCost(obs_space.shape[0], act_space.shape[0], device=device)\n",
    "\n",
    "#     def update(self, data, ep_cost_mean: float, cost_limit: float, avg_ep_len: float):\n",
    "#         # Delegate to core and softly update targets\n",
    "#         self.core.update(data)\n",
    "#         self.core.soft_update_(self.core.q1, self.core.q1_t)\n",
    "#         self.core.soft_update_(self.core.q2, self.core.q2_t)\n",
    "#         return {\"updates\": 1}\n",
    "\n",
    "\n",
    "def collect_epoch_hybrid(env, agent, steps_per_epoch, device):\n",
    "    o, info = env.reset()\n",
    "    obs_l, act_l, rew_l, cost_l, next_l, done_l = [], [], [], [], [], []\n",
    "    ep_costs, ep_rewards = [], []\n",
    "    ep_ret, ep_cost, ep_len = 0.0, 0.0, 0\n",
    "    unsafe_steps, num_eps = 0, 0\n",
    "    explore_prob=0.3\n",
    "    new_explore_prob=0.05\n",
    "    for _ in range(steps_per_epoch):\n",
    "        obs_np = o.astype(np.float32)\n",
    "        if np.random.rand() < explore_prob and agent.core.global_step < agent.core._warmup:\n",
    "            a_np = env.action_space.sample()\n",
    "        \n",
    "        else:\n",
    "            if np.random.rand() < new_explore_prob: \n",
    "                a_np = env.action_space.sample()\n",
    "            else:\n",
    "                a_np = agent.core.select_action_safe(obs_np)\n",
    "\n",
    "        step_out = env.step(a_np)\n",
    "        if len(step_out) == 6:\n",
    "            o2, r, c, terminated, truncated, info = step_out\n",
    "        else:\n",
    "            o2, r, terminated, truncated, info = step_out\n",
    "            c = float(info.get('cost', 0.0))\n",
    "\n",
    "        terminal = bool(terminated)\n",
    "        trunc = bool(truncated)\n",
    "        done = terminal or trunc\n",
    "\n",
    "        obs_l.append(obs_np)\n",
    "        act_l.append(a_np.astype(np.float32))\n",
    "        rew_l.append(float(r))\n",
    "        cost_l.append(float(c))\n",
    "        next_l.append(o2.astype(np.float32))\n",
    "        done_l.append(float(done))\n",
    "\n",
    "        unsafe_steps += int(float(c) > 0.0)\n",
    "        ep_len += 1\n",
    "        ep_cost += float(c)\n",
    "        ep_ret += float(r)\n",
    "        o = o2\n",
    "\n",
    "        if done:\n",
    "            ep_costs.append(ep_cost)\n",
    "            ep_rewards.append(ep_ret)\n",
    "            num_eps += 1\n",
    "            o, info = env.reset()\n",
    "            ep_ret, ep_len, ep_cost = 0.0, 0, 0.0\n",
    "\n",
    "    data = {\n",
    "        \"obs\": np.stack(obs_l, axis=0),\n",
    "        \"act\": np.stack(act_l, axis=0),\n",
    "        \"rew\": np.array(rew_l, dtype=np.float32),\n",
    "        \"cost\": np.array(cost_l, dtype=np.float32),\n",
    "        \"next_obs\": np.stack(next_l, axis=0),\n",
    "        \"done\": np.array(done_l, dtype=np.float32),\n",
    "        \"_unsafe_steps\": int(unsafe_steps),\n",
    "        \"_episodes\": int(max(1, num_eps))\n",
    "    }\n",
    "\n",
    "    ep_cost_mean = float(np.mean(ep_costs)) if len(ep_costs) > 0 else 0.0\n",
    "    avg_ep_len = steps_per_epoch / max(1, num_eps)\n",
    "    ep_reward_mean = float(np.mean(ep_rewards)) if len(ep_rewards) > 0 else 0.0\n",
    "\n",
    "    return data, ep_cost_mean, avg_ep_len, ep_reward_mean\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "id": "6ea3115d",
   "metadata": {},
   "outputs": [],
   "source": [
    "@dataclass\n",
    "class GPQConfig:\n",
    "    # Actor / Critic\n",
    "    hidden: Tuple[int,int] = (64, 64)\n",
    "    gamma: float = 0.99\n",
    "    actor_lr: float = 3e-4\n",
    "    critic_lr: float = 3e-4\n",
    "    tau: float = 0.005                # soft target update\n",
    "    actor_updates: int = 80\n",
    "    critic_updates: int = 200\n",
    "    batch_size: int = 256\n",
    "    target_smooth_noise: float = 0.2  # optional target smoothing (set 0.0 to disable)\n",
    "    target_smooth_clip: float = 0.5\n",
    "\n",
    "    # Cost GP (neural)\n",
    "    cost_lr: float = 1e-3\n",
    "    cost_hidden: int = 128\n",
    "    cost_pos_weight: float = 10.0\n",
    "    var_floor: float = 0.05\n",
    "    ci_start: float = 1\n",
    "    ci_end: float = 0.5\n",
    "    ci_decay: float = 0.995\n",
    "    # Constraint enforcement - tuned for SafetyPointGoal2-v0\n",
    "    lambda_lr: float = 0.05       # higher learning rate for point navigation task\n",
    "    lambda_max = 10.0             # cap for strong constraint enforcement\n",
    "    # Remove old parameters that are no longer used\n",
    "    # alpha_ucb: float = 2.0         # not used in new design\n",
    "    # actor_cost_penalty: float = 0.5 # not used in new design\n",
    "    # Replay\n",
    "    replay_size: int = 500_000\n",
    "    safe_margin: float = 0.0         # hinge margin above cost_limit\n",
    "    penalty_power: float = 2.0       # 1.0=linear, 2.0=quadratic\n",
    "    clamp_ucb_max: float = 1.0       # cap UCB to [0, clamp_ucb_max]\n",
    "    use_lambda_in_critic: bool = False\n",
    "    lookahead_risk: bool = True      # also penalize next-state action risk\n",
    "    adaptive_alpha: bool = True      # scale alpha by batch stds\n",
    "\n",
    "    device: str = \"cpu\"\n",
    "\n",
    "class TransitionReplay:\n",
    "    def __init__(self, obs_dim, act_dim, maxlen=500_000, device='cpu'):\n",
    "        self.mem: Deque[tuple] = deque(maxlen=maxlen)\n",
    "        self.device = device\n",
    "        self.obs_dim = obs_dim\n",
    "        self.act_dim = act_dim\n",
    "    def add(self, s, a, r, c, s2, d):\n",
    "        self.mem.append((\n",
    "            np.asarray(s,  dtype=np.float32),\n",
    "            np.asarray(a,  dtype=np.float32),\n",
    "            float(r), float(c),\n",
    "            np.asarray(s2, dtype=np.float32),\n",
    "            float(d)\n",
    "        ))\n",
    "    def __len__(self): return len(self.mem)\n",
    "    def sample(self, batch_size: int):\n",
    "        batch_size = min(batch_size, len(self.mem))\n",
    "        idx = np.random.choice(len(self.mem), size=batch_size, replace=False)\n",
    "        S  = torch.as_tensor(np.stack([self.mem[i][0] for i in idx]), dtype=torch.float32, device=self.device)\n",
    "        A  = torch.as_tensor(np.stack([self.mem[i][1] for i in idx]), dtype=torch.float32, device=self.device)\n",
    "        R  = torch.as_tensor(np.array([self.mem[i][2] for i in idx])[:,None], dtype=torch.float32, device=self.device)\n",
    "        C  = torch.as_tensor(np.array([self.mem[i][3] for i in idx])[:,None], dtype=torch.float32, device=self.device)\n",
    "        S2 = torch.as_tensor(np.stack([self.mem[i][4] for i in idx]), dtype=torch.float32, device=self.device)\n",
    "        D  = torch.as_tensor(np.array([self.mem[i][5] for i in idx])[:,None], dtype=torch.float32, device=self.device)\n",
    "        return S, A, R, C, S2, D\n",
    "\n",
    "class QCritic(nn.Module):\n",
    "    \"\"\"Q(s,a) for continuous actions.\"\"\"\n",
    "    def __init__(self, obs_dim, act_dim, hidden=(64,64)):\n",
    "        super().__init__()\n",
    "        self.q = MLP(obs_dim + act_dim, 1, hidden, act=nn.ReLU)\n",
    "    def forward(self, s, a):\n",
    "        return self.q(torch.cat([s, a], dim=1))\n",
    "\n",
    "class GPQAgent:\n",
    "    \"\"\"\n",
    "    REDESIGNED GP-cost + Q-learning for SAFE continuous control.\n",
    "    - Cost model: learns continuous cost function with uncertainty\n",
    "    - Safe reward shaping: r' = r - penalty for constraint violations\n",
    "    - Constraint enforcement: dual variable λ with proper ascent\n",
    "    - Safe policy: ensures cost_limit is respected during training\n",
    "    \"\"\"\n",
    "    def __init__(self, obs_space, act_space, cfg: GPQConfig):\n",
    "        assert len(act_space.shape) == 1, \"Continuous Box action space expected.\"\n",
    "        self.cfg = cfg\n",
    "        self.device = cfg.device\n",
    "        print(f\"[gpq] device={self.device}\")\n",
    "\n",
    "        self.obs_dim = obs_space.shape[0]\n",
    "        self.act_dim = act_space.shape[0]\n",
    "\n",
    "        # Policy (Gaussian for exploration; we use its mean for actor update)\n",
    "        self.pi = GaussianPolicy(self.obs_dim, self.act_dim, hidden=cfg.hidden, log_std_init=-1).to(cfg.device)\n",
    "        self.pi_target = GaussianPolicy(self.obs_dim, self.act_dim, hidden=cfg.hidden, log_std_init=-1).to(cfg.device)\n",
    "        self.pi_target.load_state_dict(self.pi.state_dict())\n",
    "        self.old_pi = GaussianPolicy(self.obs_dim, self.act_dim, hidden=cfg.hidden, log_std_init=-1).to(cfg.device)\n",
    "        self.old_pi.load_state_dict(self.pi.state_dict())\n",
    "\n",
    "        # Critic + target\n",
    "        self.q = QCritic(self.obs_dim, self.act_dim, hidden=cfg.hidden).to(cfg.device)\n",
    "        self.q_target = QCritic(self.obs_dim, self.act_dim, hidden=cfg.hidden).to(cfg.device)\n",
    "        self.q_target.load_state_dict(self.q.state_dict())\n",
    "\n",
    "        # Value heads (only so your runner/GAE works; we fit them to returns it provides)\n",
    "        self.vf  = ValueNet(self.obs_dim, hidden=cfg.hidden).to(cfg.device)\n",
    "        self.cvf = ValueNet(self.obs_dim, hidden=cfg.hidden).to(cfg.device)\n",
    "        self.vf_opt  = torch.optim.Adam(self.vf.parameters(),  lr=3e-4)\n",
    "        self.cvf_opt = torch.optim.Adam(self.cvf.parameters(), lr=3e-4)\n",
    "\n",
    "        # Cost model (GP-like neural net)\n",
    "        self.cost_model = ProbabilisticRegressor(self.obs_dim + self.act_dim, hidden_dim=cfg.cost_hidden).to(cfg.device)\n",
    "        self.cost_opt   = torch.optim.Adam(self.cost_model.parameters(), lr=cfg.cost_lr)\n",
    "\n",
    "        # Normalizers for (s,a) before cost model\n",
    "        self.obs_norm = RunningNorm(self.obs_dim)\n",
    "        self.act_norm = RunningNorm(self.act_dim)\n",
    "\n",
    "        # Opts\n",
    "        self.actor_opt  = torch.optim.Adam(self.pi.parameters(), lr=cfg.actor_lr)\n",
    "        self.critic_opt = torch.optim.Adam(self.q.parameters(),  lr=cfg.critic_lr)\n",
    "\n",
    "        # Replay\n",
    "        self.replay = TransitionReplay(self.obs_dim, self.act_dim, maxlen=cfg.replay_size, device=cfg.device)\n",
    "\n",
    "        # CI schedule\n",
    "        self.ci = cfg.ci_start\n",
    "        self.lambda_c = torch.tensor(1.0, device=self.device, dtype=torch.float32)  # dual variable for cost\n",
    "        self.cost_limit = 5.0  # Match training cost limit\n",
    "\n",
    "    # ---------- plumbing hooks for the runner ----------\n",
    "    def _alpha_schedule(self):\n",
    "        # No longer needed in new design - constraint enforcement via dual variable\n",
    "        return 0.0\n",
    "    \n",
    "    def observe_transition(self, s, a, r, c, s2, done):\n",
    "        # keep normalizers fresh for cost model inputs\n",
    "        self.obs_norm.update(np.asarray(s, dtype=np.float32).reshape(1,-1))\n",
    "        self.act_norm.update(np.asarray(a, dtype=np.float32).reshape(1,-1))\n",
    "        self.replay.add(s, a, r, c, s2, done)\n",
    "\n",
    "    def _ucb_cost(self, S, A):\n",
    "        # normalize inputs to cost model\n",
    "        S_n = self.obs_norm.normalize_torch(S)\n",
    "        A_n = self.act_norm.normalize_torch(A)\n",
    "        X = torch.cat([S_n, A_n], dim=1)\n",
    "        mean, log_var = self.cost_model(X)\n",
    "        var = torch.exp(log_var).clamp_min(1e-6)\n",
    "        sigma = torch.sqrt(var)\n",
    "        UCB = (mean + self.ci * sigma).clamp(0.0, 1.0)\n",
    "        return UCB, mean.clamp(0.0, 1.0)\n",
    "\n",
    "    def _soft_update(self, net, target):\n",
    "        with torch.no_grad():\n",
    "            for p, tp in zip(net.parameters(), target.parameters()):\n",
    "                tp.mul_(1.0 - self.cfg.tau).add_(self.cfg.tau * p)\n",
    "\n",
    "    def update(self, data: Dict, ep_cost_mean: float, cost_limit: float, avg_ep_len: float):\n",
    "        \"\"\"One epoch of updates using whatever is in replay + (optionally) fit vf/cvf to provided returns.\"\"\"\n",
    "        # Snapshot policy BEFORE any updates for KL logging\n",
    "        self.old_pi.load_state_dict(self.pi.state_dict())\n",
    "        B = self.cfg.batch_size\n",
    "        updates_done = 0\n",
    "        self.cost_limit = float(cost_limit)\n",
    "        # ---------- critic + actor steps ----------\n",
    "        if len(self.replay) >= max(2*B, 10000):  # warmup: require at least 10k transitions\n",
    "            for _ in range(self.cfg.critic_updates):\n",
    "                S, A, R, C, S2, D = self.replay.sample(B)\n",
    "\n",
    "                # No reward shaping: critic target uses raw reward only\n",
    "                with torch.no_grad():\n",
    "                    mu2, _ = self.pi_target._dist(S2)\n",
    "                    A2 = torch.tanh(mu2)\n",
    "                    Q_targ = self.q_target(S2, A2)\n",
    "                    Y = R + (1.0 - D) * self.cfg.gamma * Q_targ\n",
    "                # --- risk for current and (optionally) next ---\n",
    "                    \n",
    "                # UCB_now, _ = self._ucb_cost(S, A)\n",
    "\n",
    "                # with torch.no_grad():\n",
    "                #     mu2, _ = self.pi_target._dist(S2)\n",
    "                #     A2     = torch.tanh(mu2)\n",
    "                #     UCB_next, _ = self._ucb_cost(S2, A2)\n",
    "\n",
    "                # # Potential-based shaping: encourage moves to safer states\n",
    "                # # NOTE: mask terminals so we don't add future risk at episode ends\n",
    "                # delta_ucb = UCB_now - (1.0 - D) * self.cfg.gamma * UCB_next\n",
    "\n",
    "                # # Scale gently; NO hinge, NO square here (keep it smooth)\n",
    "                # alpha = self._alpha_schedule()  # see helper below\n",
    "                # R_safe = R + alpha * delta_ucb.detach()\n",
    "\n",
    "                # # (Optional but recommended) limit extremes to avoid exploding TD targets\n",
    "                # R_safe = torch.clamp(R_safe, -5.0, 5.0)\n",
    "\n",
    "                # with torch.no_grad():\n",
    "                #     Q_targ = self.q_target(S2, A2)\n",
    "\n",
    "                # Y = R_safe + (1.0 - D) * self.cfg.gamma * Q_targ\n",
    "\n",
    "\n",
    "                # critic loss\n",
    "                Q = self.q(S, A)\n",
    "                critic_loss = F.mse_loss(Q, Y)\n",
    "                self.critic_opt.zero_grad()\n",
    "                critic_loss.backward()\n",
    "                self.critic_opt.step()\n",
    "\n",
    "                # Actor loss: maximize Q(s, pi(s)) with hinge constraint penalty per step\n",
    "                mu, _ = self.pi._dist(S)\n",
    "                A_det = torch.tanh(mu)\n",
    "                q_value = self.q(S, A_det).mean()\n",
    "                \n",
    "                # Predicted per-step hazard in [0,1]\n",
    "                _, mean_cost = self._ucb_cost(S, A_det)\n",
    "                # Per-step budget threshold\n",
    "                step_limit = torch.as_tensor(self.cost_limit / max(1.0, float(avg_ep_len)), device=S.device, dtype=mean_cost.dtype)\n",
    "                hinge = F.relu(mean_cost - step_limit)\n",
    "                \n",
    "                # Actor objective: maximize reward Q, penalize only above per-step budget\n",
    "                act_loss = -q_value + self.lambda_c * hinge.mean()\n",
    "                \n",
    "                # Small entropy bonus for exploration\n",
    "                dist = self.pi(S)\n",
    "                act_loss = act_loss - 1e-3 * dist.entropy().mean()\n",
    "                \n",
    "                self.actor_opt.zero_grad()\n",
    "                act_loss.backward()\n",
    "                self.actor_opt.step()\n",
    "\n",
    "                # targets\n",
    "                self._soft_update(self.q,  self.q_target)\n",
    "                self._soft_update(self.pi, self.pi_target)\n",
    "                self.total_updates = getattr(self, \"total_updates\", 0) + 1.\n",
    "                updates_done += 1\n",
    "\n",
    "                #     _, mean_c = self._ucb_cost(S, A)\n",
    "\n",
    "                #     actor_loss = - q_sa + self.lambda_c.detach() * mean_c.mean() * self.cfg.actor_cost_penalty\n",
    "                #     self.actor_opt.zero_grad()\n",
    "                #     actor_loss.backward()\n",
    "                #     self.actor_opt.step()\n",
    "\n",
    "                # (duplicate soft-update block removed)\n",
    "\n",
    "            # ---------- cost model steps ----------\n",
    "            for _ in range(self.cfg.critic_updates // 2):\n",
    "                S, A, _, C, _, _ = self.replay.sample(B)\n",
    "                # re-use normalization:\n",
    "                S_n = self.obs_norm.normalize_torch(S)\n",
    "                A_n = self.act_norm.normalize_torch(A)\n",
    "                X = torch.cat([S_n, A_n], dim=1)\n",
    "                # Cost model training - optimized for SafetyPointGoal2-v0\n",
    "                mean, log_var = self.cost_model(X)            # mean unconstrained; log_var free\n",
    "                nll = 0.5 * ((C - mean)**2 / torch.exp(log_var) + log_var)\n",
    "                loss = nll.mean()\n",
    "                # Total loss\n",
    "\n",
    "                self.cost_opt.zero_grad()\n",
    "                loss.backward()\n",
    "                self.cost_opt.step()\n",
    "\n",
    "                # logit, log_var = self.cost_model(X)\n",
    "                # pos_w = torch.tensor([self.cfg.cost_pos_weight], device=logit.device)\n",
    "                # bce = F.binary_cross_entropy_with_logits(logit, C, pos_weight=pos_w)\n",
    "                # var_reg = 1e-4 * torch.exp(log_var).mean()     # discourage huge σ instead of encouraging it\n",
    "                # loss = bce + var_reg\n",
    "                # self.cost_opt.zero_grad()\n",
    "                # loss.backward()\n",
    "                # self.cost_opt.step()\n",
    "     \n",
    "\n",
    "            # decay CI\n",
    "            self.ci = max(self.cfg.ci_end, self.ci * self.cfg.ci_decay)\n",
    "\n",
    "        # ---------- fit vf / cvf to returns from GAE buffer (optional; keeps runner happy) ----------\n",
    "        if 'ret_r' in data:\n",
    "            for _ in range(40):\n",
    "                v_loss = F.mse_loss(self.vf(data['obs']), data['ret_r'])\n",
    "                self.vf_opt.zero_grad(); v_loss.backward(); self.vf_opt.step()\n",
    "        if 'ret_c' in data:\n",
    "            for _ in range(20):\n",
    "                c_loss = F.mse_loss(self.cvf(data['obs']), data['ret_c'])\n",
    "                self.cvf_opt.zero_grad(); c_loss.backward(); self.cvf_opt.step()\n",
    "\n",
    "        # Compute KL wrt pre-update snapshot\n",
    "        with torch.no_grad():\n",
    "            try:\n",
    "                kl = self.pi.kl_with(self.old_pi, data['obs']).item()\n",
    "            except Exception:\n",
    "                kl = None\n",
    "        # Dual ascent: λ ← [λ + η ( empirical_cost − budget )]_+\n",
    "\n",
    "        # SafetyPointGoal2-v0 specific dual ascent\n",
    "        constraint_violation = float(ep_cost_mean) - float(cost_limit)\n",
    "        \n",
    "        if constraint_violation > 0:  # Constraint violated\n",
    "            # More aggressive update for point navigation task\n",
    "            self.lambda_c.add_(self.cfg.lambda_lr * (constraint_violation/ max(1.0, float(cost_limit))))\n",
    "            self.lambda_c.clamp_(0.0, self.cfg.lambda_max)\n",
    "            # Log constraint violation with more detail\n",
    "            print(f\"[gpq] SafetyPointGoal1: cost={ep_cost_mean:.2f} > limit={cost_limit:.2f}, λ={self.lambda_c.item():.4f}\")\n",
    "        else:  # Constraint satisfied\n",
    "            # Decay λ more slowly for point navigation (maintain safety)\n",
    "            self.lambda_c.mul_(0.995)\n",
    "            \n",
    "        # Clamp λ to reasonable range for point navigation\n",
    "        self.lambda_c.clamp_(0.0, self.cfg.lambda_max)\n",
    "        self.epoch_idx = getattr(self, \"epoch_idx\", 0) + 1\n",
    "\n",
    "        return {\"updates\": updates_done, \"ci\": float(self.ci), \"λ\": float(self.lambda_c.item())}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "id": "561758fc",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "\n",
    "\n",
    "# =========================\n",
    "# Runner\n",
    "# =========================\n",
    "\n",
    "def make_env(env_id: str):\n",
    "    \"\"\"\n",
    "    Safety-Gymnasium step API:\n",
    "    obs, reward, cost, terminated, truncated, info\n",
    "    \"\"\"\n",
    "    return sg.make(env_id)\n",
    "\n",
    "\n",
    "def collect_epoch(env, agent, buf, steps_per_epoch, device):\n",
    "    o, info = env.reset()\n",
    "    ep_costs = []\n",
    "    ep_rewards = []\n",
    "    ep_ret, ep_len, ep_cost = 0.0, 0, 0.0\n",
    "    unsafe_steps = 0\n",
    "    explore_prob=0.3\n",
    "    for t in range(steps_per_epoch):\n",
    "        obs_t = o.astype(np.float32)\n",
    "        obs_t_torch = to_tensor(obs_t, device).unsqueeze(0)\n",
    "        if hasattr(agent, \"select_action_safe\"):\n",
    "            if np.random.rand() < explore_prob and agent.global_step < agent._warmup:\n",
    "                a_np = env.action_space.sample()\n",
    "            else:\n",
    "                a_np = agent.select_action_safe(obs_t, n_samples=256)\n",
    "        # NOTE: we keep no_grad() here for speed; refinement internally re-enables grad safely.\n",
    "        else:\n",
    "            with torch.no_grad():\n",
    "                a, logp, *_ = agent.pi.sample(obs_t_torch)\n",
    "                # if hasattr(agent, \"_ucb_cost\") and hasattr(agent, \"cost_limit\"):\n",
    "                #     UCB, _ = agent._ucb_cost(obs_t_torch, a)  # (1,1)\n",
    "                #     if float(UCB.item()) > float(agent.cost_limit)+0.1: #lossen UCB\n",
    "                #         a_np_try = a.squeeze(0).cpu().numpy()\n",
    "                #         for s in (0.5, 0.25, 0.1):\n",
    "                #             a_shrunk = np.tanh(s * np.arctanh(np.clip(a_np_try, -0.999, 0.999)))\n",
    "                #             U, _ = agent._ucb_cost(obs_t_torch, torch.as_tensor(a_shrunk, device=obs_t_torch.device).unsqueeze(0))\n",
    "                #         if float(U.item()) <= float(agent.cost_limit)+0.1: #lossen UCB\n",
    "                #             a = torch.as_tensor(a_shrunk, device=obs_t_torch.device).unsqueeze(0)\n",
    "                #             break\n",
    "                if hasattr(agent, \"_ucb_cost\"):\n",
    "                    UCB, _ = agent._ucb_cost(obs_t_torch, a)\n",
    "                    # th_hi = max(0.12 * float(getattr(agent, \"ci\", 1.0)), 0.06)\n",
    "                    # th_lo = max(0.06 * float(getattr(agent, \"ci\", 1.0)), 0.03)\n",
    "                    th_hi = 0.60\n",
    "                    th_lo = 0.40\n",
    "                    if float(UCB.item()) > th_hi:\n",
    "                        # a_try = a.squeeze(0).cpu().numpy()\n",
    "                        a_try =a.squeeze(0).cpu().numpy()\n",
    "                        accepted = False\n",
    "                        for s in (0.9, 0.8, 0.7):\n",
    "                            a_shrunk = np.tanh(s * np.arctanh(np.clip(a_try, -0.999, 0.999)))\n",
    "                            U, _ = agent._ucb_cost(\n",
    "                                obs_t_torch,\n",
    "                                torch.as_tensor(a_shrunk, device=obs_t_torch.device).unsqueeze(0)\n",
    "                            )\n",
    "                            if float(U.item()) <= th_lo:\n",
    "                                a = torch.as_tensor(a_shrunk, device=obs_t_torch.device).unsqueeze(0)\n",
    "                                accepted = True\n",
    "                                break\n",
    "                        #     U, _ = agent._ucb_cost(obs_t_torch, a_try)\n",
    "                        #     over = torch.nn.functional.relu(U - th_lo)\n",
    "                        #     if over.max() <= 1e-4: break\n",
    "                        #     g = torch.autograd.grad(over.mean(), a_try)[0]\n",
    "                        #     a_try = (a_try - getattr(agent.cfg, \"shield_lr\", 0.05) * g).clamp(-0.999, 0.999).detach().requires_grad_(True)\n",
    "                        # a_try = a_try.detach()\n",
    "                        # (if not accepted, keep original a)\n",
    "\n",
    "                v  = agent.vf(obs_t_torch).item()\n",
    "                if hasattr(agent, \"vc\"):\n",
    "                    cv = agent.vc(obs_t_torch).item()\n",
    "                elif hasattr(agent, \"cvf\"):\n",
    "                    cv = agent.cvf(obs_t_torch).item()\n",
    "                else:\n",
    "                    cv = 0.0\n",
    "\n",
    "                a_np = a.squeeze(0).cpu().numpy()\n",
    "        # a_np = a.squeeze(0).cpu().numpy()\n",
    "\n",
    "        step_out = env.step(a_np)\n",
    "        if len(step_out) == 6:\n",
    "            o2, r, c, terminated, truncated, info = step_out\n",
    "        else:\n",
    "            o2, r, terminated, truncated, info = step_out\n",
    "            c = float(info.get('cost', 0.0))\n",
    "        # if c > 0.0:\n",
    "        #     unsafe_steps += 1\n",
    "        terminal = bool(terminated)         # true terminal (collision/goal)\n",
    "        trunc    = bool(truncated)          # time-limit cutoff\n",
    "        done     = terminal or trunc\n",
    "\n",
    "        # Count “unsafe” (assuming costs are non-negative floats)\n",
    "        unsafe_steps += int(float(c) > 0.0)\n",
    "        ep_len += 1\n",
    "        ep_cost += float(c)\n",
    "        ep_ret += float(r)\n",
    "        if hasattr(agent, \"observe_transition\"):           \n",
    "            agent.observe_transition(obs_t, a_np, float(r), float(c), o2.astype(np.float32), done)\n",
    "        # elif hasattr(agent, \"observe_cost\"):\n",
    "        #     agent.observe_cost(obs_t, a_np, float(c))\n",
    "\n",
    "        if hasattr(buf, \"add\"):\n",
    "            buf.add(obs_t, a_np, float(r), float(c), o2, float(done))\n",
    "        else:\n",
    "            buf.store(obs_t, a_np, float(r), float(c), v, cv, float(logp.item()), float(done))\n",
    "        o = o2\n",
    "\n",
    "        # if done or (t == steps_per_epoch - 1):\n",
    "        if done or (t == steps_per_epoch - 1):\n",
    "            if terminal:\n",
    "                # true terminal → no bootstrap\n",
    "                last_v, last_cv = 0.0, 0.0\n",
    "            else:\n",
    "                # time-limit truncation or epoch boundary → MUST bootstrap\n",
    "                with torch.no_grad():\n",
    "                    last_v  = agent.vf(to_tensor(o, device).unsqueeze(0)).item()\n",
    "                    last_cv = (\n",
    "                        agent.vc(to_tensor(o, device).unsqueeze(0)).item()\n",
    "                        if hasattr(agent, \"vc\") else\n",
    "                        (agent.cvf(to_tensor(o, device).unsqueeze(0)).item() if hasattr(agent, \"cvf\") else 0.0)\n",
    "                    )\n",
    "            if hasattr(buf, \"finish_path\"):\n",
    "                buf.finish_path(last_v, last_cv)\n",
    "            ep_costs.append(float(ep_cost))\n",
    "            ep_rewards.append(float(ep_ret))\n",
    "            o, info = env.reset()\n",
    "            ep_ret, ep_len, ep_cost = 0.0, 0, 0.0\n",
    "\n",
    "    data = buf.get()\n",
    "    # if \"adv_r\" in data:\n",
    "    #     ar = data[\"adv_r\"]; data[\"adv_r\"] = (ar - ar.mean()) / (ar.std() + 1e-8)\n",
    "    # # optional: mean-center cost adv, but do NOT divide by std\n",
    "    # if \"adv_c\" in data:\n",
    "    #     ac = data[\"adv_c\"]; data[\"adv_c\"] = ac / (ac.std() + 1e-8) #- ac.mean() # notice\n",
    "    ep_cost_mean = float(np.mean(ep_costs)) if len(ep_costs) > 0 else 0.0\n",
    "    num_eps = max(1, len(ep_costs))\n",
    "    avg_ep_len = steps_per_epoch / num_eps\n",
    "    ep_reward_mean=float(np.mean(ep_rewards)) if len(ep_rewards) > 0 else 0.0\n",
    "    # expose for pretty prints\n",
    "    data['_unsafe_steps'] = int(unsafe_steps)\n",
    "    data['_episodes'] = int(num_eps)\n",
    "\n",
    "    buf.reset()\n",
    "    \n",
    "    return data, ep_cost_mean, avg_ep_len,ep_reward_mean\n",
    "    # data['_unsafe_steps'] = unsafe_steps\n",
    "    # data['_episodes'] = max(1, len(ep_costs))\n",
    "    # return data, ep_cost_mean\n",
    "\n",
    "def train(\n",
    "    algo: str = \"gp_shield\",\n",
    "    env_id: str = \"SafetyPointGoal1-v0\",\n",
    "    steps_per_epoch: int = 2048,\n",
    "    epochs: int = 20,\n",
    "    device: str =  (\"cuda\" if torch.cuda.is_available() else \"cpu\"),\n",
    "    seed: int = 0,\n",
    "    cost_limit: float = 5.0\n",
    "    ):\n",
    "    torch.manual_seed(seed)\n",
    "    np.random.seed(seed)\n",
    "\n",
    "    env = sg.make(env_id)\n",
    "    obs_space, act_space = env.observation_space, env.action_space\n",
    "    obs_dim   = int(obs_space.shape[0])\n",
    "    act_dim   = int(act_space.shape[0])\n",
    "    if algo.lower() == \"actsafe\":\n",
    "        a_low  = float(np.min(env.action_space.low))\n",
    "        a_high = float(np.max(env.action_space.high))\n",
    "\n",
    "        cfg = ActSafeConfig(\n",
    "            action_low=a_low,\n",
    "            action_high=a_high,\n",
    "            shield_eps_risk=cost_limit\n",
    "        )\n",
    "        agent = ActSafeAgent(env.observation_space, env.action_space, cfg, device=device)\n",
    "        buf = GAEBuffer(obs_space, act_space, size=steps_per_epoch,\n",
    "                       device=device)\n",
    "    elif algo.lower() == \"cpo\":\n",
    "        # cfg  = CPOConfig(device=device, seed=seed)\n",
    "        # agent = CPOAgent(obs_space, act_space, cfg)\n",
    "        buf = GAEBuffer(obs_space, act_space, size=steps_per_epoch, device=device, gamma_c=0.99)      \n",
    "        cfg = CPOConfig(steps_per_epoch=20000,gamma_c=0.99,cost_limit=cost_limit)\n",
    "        agent = CPOAgent(env.observation_space, env.action_space, cfg, device=device)\n",
    "    # elif algo.lower() in [\"gp_shield\", \"gpshield\", \"gp\"]:\n",
    "    #     cfg  = GPCostShieldConfig(device=device)\n",
    "    #     agent = GPCostShieldedAgent(obs_space, act_space, cfg)\n",
    "    #     buf = GAEBuffer(obs_space, act_space, size=steps_per_epoch,\n",
    "    #                     gamma=0.99, lam=0.95, gamma_c=0.99, lam_c=0.95, device=device)\n",
    "        \n",
    "    # elif algo.lower() in [\"gpq\", \"gp_q\", \"gpq_safe\"]:\n",
    "    #     cfg = GPQConfig(device=device)\n",
    "    #     agent = GPQAgent(obs_space, act_space, cfg)\n",
    "    #     buf = GAEBuffer(obs_space, act_space, size=steps_per_epoch,\n",
    "    #                     gamma=cfg.gamma, lam=0.95, gamma_c=0.99, lam_c=0.95, device=device)\n",
    "\n",
    "    # elif algo.lower() in {\"hybrid_q_gp_cost\", \"hybrid\"}:\n",
    "    #     # Use the small adapter that also handles target updates\n",
    "    #     agent = HybridAgent(obs_space, act_space, device=device)\n",
    "    #     buf = None  # not used by hybrid collector\n",
    "    \n",
    "    elif algo.lower() in {\"safe_fqi\"}:\n",
    "        agent = SafeFQI(\n",
    "        obs_dim=obs_dim,\n",
    "        act_dim=act_dim,\n",
    "        device=device     # per-step threshold; anneals to thresh_final\n",
    "        )\n",
    "        buf = None  # not used by hybrid collector  \n",
    "    else:\n",
    "        env.close()\n",
    "        raise ValueError(\"Unknown algo. Use 'cpo' or 'gp_shield'.\")\n",
    "\n",
    "    # Choose collection function\n",
    "    # if algo.lower() in {\"hybrid_q_gp_cost\", \"hybrid\"}:\n",
    "    #     coll_fn = lambda: collect_epoch_hybrid(env, agent, steps_per_epoch, device)\n",
    "    if algo.lower() in {\"safe_fqi\"}:\n",
    "        coll_fn = lambda: collect_epoch_safe_fqi(env, agent, steps_per_epoch, device)\n",
    "    else:\n",
    "        coll_fn = lambda: collect_epoch(env, agent, buf, steps_per_epoch, device)\n",
    "\n",
    "    print(f\"Training {algo} on {env_id} for {epochs} epochs...\")\n",
    "    ep_cost_curve = []\n",
    "    ep_reward_curve=[]\n",
    "\n",
    "\n",
    "    for ep in range(1, epochs + 1):\n",
    "        data, ep_cost_mean, avg_ep_len, ep_reward_mean = coll_fn()\n",
    "\n",
    "        #info = agent.update(data, ep_cost_mean=ep_cost_mean, cost_limit=cost_limit)\n",
    "        if algo.lower() == \"cpo\":\n",
    "            info = agent.update(data, ep_cost_mean=ep_cost_mean, avg_ep_len=avg_ep_len)\n",
    "        elif algo.lower() == \"actsafe\":\n",
    "            info = agent.update(data, ep_cost_mean=ep_cost_mean, avg_ep_len=avg_ep_len)\n",
    "        # elif algo.lower() in {\"hybrid_q_gp_cost\", \"hybrid\"}:\n",
    "        #     info = agent.update(data, ep_cost_mean=ep_cost_mean, cost_limit=cost_limit, avg_ep_len=avg_ep_len)\n",
    "        elif  algo.lower() in {\"safe_fqi\"}:\n",
    "            info = agent.update(data, ep_cost_mean=ep_cost_mean, cost_limit=cost_limit, avg_ep_len=avg_ep_len)\n",
    "        else:\n",
    "            info = agent.update(data, ep_cost_mean=ep_cost_mean, cost_limit=cost_limit, avg_ep_len=avg_ep_len)\n",
    "        kl = None\n",
    "        print(f\"[{algo}] Epoch {ep:03d} | ep_cost_mean={ep_cost_mean:.2f} | avg_ep_len={avg_ep_len:.2f}\"\n",
    "        f\"| ep_reward_mean={ep_reward_mean:.2f} \"\n",
    "        f\"| unsafe_steps={int(data.get('_unsafe_steps', 0))} over ~{int(data.get('_episodes', 1))} eps \"\n",
    "        f\"| info={info} | KL={kl}\")\n",
    "        # try:\n",
    "        #     old_pi = getattr(agent, \"old_pi\", None) or getattr(agent, \"pi_old\", None)\n",
    "        #     if old_pi is not None:\n",
    "        #         kl = agent.pi.kl_with(old_pi, data['obs']).item()   # KL(old || new)\n",
    "        # except Exception:\n",
    "        #     kl = None\n",
    "        # print(\n",
    "        #     f\"[{algo}] Epoch {ep:03d} | ep_cost_mean={ep_cost_mean:.2f} | avg_ep_len={avg_ep_len:.2f}\"\n",
    "        #     f\"| unsafe_steps={int(data.get('_unsafe_steps', 0))} over ~{int(data.get('_episodes', 1))} eps \"\n",
    "        #     f\"| info={info} | KL={kl}\"\n",
    "        # )\n",
    "        if algo.lower() in {\"safe_fqi\"}:\n",
    "            print(f\"| penalty={float(agent.penalty)} \")\n",
    "            print(f\"| global_step={float(agent.global_step)} \")\n",
    "\n",
    "        ep_cost_curve.append(ep_cost_mean)\n",
    "        ep_reward_curve.append(ep_reward_mean)\n",
    "\n",
    "    env.close()\n",
    "    return ep_cost_curve,ep_reward_curve\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "id": "614f4cce",
   "metadata": {},
   "outputs": [],
   "source": [
    "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "device=\"cpu\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f25e4603",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "\n",
    "p = argparse.ArgumentParser()\n",
    "p.add_argument(\"--algo\", type=str, default=\"cpo\")\n",
    "p.add_argument(\"--env-id\", type=str, default=\"SafetyPointGoal1-v0\")\n",
    "p.add_argument(\"--steps-per-epoch\", type=int, default=4096)\n",
    "p.add_argument(\"--epochs\", type=int, default=200)\n",
    "p.add_argument(\"--device\", type=str, default=device)\n",
    "p.add_argument(\"--seed\", type=int, default=0)\n",
    "p.add_argument(\"--cost-limit\", type=float, default=0.02)\n",
    "\n",
    "    # ← this line is the key:\n",
    "args_CPO, _ = p.parse_known_args()\n",
    "\n",
    "cost_curve,rew_curve=train(\n",
    "    algo=args_CPO.algo,\n",
    "    env_id=args_CPO.env_id,\n",
    "    steps_per_epoch=args_CPO.steps_per_epoch,\n",
    "    epochs=args_CPO.epochs,\n",
    "    device=args_CPO.device,\n",
    "    seed=args_CPO.seed,\n",
    "    cost_limit=args_CPO.cost_limit,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "33383264",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "# pgp = argparse.ArgumentParser()\n",
    "# pgp.add_argument(\"--algo\", type=str, default=\"gpq\")\n",
    "# pgp.add_argument(\"--env-id\", type=str, default=\"SafetyPointGoal2-v0\")\n",
    "# pgp.add_argument(\"--steps-per-epoch\", type=int, default=10000)\n",
    "# pgp.add_argument(\"--epochs\", type=int, default=100)\n",
    "# pgp.add_argument(\"--device\", type=str, default=device)\n",
    "# pgp.add_argument(\"--seed\", type=int, default=0)\n",
    "# pgp.add_argument(\"--cost-limit\", type=float, default=5)\n",
    "\n",
    "# # ← this line is the key:\n",
    "# args_GP, _ = pgp.parse_known_args()\n",
    "# GP_cost_curve, GP_rew_curve=train(\n",
    "#     algo=args_GP.algo,\n",
    "#     env_id=args_GP.env_id,\n",
    "#     steps_per_epoch=args_GP.steps_per_epoch,\n",
    "#     epochs=args_GP.epochs,\n",
    "#     device=args_GP.device,\n",
    "#     seed=args_GP.seed,\n",
    "#     cost_limit=args_GP.cost_limit,\n",
    "# )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "1d211781",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Training actsafe on SafetyPointGoal1-v0 for 200 epochs...\n",
      "[actsafe] Epoch 001 | ep_cost_mean=13.00 | avg_ep_len=819.20| ep_reward_mean=-1.39 | unsafe_steps=65 over ~5 eps | info={'pi_loss': -0.01353541575372219, 'kl': 0.006831116043031216, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 13.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 002 | ep_cost_mean=56.00 | avg_ep_len=819.20| ep_reward_mean=-0.16 | unsafe_steps=280 over ~5 eps | info={'pi_loss': -0.015557128004729748, 'kl': 0.012048015370965004, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 56.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 003 | ep_cost_mean=77.80 | avg_ep_len=819.20| ep_reward_mean=0.48 | unsafe_steps=389 over ~5 eps | info={'early_stop_iter': 67, 'pi_loss': -0.01830282434821129, 'kl': 0.01501636952161789, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 77.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 004 | ep_cost_mean=102.40 | avg_ep_len=819.20| ep_reward_mean=1.13 | unsafe_steps=512 over ~5 eps | info={'pi_loss': -0.01768798753619194, 'kl': 0.009949378669261932, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 102.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 005 | ep_cost_mean=146.60 | avg_ep_len=819.20| ep_reward_mean=0.60 | unsafe_steps=733 over ~5 eps | info={'early_stop_iter': 5, 'pi_loss': -0.004663689061999321, 'kl': 0.018613427877426147, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 146.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 006 | ep_cost_mean=249.80 | avg_ep_len=819.20| ep_reward_mean=0.55 | unsafe_steps=1249 over ~5 eps | info={'early_stop_iter': 5, 'pi_loss': -0.0038141985423862934, 'kl': 0.01848619431257248, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 249.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 007 | ep_cost_mean=55.40 | avg_ep_len=819.20| ep_reward_mean=0.27 | unsafe_steps=277 over ~5 eps | info={'early_stop_iter': 20, 'pi_loss': -0.01650378666818142, 'kl': 0.015366067178547382, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 55.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 008 | ep_cost_mean=26.80 | avg_ep_len=819.20| ep_reward_mean=1.80 | unsafe_steps=134 over ~5 eps | info={'early_stop_iter': 38, 'pi_loss': -0.014349562115967274, 'kl': 0.015004065819084644, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 26.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 009 | ep_cost_mean=85.00 | avg_ep_len=819.20| ep_reward_mean=2.59 | unsafe_steps=425 over ~5 eps | info={'early_stop_iter': 5, 'pi_loss': -0.0036812820471823215, 'kl': 0.01740248315036297, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 85.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 010 | ep_cost_mean=67.20 | avg_ep_len=819.20| ep_reward_mean=3.70 | unsafe_steps=336 over ~5 eps | info={'pi_loss': -0.01799873635172844, 'kl': 0.009328708052635193, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 67.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 011 | ep_cost_mean=77.80 | avg_ep_len=819.20| ep_reward_mean=3.38 | unsafe_steps=389 over ~5 eps | info={'pi_loss': -0.018995076417922974, 'kl': 0.009369941428303719, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 77.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 012 | ep_cost_mean=60.60 | avg_ep_len=819.20| ep_reward_mean=4.72 | unsafe_steps=303 over ~5 eps | info={'pi_loss': -0.02092408388853073, 'kl': 0.010755263268947601, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 60.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 013 | ep_cost_mean=226.00 | avg_ep_len=819.20| ep_reward_mean=3.79 | unsafe_steps=1130 over ~5 eps | info={'pi_loss': -0.02108084037899971, 'kl': 0.011507686227560043, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 226.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 014 | ep_cost_mean=48.40 | avg_ep_len=819.20| ep_reward_mean=5.60 | unsafe_steps=242 over ~5 eps | info={'pi_loss': -0.0225768331438303, 'kl': 0.01444169506430626, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 48.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 015 | ep_cost_mean=27.40 | avg_ep_len=819.20| ep_reward_mean=5.65 | unsafe_steps=137 over ~5 eps | info={'early_stop_iter': 49, 'pi_loss': -0.0190323144197464, 'kl': 0.015116221271455288, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 27.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 016 | ep_cost_mean=123.20 | avg_ep_len=819.20| ep_reward_mean=5.97 | unsafe_steps=616 over ~5 eps | info={'pi_loss': -0.02324409782886505, 'kl': 0.012100821360945702, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 123.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 017 | ep_cost_mean=85.20 | avg_ep_len=819.20| ep_reward_mean=6.19 | unsafe_steps=426 over ~5 eps | info={'pi_loss': -0.023491796106100082, 'kl': 0.012294599786400795, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 85.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 018 | ep_cost_mean=56.60 | avg_ep_len=819.20| ep_reward_mean=8.17 | unsafe_steps=283 over ~5 eps | info={'pi_loss': -0.02215294912457466, 'kl': 0.010736501775681973, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 56.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 019 | ep_cost_mean=72.20 | avg_ep_len=819.20| ep_reward_mean=5.86 | unsafe_steps=361 over ~5 eps | info={'pi_loss': -0.02481495775282383, 'kl': 0.010598059743642807, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 72.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 020 | ep_cost_mean=88.40 | avg_ep_len=819.20| ep_reward_mean=7.44 | unsafe_steps=442 over ~5 eps | info={'pi_loss': -0.021691521629691124, 'kl': 0.01300814002752304, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 88.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 021 | ep_cost_mean=64.60 | avg_ep_len=819.20| ep_reward_mean=11.07 | unsafe_steps=323 over ~5 eps | info={'pi_loss': -0.0257831159979105, 'kl': 0.010528745129704475, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 64.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 022 | ep_cost_mean=58.20 | avg_ep_len=819.20| ep_reward_mean=11.32 | unsafe_steps=291 over ~5 eps | info={'pi_loss': -0.025159282609820366, 'kl': 0.012429684400558472, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 58.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 023 | ep_cost_mean=23.20 | avg_ep_len=819.20| ep_reward_mean=10.21 | unsafe_steps=116 over ~5 eps | info={'early_stop_iter': 12, 'pi_loss': -0.01398303173482418, 'kl': 0.015189746394753456, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 23.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 024 | ep_cost_mean=48.60 | avg_ep_len=819.20| ep_reward_mean=12.02 | unsafe_steps=243 over ~5 eps | info={'pi_loss': -0.0272386334836483, 'kl': 0.012643421068787575, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 48.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 025 | ep_cost_mean=95.00 | avg_ep_len=819.20| ep_reward_mean=10.38 | unsafe_steps=475 over ~5 eps | info={'early_stop_iter': 14, 'pi_loss': -0.01260822732001543, 'kl': 0.015730861574411392, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 95.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 026 | ep_cost_mean=29.40 | avg_ep_len=819.20| ep_reward_mean=11.79 | unsafe_steps=147 over ~5 eps | info={'pi_loss': -0.02249673567712307, 'kl': 0.005891467910259962, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 29.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 027 | ep_cost_mean=90.80 | avg_ep_len=819.20| ep_reward_mean=12.85 | unsafe_steps=454 over ~5 eps | info={'pi_loss': -0.028346700593829155, 'kl': 0.012528279796242714, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 90.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 028 | ep_cost_mean=54.20 | avg_ep_len=819.20| ep_reward_mean=12.19 | unsafe_steps=271 over ~5 eps | info={'early_stop_iter': 73, 'pi_loss': -0.026945363730192184, 'kl': 0.0150460135191679, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 54.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 029 | ep_cost_mean=64.20 | avg_ep_len=819.20| ep_reward_mean=13.67 | unsafe_steps=321 over ~5 eps | info={'pi_loss': -0.025422783568501472, 'kl': 0.014371940866112709, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 64.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 030 | ep_cost_mean=55.20 | avg_ep_len=819.20| ep_reward_mean=14.03 | unsafe_steps=276 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': -0.0008091289782896638, 'kl': 0.01791057176887989, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 55.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 031 | ep_cost_mean=10.40 | avg_ep_len=819.20| ep_reward_mean=15.13 | unsafe_steps=52 over ~5 eps | info={'pi_loss': -0.025860311463475227, 'kl': 0.00572032667696476, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 10.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 032 | ep_cost_mean=45.20 | avg_ep_len=819.20| ep_reward_mean=15.43 | unsafe_steps=226 over ~5 eps | info={'pi_loss': -0.02759869582951069, 'kl': 0.01229636650532484, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 45.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 033 | ep_cost_mean=88.40 | avg_ep_len=819.20| ep_reward_mean=16.20 | unsafe_steps=442 over ~5 eps | info={'pi_loss': -0.026390455663204193, 'kl': 0.010059881024062634, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 88.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 034 | ep_cost_mean=25.00 | avg_ep_len=819.20| ep_reward_mean=14.07 | unsafe_steps=125 over ~5 eps | info={'early_stop_iter': 62, 'pi_loss': -0.026065897196531296, 'kl': 0.01592756062746048, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 25.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 035 | ep_cost_mean=45.40 | avg_ep_len=819.20| ep_reward_mean=17.13 | unsafe_steps=227 over ~5 eps | info={'pi_loss': -0.028205687180161476, 'kl': 0.0130855031311512, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 45.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 036 | ep_cost_mean=54.40 | avg_ep_len=819.20| ep_reward_mean=15.49 | unsafe_steps=272 over ~5 eps | info={'pi_loss': -0.02679949253797531, 'kl': 0.011350417509675026, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 54.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 037 | ep_cost_mean=30.60 | avg_ep_len=819.20| ep_reward_mean=16.42 | unsafe_steps=153 over ~5 eps | info={'pi_loss': -0.026007335633039474, 'kl': 0.010969117283821106, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 30.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 038 | ep_cost_mean=58.40 | avg_ep_len=819.20| ep_reward_mean=15.63 | unsafe_steps=292 over ~5 eps | info={'pi_loss': -0.02834152802824974, 'kl': 0.012248892337083817, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 58.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 039 | ep_cost_mean=40.40 | avg_ep_len=819.20| ep_reward_mean=15.08 | unsafe_steps=202 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': -0.00020594673696905375, 'kl': 0.015552524477243423, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 40.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 040 | ep_cost_mean=82.40 | avg_ep_len=819.20| ep_reward_mean=17.25 | unsafe_steps=412 over ~5 eps | info={'pi_loss': -0.02727692760527134, 'kl': 0.007312150672078133, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 82.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 041 | ep_cost_mean=29.00 | avg_ep_len=819.20| ep_reward_mean=16.87 | unsafe_steps=145 over ~5 eps | info={'pi_loss': -0.02797985076904297, 'kl': 0.011153734289109707, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 29.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 042 | ep_cost_mean=60.80 | avg_ep_len=819.20| ep_reward_mean=15.79 | unsafe_steps=304 over ~5 eps | info={'pi_loss': -0.030026858672499657, 'kl': 0.014073196798563004, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 60.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 043 | ep_cost_mean=48.00 | avg_ep_len=819.20| ep_reward_mean=17.88 | unsafe_steps=240 over ~5 eps | info={'early_stop_iter': 63, 'pi_loss': -0.027180049568414688, 'kl': 0.015812309458851814, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 48.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 044 | ep_cost_mean=67.20 | avg_ep_len=819.20| ep_reward_mean=14.32 | unsafe_steps=336 over ~5 eps | info={'early_stop_iter': 24, 'pi_loss': -0.016050387173891068, 'kl': 0.015111198648810387, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 67.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 045 | ep_cost_mean=57.80 | avg_ep_len=819.20| ep_reward_mean=17.03 | unsafe_steps=289 over ~5 eps | info={'early_stop_iter': 19, 'pi_loss': -0.01490546390414238, 'kl': 0.01595369540154934, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 57.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 046 | ep_cost_mean=57.60 | avg_ep_len=819.20| ep_reward_mean=16.74 | unsafe_steps=288 over ~5 eps | info={'pi_loss': -0.02921856939792633, 'kl': 0.011635306291282177, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 57.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 047 | ep_cost_mean=50.00 | avg_ep_len=819.20| ep_reward_mean=17.05 | unsafe_steps=250 over ~5 eps | info={'pi_loss': -0.029093869030475616, 'kl': 0.013905622065067291, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 50.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 048 | ep_cost_mean=53.00 | avg_ep_len=819.20| ep_reward_mean=14.76 | unsafe_steps=265 over ~5 eps | info={'pi_loss': -0.02719675377011299, 'kl': 0.007501211948692799, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 53.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 049 | ep_cost_mean=43.40 | avg_ep_len=819.20| ep_reward_mean=17.67 | unsafe_steps=217 over ~5 eps | info={'pi_loss': -0.02850453555583954, 'kl': 0.011519583873450756, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 43.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 050 | ep_cost_mean=67.40 | avg_ep_len=819.20| ep_reward_mean=19.25 | unsafe_steps=337 over ~5 eps | info={'early_stop_iter': 4, 'pi_loss': -0.0037694713100790977, 'kl': 0.016110165044665337, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 67.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 051 | ep_cost_mean=32.80 | avg_ep_len=819.20| ep_reward_mean=16.19 | unsafe_steps=164 over ~5 eps | info={'pi_loss': -0.026198729872703552, 'kl': 0.009497490711510181, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 32.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 052 | ep_cost_mean=27.40 | avg_ep_len=819.20| ep_reward_mean=17.14 | unsafe_steps=137 over ~5 eps | info={'pi_loss': -0.028734812512993813, 'kl': 0.013787226751446724, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 27.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 053 | ep_cost_mean=55.40 | avg_ep_len=819.20| ep_reward_mean=17.67 | unsafe_steps=277 over ~5 eps | info={'pi_loss': -0.0311066135764122, 'kl': 0.014469906687736511, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 55.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 054 | ep_cost_mean=64.40 | avg_ep_len=819.20| ep_reward_mean=18.31 | unsafe_steps=322 over ~5 eps | info={'early_stop_iter': 68, 'pi_loss': -0.026613343507051468, 'kl': 0.015108796767890453, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 64.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 055 | ep_cost_mean=43.80 | avg_ep_len=819.20| ep_reward_mean=18.68 | unsafe_steps=219 over ~5 eps | info={'early_stop_iter': 25, 'pi_loss': -0.019119711592793465, 'kl': 0.015308460220694542, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 43.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 056 | ep_cost_mean=50.80 | avg_ep_len=819.20| ep_reward_mean=17.91 | unsafe_steps=254 over ~5 eps | info={'pi_loss': -0.029157942160964012, 'kl': 0.012053010053932667, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 50.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 057 | ep_cost_mean=67.80 | avg_ep_len=819.20| ep_reward_mean=18.86 | unsafe_steps=339 over ~5 eps | info={'early_stop_iter': 18, 'pi_loss': -0.014944544062018394, 'kl': 0.016220612451434135, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 67.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 058 | ep_cost_mean=50.20 | avg_ep_len=819.20| ep_reward_mean=18.42 | unsafe_steps=251 over ~5 eps | info={'early_stop_iter': 60, 'pi_loss': -0.025505471974611282, 'kl': 0.015708474442362785, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 50.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 059 | ep_cost_mean=17.80 | avg_ep_len=819.20| ep_reward_mean=19.06 | unsafe_steps=89 over ~5 eps | info={'pi_loss': -0.028436509892344475, 'kl': 0.013533118180930614, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 17.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 060 | ep_cost_mean=37.40 | avg_ep_len=819.20| ep_reward_mean=18.66 | unsafe_steps=187 over ~5 eps | info={'pi_loss': -0.02631106600165367, 'kl': 0.013010094873607159, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 37.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 061 | ep_cost_mean=31.00 | avg_ep_len=819.20| ep_reward_mean=17.82 | unsafe_steps=155 over ~5 eps | info={'pi_loss': -0.03010990098118782, 'kl': 0.012657257728278637, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 31.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 062 | ep_cost_mean=35.80 | avg_ep_len=819.20| ep_reward_mean=18.44 | unsafe_steps=179 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': 0.0018821952398866415, 'kl': 0.016674257814884186, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 35.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 063 | ep_cost_mean=38.60 | avg_ep_len=819.20| ep_reward_mean=19.22 | unsafe_steps=193 over ~5 eps | info={'early_stop_iter': 48, 'pi_loss': -0.026461161673069, 'kl': 0.015102587640285492, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 38.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 064 | ep_cost_mean=45.00 | avg_ep_len=819.20| ep_reward_mean=18.42 | unsafe_steps=225 over ~5 eps | info={'pi_loss': -0.02721846103668213, 'kl': 0.011326917447149754, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 45.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 065 | ep_cost_mean=43.40 | avg_ep_len=819.20| ep_reward_mean=19.20 | unsafe_steps=217 over ~5 eps | info={'early_stop_iter': 73, 'pi_loss': -0.027872629463672638, 'kl': 0.015231463126838207, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 43.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 066 | ep_cost_mean=31.00 | avg_ep_len=819.20| ep_reward_mean=19.76 | unsafe_steps=155 over ~5 eps | info={'early_stop_iter': 51, 'pi_loss': -0.02455519698560238, 'kl': 0.015256116166710854, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 31.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 067 | ep_cost_mean=53.20 | avg_ep_len=819.20| ep_reward_mean=19.93 | unsafe_steps=266 over ~5 eps | info={'pi_loss': -0.027256421744823456, 'kl': 0.012731319293379784, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 53.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 068 | ep_cost_mean=61.60 | avg_ep_len=819.20| ep_reward_mean=19.02 | unsafe_steps=308 over ~5 eps | info={'pi_loss': -0.02956516295671463, 'kl': 0.011057807132601738, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 61.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 069 | ep_cost_mean=20.60 | avg_ep_len=819.20| ep_reward_mean=19.81 | unsafe_steps=103 over ~5 eps | info={'early_stop_iter': 75, 'pi_loss': -0.028607789427042007, 'kl': 0.015806956216692924, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 20.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 070 | ep_cost_mean=50.20 | avg_ep_len=819.20| ep_reward_mean=18.95 | unsafe_steps=251 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': -0.0017210027435794473, 'kl': 0.015326118096709251, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 50.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 071 | ep_cost_mean=28.60 | avg_ep_len=819.20| ep_reward_mean=20.28 | unsafe_steps=143 over ~5 eps | info={'pi_loss': -0.02452489174902439, 'kl': 0.013300434686243534, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 28.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 072 | ep_cost_mean=25.80 | avg_ep_len=819.20| ep_reward_mean=19.63 | unsafe_steps=129 over ~5 eps | info={'early_stop_iter': 62, 'pi_loss': -0.024848025292158127, 'kl': 0.015043641440570354, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 25.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 073 | ep_cost_mean=35.40 | avg_ep_len=819.20| ep_reward_mean=18.51 | unsafe_steps=177 over ~5 eps | info={'early_stop_iter': 30, 'pi_loss': -0.020192719995975494, 'kl': 0.015090662986040115, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 35.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 074 | ep_cost_mean=32.20 | avg_ep_len=819.20| ep_reward_mean=19.36 | unsafe_steps=161 over ~5 eps | info={'pi_loss': -0.03172915801405907, 'kl': 0.01145363599061966, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 32.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 075 | ep_cost_mean=38.40 | avg_ep_len=819.20| ep_reward_mean=20.18 | unsafe_steps=192 over ~5 eps | info={'pi_loss': -0.03414049372076988, 'kl': 0.011538347229361534, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 38.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 076 | ep_cost_mean=33.80 | avg_ep_len=819.20| ep_reward_mean=18.92 | unsafe_steps=169 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': -0.00018578104209154844, 'kl': 0.01615677960216999, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 33.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 077 | ep_cost_mean=60.20 | avg_ep_len=819.20| ep_reward_mean=19.25 | unsafe_steps=301 over ~5 eps | info={'early_stop_iter': 45, 'pi_loss': -0.024318058043718338, 'kl': 0.015060830861330032, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 60.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 078 | ep_cost_mean=63.60 | avg_ep_len=819.20| ep_reward_mean=20.32 | unsafe_steps=318 over ~5 eps | info={'early_stop_iter': 17, 'pi_loss': -0.01578327640891075, 'kl': 0.015562162734568119, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 63.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 079 | ep_cost_mean=47.00 | avg_ep_len=819.20| ep_reward_mean=20.52 | unsafe_steps=235 over ~5 eps | info={'pi_loss': -0.0295074712485075, 'kl': 0.010851321741938591, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 47.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 080 | ep_cost_mean=69.20 | avg_ep_len=819.20| ep_reward_mean=19.78 | unsafe_steps=346 over ~5 eps | info={'early_stop_iter': 22, 'pi_loss': -0.017253518104553223, 'kl': 0.0154804652556777, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 69.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 081 | ep_cost_mean=23.60 | avg_ep_len=819.20| ep_reward_mean=19.83 | unsafe_steps=118 over ~5 eps | info={'pi_loss': -0.02611253410577774, 'kl': 0.012741105630993843, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 23.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 082 | ep_cost_mean=49.40 | avg_ep_len=819.20| ep_reward_mean=19.94 | unsafe_steps=247 over ~5 eps | info={'early_stop_iter': 63, 'pi_loss': -0.024132627993822098, 'kl': 0.015069722197949886, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 49.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 083 | ep_cost_mean=34.80 | avg_ep_len=819.20| ep_reward_mean=19.16 | unsafe_steps=174 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': 0.001186187844723463, 'kl': 0.02008458785712719, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 34.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 084 | ep_cost_mean=60.60 | avg_ep_len=819.20| ep_reward_mean=18.87 | unsafe_steps=303 over ~5 eps | info={'early_stop_iter': 38, 'pi_loss': -0.024224651977419853, 'kl': 0.015639765188097954, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 60.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 085 | ep_cost_mean=34.40 | avg_ep_len=819.20| ep_reward_mean=20.39 | unsafe_steps=172 over ~5 eps | info={'early_stop_iter': 34, 'pi_loss': -0.023989107459783554, 'kl': 0.015012013725936413, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 34.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 086 | ep_cost_mean=57.20 | avg_ep_len=819.20| ep_reward_mean=20.80 | unsafe_steps=286 over ~5 eps | info={'early_stop_iter': 57, 'pi_loss': -0.01876465603709221, 'kl': 0.015290986746549606, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 57.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 087 | ep_cost_mean=51.00 | avg_ep_len=819.20| ep_reward_mean=20.42 | unsafe_steps=255 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': -0.0002033277414739132, 'kl': 0.019980423152446747, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 51.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 088 | ep_cost_mean=64.20 | avg_ep_len=819.20| ep_reward_mean=20.26 | unsafe_steps=321 over ~5 eps | info={'pi_loss': -0.02624211274087429, 'kl': 0.011964423581957817, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 64.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 089 | ep_cost_mean=44.60 | avg_ep_len=819.20| ep_reward_mean=19.86 | unsafe_steps=223 over ~5 eps | info={'early_stop_iter': 12, 'pi_loss': -0.011898265220224857, 'kl': 0.015163768082857132, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 44.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 090 | ep_cost_mean=80.00 | avg_ep_len=819.20| ep_reward_mean=19.00 | unsafe_steps=400 over ~5 eps | info={'early_stop_iter': 77, 'pi_loss': -0.027237998321652412, 'kl': 0.015037208795547485, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 80.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 091 | ep_cost_mean=27.40 | avg_ep_len=819.20| ep_reward_mean=20.55 | unsafe_steps=137 over ~5 eps | info={'early_stop_iter': 16, 'pi_loss': -0.013812728226184845, 'kl': 0.015038291923701763, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 27.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 092 | ep_cost_mean=66.80 | avg_ep_len=819.20| ep_reward_mean=20.06 | unsafe_steps=334 over ~5 eps | info={'early_stop_iter': 69, 'pi_loss': -0.027462245896458626, 'kl': 0.01515415869653225, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 66.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 093 | ep_cost_mean=45.60 | avg_ep_len=819.20| ep_reward_mean=21.29 | unsafe_steps=228 over ~5 eps | info={'early_stop_iter': 40, 'pi_loss': -0.020853925496339798, 'kl': 0.015108082443475723, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 45.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 094 | ep_cost_mean=37.80 | avg_ep_len=819.20| ep_reward_mean=20.23 | unsafe_steps=189 over ~5 eps | info={'early_stop_iter': 15, 'pi_loss': -0.0148446224629879, 'kl': 0.015861876308918, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 37.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 095 | ep_cost_mean=44.00 | avg_ep_len=819.20| ep_reward_mean=20.24 | unsafe_steps=220 over ~5 eps | info={'early_stop_iter': 38, 'pi_loss': -0.022012677043676376, 'kl': 0.015097379684448242, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 44.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 096 | ep_cost_mean=40.00 | avg_ep_len=819.20| ep_reward_mean=20.78 | unsafe_steps=200 over ~5 eps | info={'early_stop_iter': 20, 'pi_loss': -0.016548164188861847, 'kl': 0.017689473927021027, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 40.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 097 | ep_cost_mean=39.60 | avg_ep_len=819.20| ep_reward_mean=19.83 | unsafe_steps=198 over ~5 eps | info={'pi_loss': -0.028769519180059433, 'kl': 0.012846710160374641, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 39.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 098 | ep_cost_mean=22.80 | avg_ep_len=819.20| ep_reward_mean=20.41 | unsafe_steps=114 over ~5 eps | info={'pi_loss': -0.025690287351608276, 'kl': 0.013132091611623764, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 22.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 099 | ep_cost_mean=45.00 | avg_ep_len=819.20| ep_reward_mean=20.28 | unsafe_steps=225 over ~5 eps | info={'early_stop_iter': 34, 'pi_loss': -0.022363632917404175, 'kl': 0.015155122615396976, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 45.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 100 | ep_cost_mean=69.20 | avg_ep_len=819.20| ep_reward_mean=20.46 | unsafe_steps=346 over ~5 eps | info={'early_stop_iter': 35, 'pi_loss': -0.021298743784427643, 'kl': 0.016128480434417725, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 69.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 101 | ep_cost_mean=27.20 | avg_ep_len=819.20| ep_reward_mean=20.98 | unsafe_steps=136 over ~5 eps | info={'early_stop_iter': 30, 'pi_loss': -0.02159249782562256, 'kl': 0.015216287225484848, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 27.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 102 | ep_cost_mean=75.60 | avg_ep_len=819.20| ep_reward_mean=20.85 | unsafe_steps=378 over ~5 eps | info={'early_stop_iter': 71, 'pi_loss': -0.030114086344838142, 'kl': 0.015674620866775513, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 75.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 103 | ep_cost_mean=54.80 | avg_ep_len=819.20| ep_reward_mean=20.54 | unsafe_steps=274 over ~5 eps | info={'early_stop_iter': 52, 'pi_loss': -0.02561287395656109, 'kl': 0.015047764405608177, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 54.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 104 | ep_cost_mean=58.60 | avg_ep_len=819.20| ep_reward_mean=19.73 | unsafe_steps=293 over ~5 eps | info={'pi_loss': -0.02903672680258751, 'kl': 0.013331032358109951, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 58.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 105 | ep_cost_mean=64.20 | avg_ep_len=819.20| ep_reward_mean=20.74 | unsafe_steps=321 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': -0.0015633944422006607, 'kl': 0.01575634628534317, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 64.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 106 | ep_cost_mean=46.00 | avg_ep_len=819.20| ep_reward_mean=20.14 | unsafe_steps=230 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': -0.00044372607953846455, 'kl': 0.017721636220812798, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 46.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 107 | ep_cost_mean=36.20 | avg_ep_len=819.20| ep_reward_mean=20.49 | unsafe_steps=181 over ~5 eps | info={'early_stop_iter': 13, 'pi_loss': -0.009245875291526318, 'kl': 0.015515723265707493, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 36.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 108 | ep_cost_mean=37.80 | avg_ep_len=819.20| ep_reward_mean=18.86 | unsafe_steps=189 over ~5 eps | info={'pi_loss': -0.031685128808021545, 'kl': 0.009794900193810463, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 37.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 109 | ep_cost_mean=83.60 | avg_ep_len=819.20| ep_reward_mean=20.16 | unsafe_steps=418 over ~5 eps | info={'early_stop_iter': 61, 'pi_loss': -0.025910422205924988, 'kl': 0.015347464941442013, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 83.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 110 | ep_cost_mean=64.20 | avg_ep_len=819.20| ep_reward_mean=20.36 | unsafe_steps=321 over ~5 eps | info={'early_stop_iter': 43, 'pi_loss': -0.024990182369947433, 'kl': 0.015844423323869705, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 64.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 111 | ep_cost_mean=60.00 | avg_ep_len=819.20| ep_reward_mean=21.67 | unsafe_steps=300 over ~5 eps | info={'early_stop_iter': 36, 'pi_loss': -0.022261595353484154, 'kl': 0.015006671659648418, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 60.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 112 | ep_cost_mean=37.80 | avg_ep_len=819.20| ep_reward_mean=19.81 | unsafe_steps=189 over ~5 eps | info={'early_stop_iter': 25, 'pi_loss': -0.02003771811723709, 'kl': 0.015405933372676373, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 37.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 113 | ep_cost_mean=38.40 | avg_ep_len=819.20| ep_reward_mean=19.52 | unsafe_steps=192 over ~5 eps | info={'pi_loss': -0.029824737459421158, 'kl': 0.014560220763087273, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 38.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 114 | ep_cost_mean=48.40 | avg_ep_len=819.20| ep_reward_mean=20.77 | unsafe_steps=242 over ~5 eps | info={'early_stop_iter': 18, 'pi_loss': -0.013240072876214981, 'kl': 0.01500765047967434, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 48.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 115 | ep_cost_mean=34.00 | avg_ep_len=819.20| ep_reward_mean=20.09 | unsafe_steps=170 over ~5 eps | info={'early_stop_iter': 7, 'pi_loss': -0.005389055237174034, 'kl': 0.015642588958144188, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 34.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 116 | ep_cost_mean=45.60 | avg_ep_len=819.20| ep_reward_mean=21.69 | unsafe_steps=228 over ~5 eps | info={'early_stop_iter': 18, 'pi_loss': -0.01665542833507061, 'kl': 0.015239153057336807, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 45.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 117 | ep_cost_mean=21.20 | avg_ep_len=819.20| ep_reward_mean=20.59 | unsafe_steps=106 over ~5 eps | info={'early_stop_iter': 71, 'pi_loss': -0.02869117446243763, 'kl': 0.015601221472024918, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 21.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 118 | ep_cost_mean=66.00 | avg_ep_len=819.20| ep_reward_mean=21.15 | unsafe_steps=330 over ~5 eps | info={'early_stop_iter': 46, 'pi_loss': -0.021873855963349342, 'kl': 0.01606757566332817, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 66.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 119 | ep_cost_mean=38.00 | avg_ep_len=819.20| ep_reward_mean=18.61 | unsafe_steps=190 over ~5 eps | info={'pi_loss': -0.027177805081009865, 'kl': 0.008496840484440327, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 38.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 120 | ep_cost_mean=38.80 | avg_ep_len=819.20| ep_reward_mean=19.65 | unsafe_steps=194 over ~5 eps | info={'pi_loss': -0.02771090902388096, 'kl': 0.013484463095664978, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 38.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 121 | ep_cost_mean=43.80 | avg_ep_len=819.20| ep_reward_mean=19.98 | unsafe_steps=219 over ~5 eps | info={'early_stop_iter': 23, 'pi_loss': -0.016405180096626282, 'kl': 0.01505274698138237, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 43.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 122 | ep_cost_mean=54.00 | avg_ep_len=819.20| ep_reward_mean=21.00 | unsafe_steps=270 over ~5 eps | info={'pi_loss': -0.02856973372399807, 'kl': 0.010945357382297516, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 54.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 123 | ep_cost_mean=52.60 | avg_ep_len=819.20| ep_reward_mean=21.32 | unsafe_steps=263 over ~5 eps | info={'early_stop_iter': 17, 'pi_loss': -0.015136557631194592, 'kl': 0.016139207407832146, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 52.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 124 | ep_cost_mean=37.00 | avg_ep_len=819.20| ep_reward_mean=20.83 | unsafe_steps=185 over ~5 eps | info={'early_stop_iter': 47, 'pi_loss': -0.027995338663458824, 'kl': 0.015573287382721901, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 37.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 125 | ep_cost_mean=51.60 | avg_ep_len=819.20| ep_reward_mean=18.98 | unsafe_steps=258 over ~5 eps | info={'early_stop_iter': 9, 'pi_loss': -0.0075701442547142506, 'kl': 0.015227217227220535, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 51.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 126 | ep_cost_mean=45.60 | avg_ep_len=819.20| ep_reward_mean=19.88 | unsafe_steps=228 over ~5 eps | info={'early_stop_iter': 7, 'pi_loss': -0.005639359820634127, 'kl': 0.01521652564406395, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 45.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 127 | ep_cost_mean=36.00 | avg_ep_len=819.20| ep_reward_mean=19.80 | unsafe_steps=180 over ~5 eps | info={'early_stop_iter': 19, 'pi_loss': -0.015099354088306427, 'kl': 0.015195946209132671, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 36.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 128 | ep_cost_mean=31.80 | avg_ep_len=819.20| ep_reward_mean=21.34 | unsafe_steps=159 over ~5 eps | info={'early_stop_iter': 17, 'pi_loss': -0.013315809890627861, 'kl': 0.016279464587569237, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 31.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 129 | ep_cost_mean=55.00 | avg_ep_len=819.20| ep_reward_mean=20.65 | unsafe_steps=275 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': -0.0011373264715075493, 'kl': 0.01748182810842991, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 55.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 130 | ep_cost_mean=48.40 | avg_ep_len=819.20| ep_reward_mean=20.73 | unsafe_steps=242 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': -0.0003425751347094774, 'kl': 0.015167027711868286, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 48.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 131 | ep_cost_mean=35.00 | avg_ep_len=819.20| ep_reward_mean=21.23 | unsafe_steps=175 over ~5 eps | info={'early_stop_iter': 40, 'pi_loss': -0.02096141129732132, 'kl': 0.015134048648178577, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 35.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 132 | ep_cost_mean=24.20 | avg_ep_len=819.20| ep_reward_mean=19.49 | unsafe_steps=121 over ~5 eps | info={'pi_loss': -0.026163296774029732, 'kl': 0.01124389935284853, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 24.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 133 | ep_cost_mean=27.60 | avg_ep_len=819.20| ep_reward_mean=21.10 | unsafe_steps=138 over ~5 eps | info={'early_stop_iter': 45, 'pi_loss': -0.02071787789463997, 'kl': 0.015128478407859802, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 27.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 134 | ep_cost_mean=32.20 | avg_ep_len=819.20| ep_reward_mean=20.51 | unsafe_steps=161 over ~5 eps | info={'early_stop_iter': 7, 'pi_loss': -0.006378335878252983, 'kl': 0.015478558838367462, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 32.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 135 | ep_cost_mean=27.40 | avg_ep_len=819.20| ep_reward_mean=20.31 | unsafe_steps=137 over ~5 eps | info={'early_stop_iter': 14, 'pi_loss': -0.014116448350250721, 'kl': 0.016249975189566612, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 27.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 136 | ep_cost_mean=37.20 | avg_ep_len=819.20| ep_reward_mean=20.99 | unsafe_steps=186 over ~5 eps | info={'pi_loss': -0.027757462114095688, 'kl': 0.013759864494204521, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 37.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 137 | ep_cost_mean=35.00 | avg_ep_len=819.20| ep_reward_mean=20.63 | unsafe_steps=175 over ~5 eps | info={'early_stop_iter': 26, 'pi_loss': -0.017235560342669487, 'kl': 0.015639059245586395, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 35.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 138 | ep_cost_mean=47.20 | avg_ep_len=819.20| ep_reward_mean=20.61 | unsafe_steps=236 over ~5 eps | info={'early_stop_iter': 52, 'pi_loss': -0.0225793719291687, 'kl': 0.015770403668284416, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 47.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 139 | ep_cost_mean=67.40 | avg_ep_len=819.20| ep_reward_mean=21.20 | unsafe_steps=337 over ~5 eps | info={'early_stop_iter': 15, 'pi_loss': -0.0148091409355402, 'kl': 0.015941113233566284, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 67.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 140 | ep_cost_mean=33.80 | avg_ep_len=819.20| ep_reward_mean=18.69 | unsafe_steps=169 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': 0.003187794703990221, 'kl': 0.019783444702625275, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 33.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 141 | ep_cost_mean=51.20 | avg_ep_len=819.20| ep_reward_mean=20.20 | unsafe_steps=256 over ~5 eps | info={'early_stop_iter': 2, 'pi_loss': 0.0043325647711753845, 'kl': 0.02305096574127674, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 51.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 142 | ep_cost_mean=45.20 | avg_ep_len=819.20| ep_reward_mean=18.90 | unsafe_steps=226 over ~5 eps | info={'early_stop_iter': 2, 'pi_loss': 0.0008200146839953959, 'kl': 0.01901872456073761, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 45.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 143 | ep_cost_mean=41.00 | avg_ep_len=819.20| ep_reward_mean=21.10 | unsafe_steps=205 over ~5 eps | info={'early_stop_iter': 17, 'pi_loss': -0.017768587917089462, 'kl': 0.01529095508158207, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 41.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 144 | ep_cost_mean=40.80 | avg_ep_len=819.20| ep_reward_mean=20.56 | unsafe_steps=204 over ~5 eps | info={'early_stop_iter': 75, 'pi_loss': -0.03212227299809456, 'kl': 0.015245734713971615, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 40.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 145 | ep_cost_mean=60.80 | avg_ep_len=819.20| ep_reward_mean=19.87 | unsafe_steps=304 over ~5 eps | info={'early_stop_iter': 50, 'pi_loss': -0.022445235401391983, 'kl': 0.015480047091841698, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 60.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 146 | ep_cost_mean=47.00 | avg_ep_len=819.20| ep_reward_mean=21.84 | unsafe_steps=235 over ~5 eps | info={'early_stop_iter': 68, 'pi_loss': -0.023907139897346497, 'kl': 0.015631355345249176, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 47.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 147 | ep_cost_mean=41.20 | avg_ep_len=819.20| ep_reward_mean=21.27 | unsafe_steps=206 over ~5 eps | info={'early_stop_iter': 14, 'pi_loss': -0.013508599251508713, 'kl': 0.0166176650673151, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 41.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 148 | ep_cost_mean=30.40 | avg_ep_len=819.20| ep_reward_mean=20.57 | unsafe_steps=152 over ~5 eps | info={'early_stop_iter': 20, 'pi_loss': -0.014919042587280273, 'kl': 0.015579713508486748, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 30.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 149 | ep_cost_mean=50.40 | avg_ep_len=819.20| ep_reward_mean=20.95 | unsafe_steps=252 over ~5 eps | info={'early_stop_iter': 28, 'pi_loss': -0.016932612285017967, 'kl': 0.015899211168289185, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 50.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 150 | ep_cost_mean=59.80 | avg_ep_len=819.20| ep_reward_mean=20.24 | unsafe_steps=299 over ~5 eps | info={'early_stop_iter': 57, 'pi_loss': -0.025947727262973785, 'kl': 0.015280256047844887, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 59.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 151 | ep_cost_mean=43.80 | avg_ep_len=819.20| ep_reward_mean=19.17 | unsafe_steps=219 over ~5 eps | info={'early_stop_iter': 46, 'pi_loss': -0.022862426936626434, 'kl': 0.015128969214856625, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 43.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 152 | ep_cost_mean=54.80 | avg_ep_len=819.20| ep_reward_mean=20.85 | unsafe_steps=274 over ~5 eps | info={'early_stop_iter': 45, 'pi_loss': -0.02542468160390854, 'kl': 0.01516978070139885, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 54.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 153 | ep_cost_mean=68.80 | avg_ep_len=819.20| ep_reward_mean=19.47 | unsafe_steps=344 over ~5 eps | info={'early_stop_iter': 58, 'pi_loss': -0.025891421362757683, 'kl': 0.01533093024045229, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 68.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 154 | ep_cost_mean=24.20 | avg_ep_len=819.20| ep_reward_mean=20.87 | unsafe_steps=121 over ~5 eps | info={'early_stop_iter': 55, 'pi_loss': -0.02437453716993332, 'kl': 0.01618497259914875, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 24.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 155 | ep_cost_mean=82.00 | avg_ep_len=819.20| ep_reward_mean=20.33 | unsafe_steps=410 over ~5 eps | info={'early_stop_iter': 31, 'pi_loss': -0.022511089220643044, 'kl': 0.015824688598513603, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 82.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 156 | ep_cost_mean=56.20 | avg_ep_len=819.20| ep_reward_mean=21.01 | unsafe_steps=281 over ~5 eps | info={'early_stop_iter': 7, 'pi_loss': -0.009001165628433228, 'kl': 0.015613819472491741, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 56.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 157 | ep_cost_mean=36.00 | avg_ep_len=819.20| ep_reward_mean=20.68 | unsafe_steps=180 over ~5 eps | info={'early_stop_iter': 56, 'pi_loss': -0.02474183775484562, 'kl': 0.015081202611327171, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 36.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 158 | ep_cost_mean=45.20 | avg_ep_len=819.20| ep_reward_mean=21.01 | unsafe_steps=226 over ~5 eps | info={'early_stop_iter': 7, 'pi_loss': -0.006621976848691702, 'kl': 0.016322240233421326, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 45.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 159 | ep_cost_mean=68.60 | avg_ep_len=819.20| ep_reward_mean=21.32 | unsafe_steps=343 over ~5 eps | info={'early_stop_iter': 14, 'pi_loss': -0.01332051306962967, 'kl': 0.016430439427495003, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 68.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 160 | ep_cost_mean=51.20 | avg_ep_len=819.20| ep_reward_mean=20.28 | unsafe_steps=256 over ~5 eps | info={'pi_loss': -0.029632238671183586, 'kl': 0.013493211008608341, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 51.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 161 | ep_cost_mean=48.80 | avg_ep_len=819.20| ep_reward_mean=19.69 | unsafe_steps=244 over ~5 eps | info={'early_stop_iter': 55, 'pi_loss': -0.027889179065823555, 'kl': 0.015037322416901588, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 48.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 162 | ep_cost_mean=28.60 | avg_ep_len=819.20| ep_reward_mean=20.54 | unsafe_steps=143 over ~5 eps | info={'early_stop_iter': 14, 'pi_loss': -0.012445374391973019, 'kl': 0.015400303527712822, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 28.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 163 | ep_cost_mean=21.60 | avg_ep_len=819.20| ep_reward_mean=19.44 | unsafe_steps=108 over ~5 eps | info={'pi_loss': -0.028326183557510376, 'kl': 0.012032648548483849, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 21.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 164 | ep_cost_mean=37.80 | avg_ep_len=819.20| ep_reward_mean=20.02 | unsafe_steps=189 over ~5 eps | info={'pi_loss': -0.028273915871977806, 'kl': 0.013790307566523552, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 37.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 165 | ep_cost_mean=61.00 | avg_ep_len=819.20| ep_reward_mean=18.49 | unsafe_steps=305 over ~5 eps | info={'early_stop_iter': 57, 'pi_loss': -0.025478852912783623, 'kl': 0.016726206988096237, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 61.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 166 | ep_cost_mean=33.00 | avg_ep_len=819.20| ep_reward_mean=20.98 | unsafe_steps=165 over ~5 eps | info={'early_stop_iter': 29, 'pi_loss': -0.019958866760134697, 'kl': 0.015145383775234222, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 33.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 167 | ep_cost_mean=44.40 | avg_ep_len=819.20| ep_reward_mean=21.02 | unsafe_steps=222 over ~5 eps | info={'early_stop_iter': 17, 'pi_loss': -0.015024356544017792, 'kl': 0.015146730467677116, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 44.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 168 | ep_cost_mean=61.40 | avg_ep_len=819.20| ep_reward_mean=20.64 | unsafe_steps=307 over ~5 eps | info={'early_stop_iter': 6, 'pi_loss': -0.007441623602062464, 'kl': 0.01714004948735237, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 61.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 169 | ep_cost_mean=43.20 | avg_ep_len=819.20| ep_reward_mean=21.21 | unsafe_steps=216 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': 0.00010579248191788793, 'kl': 0.017366865649819374, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 43.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 170 | ep_cost_mean=50.20 | avg_ep_len=819.20| ep_reward_mean=21.18 | unsafe_steps=251 over ~5 eps | info={'early_stop_iter': 15, 'pi_loss': -0.012643364258110523, 'kl': 0.015240952372550964, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 50.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 171 | ep_cost_mean=49.00 | avg_ep_len=819.20| ep_reward_mean=20.52 | unsafe_steps=245 over ~5 eps | info={'early_stop_iter': 58, 'pi_loss': -0.023490838706493378, 'kl': 0.015794003382325172, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 49.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 172 | ep_cost_mean=38.60 | avg_ep_len=819.20| ep_reward_mean=21.35 | unsafe_steps=193 over ~5 eps | info={'early_stop_iter': 17, 'pi_loss': -0.014013918116688728, 'kl': 0.01510109007358551, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 38.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 173 | ep_cost_mean=38.40 | avg_ep_len=819.20| ep_reward_mean=21.74 | unsafe_steps=192 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': -0.001901370706036687, 'kl': 0.015201868489384651, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 38.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 174 | ep_cost_mean=50.40 | avg_ep_len=819.20| ep_reward_mean=21.25 | unsafe_steps=252 over ~5 eps | info={'early_stop_iter': 33, 'pi_loss': -0.022155456244945526, 'kl': 0.015406118705868721, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 50.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 175 | ep_cost_mean=57.20 | avg_ep_len=819.20| ep_reward_mean=21.20 | unsafe_steps=286 over ~5 eps | info={'early_stop_iter': 20, 'pi_loss': -0.019065389409661293, 'kl': 0.015849564224481583, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 57.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 176 | ep_cost_mean=43.60 | avg_ep_len=819.20| ep_reward_mean=21.46 | unsafe_steps=218 over ~5 eps | info={'early_stop_iter': 10, 'pi_loss': -0.011241579428315163, 'kl': 0.015774153172969818, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 43.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 177 | ep_cost_mean=53.40 | avg_ep_len=819.20| ep_reward_mean=21.09 | unsafe_steps=267 over ~5 eps | info={'early_stop_iter': 9, 'pi_loss': -0.00899096205830574, 'kl': 0.01590386964380741, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 53.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 178 | ep_cost_mean=52.00 | avg_ep_len=819.20| ep_reward_mean=20.34 | unsafe_steps=260 over ~5 eps | info={'early_stop_iter': 12, 'pi_loss': -0.01143697090446949, 'kl': 0.015899622812867165, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 52.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 179 | ep_cost_mean=46.40 | avg_ep_len=819.20| ep_reward_mean=19.10 | unsafe_steps=232 over ~5 eps | info={'early_stop_iter': 9, 'pi_loss': -0.007619895972311497, 'kl': 0.015449315309524536, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 46.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 180 | ep_cost_mean=72.40 | avg_ep_len=819.20| ep_reward_mean=20.79 | unsafe_steps=362 over ~5 eps | info={'early_stop_iter': 20, 'pi_loss': -0.01853572204709053, 'kl': 0.015617437660694122, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 72.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 181 | ep_cost_mean=43.20 | avg_ep_len=819.20| ep_reward_mean=20.75 | unsafe_steps=216 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': 0.0027798484079539776, 'kl': 0.018874945119023323, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 43.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 182 | ep_cost_mean=38.00 | avg_ep_len=819.20| ep_reward_mean=20.10 | unsafe_steps=190 over ~5 eps | info={'early_stop_iter': 53, 'pi_loss': -0.026578566059470177, 'kl': 0.016627352684736252, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 38.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 183 | ep_cost_mean=15.00 | avg_ep_len=819.20| ep_reward_mean=19.64 | unsafe_steps=75 over ~5 eps | info={'early_stop_iter': 30, 'pi_loss': -0.02031548134982586, 'kl': 0.01545602735131979, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 15.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 184 | ep_cost_mean=40.00 | avg_ep_len=819.20| ep_reward_mean=20.48 | unsafe_steps=200 over ~5 eps | info={'early_stop_iter': 11, 'pi_loss': -0.008747403509914875, 'kl': 0.015507455915212631, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 40.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 185 | ep_cost_mean=47.80 | avg_ep_len=819.20| ep_reward_mean=20.70 | unsafe_steps=239 over ~5 eps | info={'early_stop_iter': 7, 'pi_loss': -0.005166494287550449, 'kl': 0.020192448049783707, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 47.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 186 | ep_cost_mean=49.80 | avg_ep_len=819.20| ep_reward_mean=20.96 | unsafe_steps=249 over ~5 eps | info={'early_stop_iter': 29, 'pi_loss': -0.020395351573824883, 'kl': 0.015074668452143669, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 49.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 187 | ep_cost_mean=70.00 | avg_ep_len=819.20| ep_reward_mean=18.27 | unsafe_steps=350 over ~5 eps | info={'early_stop_iter': 6, 'pi_loss': -0.008718677796423435, 'kl': 0.015636438503861427, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 70.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 188 | ep_cost_mean=63.00 | avg_ep_len=819.20| ep_reward_mean=20.72 | unsafe_steps=315 over ~5 eps | info={'early_stop_iter': 16, 'pi_loss': -0.016151027753949165, 'kl': 0.01778547279536724, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 63.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 189 | ep_cost_mean=43.40 | avg_ep_len=819.20| ep_reward_mean=19.98 | unsafe_steps=217 over ~5 eps | info={'pi_loss': -0.028416138142347336, 'kl': 0.01497889868915081, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 43.4, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 190 | ep_cost_mean=44.20 | avg_ep_len=819.20| ep_reward_mean=20.91 | unsafe_steps=221 over ~5 eps | info={'early_stop_iter': 7, 'pi_loss': -0.008088385686278343, 'kl': 0.015026877634227276, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 44.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 191 | ep_cost_mean=39.60 | avg_ep_len=819.20| ep_reward_mean=20.45 | unsafe_steps=198 over ~5 eps | info={'early_stop_iter': 34, 'pi_loss': -0.02161847986280918, 'kl': 0.01558748073875904, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 39.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 192 | ep_cost_mean=38.20 | avg_ep_len=819.20| ep_reward_mean=20.70 | unsafe_steps=191 over ~5 eps | info={'early_stop_iter': 33, 'pi_loss': -0.02399457059800625, 'kl': 0.015364987775683403, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 38.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 193 | ep_cost_mean=33.00 | avg_ep_len=819.20| ep_reward_mean=20.47 | unsafe_steps=165 over ~5 eps | info={'early_stop_iter': 8, 'pi_loss': -0.011437945067882538, 'kl': 0.016667205840349197, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 33.0, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 194 | ep_cost_mean=48.80 | avg_ep_len=819.20| ep_reward_mean=19.81 | unsafe_steps=244 over ~5 eps | info={'early_stop_iter': 3, 'pi_loss': 0.0010966593399643898, 'kl': 0.019160572439432144, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 48.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 195 | ep_cost_mean=69.20 | avg_ep_len=819.20| ep_reward_mean=20.53 | unsafe_steps=346 over ~5 eps | info={'early_stop_iter': 15, 'pi_loss': -0.01263080257922411, 'kl': 0.016832949593663216, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 69.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 196 | ep_cost_mean=41.20 | avg_ep_len=819.20| ep_reward_mean=21.09 | unsafe_steps=206 over ~5 eps | info={'early_stop_iter': 20, 'pi_loss': -0.01555018499493599, 'kl': 0.01662876456975937, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 41.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 197 | ep_cost_mean=19.60 | avg_ep_len=819.20| ep_reward_mean=21.07 | unsafe_steps=98 over ~5 eps | info={'early_stop_iter': 7, 'pi_loss': -0.006685570813715458, 'kl': 0.017123086377978325, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 19.6, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 198 | ep_cost_mean=62.80 | avg_ep_len=819.20| ep_reward_mean=19.72 | unsafe_steps=314 over ~5 eps | info={'early_stop_iter': 21, 'pi_loss': -0.014171536080539227, 'kl': 0.015134483575820923, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 62.8, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 199 | ep_cost_mean=61.20 | avg_ep_len=819.20| ep_reward_mean=20.53 | unsafe_steps=306 over ~5 eps | info={'early_stop_iter': 17, 'pi_loss': -0.017788341268897057, 'kl': 0.016235418617725372, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 61.2, 'avg_ep_len': 819.2} | KL=None\n",
      "[actsafe] Epoch 200 | ep_cost_mean=46.60 | avg_ep_len=819.20| ep_reward_mean=20.07 | unsafe_steps=233 over ~5 eps | info={'early_stop_iter': 79, 'pi_loss': -0.027544187381863594, 'kl': 0.016165193170309067, 'shield_last_projected': False, 'shield_last_method': 'n/a', 'ep_cost_mean': 46.6, 'avg_ep_len': 819.2} | KL=None\n"
     ]
    }
   ],
   "source": [
    "act = argparse.ArgumentParser()\n",
    "act.add_argument(\"--algo\", type=str, default=\"actsafe\")\n",
    "act.add_argument(\"--env-id\", type=str, default=\"SafetyPointGoal1-v0\")\n",
    "act.add_argument(\"--steps-per-epoch\", type=int, default=4096)\n",
    "act.add_argument(\"--epochs\", type=int, default=200)\n",
    "act.add_argument(\"--device\", type=str, default=device)\n",
    "act.add_argument(\"--seed\", type=int, default=0)\n",
    "act.add_argument(\"--cost-limit\", type=float, default=0.02)\n",
    "\n",
    "# ← this line is the key:\n",
    "args_act, _ = act.parse_known_args()\n",
    "act_cost_curve, act_rew_curve=train(\n",
    "    algo=args_act.algo,\n",
    "    env_id=args_act.env_id,\n",
    "    steps_per_epoch=args_act.steps_per_epoch,\n",
    "    epochs=args_act.epochs,\n",
    "    device=args_act.device,\n",
    "    seed=args_act.seed,\n",
    "    cost_limit=args_act.cost_limit,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e1787ff3",
   "metadata": {},
   "outputs": [],
   "source": [
    "# bundle = {\"CPO_cost_curve\":cost_curve,\n",
    "# \"CPO_rew_curve\":rew_curve,\n",
    "# \"ActSafe_cost_curve\":act_cost_curve,\n",
    "# \"ActSafe_rew_curve\":act_rew_curve}\n",
    "\n",
    "\n",
    "# with open(\"bundle.json\", \"w\") as f:\n",
    "#     json.dump(bundle, f)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9344bcb0",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "# with open(\"bundle.json\", \"r\") as f:\n",
    "#     loaded = json.load(f)\n",
    "    \n",
    "# cost_curve=loaded[\"CPO_cost_curve\"]\n",
    "# rew_curve=loaded[\"CPO_rew_curve\"]\n",
    "# act_cost_curve=loaded[\"ActSafe_cost_curve\"]\n",
    "# act_rew_curve=loaded[\"ActSafe_rew_curve\"]\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "id": "fc9330ff",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Training safe_fqi on SafetyPointGoal1-v0 for 200 epochs...\n",
      "[safe_fqi] Epoch 001 | ep_cost_mean=22.25 | avg_ep_len=1024.00| ep_reward_mean=-0.59 | unsafe_steps=89 over ~4 eps | info={'q1_loss': 0.0019393533002585173, 'q2_loss': 0.011589813977479935, 'cost_loss': 0.02931806817650795, 'penalty': 1.0102675043114369} | KL=None\n",
      "| penalty=1.0102675043114369 \n",
      "| global_step=4096.0 \n",
      "[safe_fqi] Epoch 002 | ep_cost_mean=40.25 | avg_ep_len=1024.00| ep_reward_mean=-0.98 | unsafe_steps=167 over ~4 eps | info={'q1_loss': 0.009870998561382294, 'q2_loss': 0.013211851939558983, 'cost_loss': 0.03344899229705334, 'penalty': 1.0666537151011979} | KL=None\n",
      "| penalty=1.0666537151011979 \n",
      "| global_step=8192.0 \n",
      "[safe_fqi] Epoch 003 | ep_cost_mean=63.75 | avg_ep_len=1024.00| ep_reward_mean=-1.22 | unsafe_steps=255 over ~4 eps | info={'q1_loss': 0.04166841134428978, 'q2_loss': 0.04909440502524376, 'cost_loss': 0.026694248616695403, 'penalty': 1.1758702801913998} | KL=None\n",
      "| penalty=1.1758702801913998 \n",
      "| global_step=12288.0 \n",
      "[safe_fqi] Epoch 004 | ep_cost_mean=173.25 | avg_ep_len=1024.00| ep_reward_mean=-0.33 | unsafe_steps=693 over ~4 eps | info={'q1_loss': 0.1995978057384491, 'q2_loss': 0.21877995133399963, 'cost_loss': 0.0455594502389431, 'penalty': 1.478425202913867} | KL=None\n",
      "| penalty=1.478425202913867 \n",
      "| global_step=16384.0 \n",
      "[safe_fqi] Epoch 005 | ep_cost_mean=27.75 | avg_ep_len=1024.00| ep_reward_mean=-1.58 | unsafe_steps=111 over ~4 eps | info={'q1_loss': 0.7964272499084473, 'q2_loss': 0.8686040639877319, 'cost_loss': 0.03786942064762115, 'penalty': 1.6384311430863585} | KL=None\n",
      "| penalty=1.6384311430863585 \n",
      "| global_step=20480.0 \n",
      "[safe_fqi] Epoch 006 | ep_cost_mean=45.25 | avg_ep_len=1024.00| ep_reward_mean=-5.25 | unsafe_steps=181 over ~4 eps | info={'q1_loss': 1.522009253501892, 'q2_loss': 1.6469637155532837, 'cost_loss': 0.026156193763017654, 'penalty': 1.7179409836201416} | KL=None\n",
      "| penalty=1.7179409836201416 \n",
      "| global_step=24576.0 \n",
      "[safe_fqi] Epoch 007 | ep_cost_mean=27.25 | avg_ep_len=1024.00| ep_reward_mean=-0.40 | unsafe_steps=109 over ~4 eps | info={'q1_loss': 1.6424318552017212, 'q2_loss': 1.736829161643982, 'cost_loss': 0.03874246031045914, 'penalty': 1.774424717859341} | KL=None\n",
      "| penalty=1.774424717859341 \n",
      "| global_step=28672.0 \n",
      "[safe_fqi] Epoch 008 | ep_cost_mean=41.25 | avg_ep_len=1024.00| ep_reward_mean=-1.16 | unsafe_steps=165 over ~4 eps | info={'q1_loss': 2.0593135356903076, 'q2_loss': 2.0989644527435303, 'cost_loss': 0.030280455574393274, 'penalty': 1.8392945713563524} | KL=None\n",
      "| penalty=1.8392945713563524 \n",
      "| global_step=32768.0 \n",
      "[safe_fqi] Epoch 009 | ep_cost_mean=21.00 | avg_ep_len=1024.00| ep_reward_mean=-0.03 | unsafe_steps=84 over ~4 eps | info={'q1_loss': 2.5377113819122314, 'q2_loss': 2.5622754096984863, 'cost_loss': 0.025040341727435588, 'penalty': 1.8820712460886602} | KL=None\n",
      "| penalty=1.8820712460886602 \n",
      "| global_step=36864.0 \n",
      "[safe_fqi] Epoch 010 | ep_cost_mean=25.75 | avg_ep_len=1024.00| ep_reward_mean=0.24 | unsafe_steps=103 over ~4 eps | info={'q1_loss': 3.429176092147827, 'q2_loss': 3.461637496948242, 'cost_loss': 0.028992505744099617, 'penalty': 1.9171399368601476} | KL=None\n",
      "| penalty=1.9171399368601476 \n",
      "| global_step=40960.0 \n",
      "[safe_fqi] Epoch 011 | ep_cost_mean=129.75 | avg_ep_len=1024.00| ep_reward_mean=1.54 | unsafe_steps=519 over ~4 eps | info={'q1_loss': 3.781773090362549, 'q2_loss': 3.775789260864258, 'cost_loss': 0.03190207369625568, 'penalty': 2.1196367555266007} | KL=None\n",
      "| penalty=2.1196367555266007 \n",
      "| global_step=45056.0 \n",
      "[safe_fqi] Epoch 012 | ep_cost_mean=169.75 | avg_ep_len=1024.00| ep_reward_mean=0.98 | unsafe_steps=679 over ~4 eps | info={'q1_loss': 3.9319472312927246, 'q2_loss': 3.9737229347229004, 'cost_loss': 0.05095767080783844, 'penalty': 2.4679421593186497} | KL=None\n",
      "| penalty=2.4679421593186497 \n",
      "| global_step=49152.0 \n",
      "[safe_fqi] Epoch 013 | ep_cost_mean=128.00 | avg_ep_len=1024.00| ep_reward_mean=-0.18 | unsafe_steps=512 over ~4 eps | info={'q1_loss': 7.2405171394348145, 'q2_loss': 7.2863688468933105, 'cost_loss': 0.042196416109800336, 'penalty': 2.788030534808928} | KL=None\n",
      "| penalty=2.788030534808928 \n",
      "| global_step=53248.0 \n",
      "[safe_fqi] Epoch 014 | ep_cost_mean=42.25 | avg_ep_len=1024.00| ep_reward_mean=0.72 | unsafe_steps=169 over ~4 eps | info={'q1_loss': 3.516160011291504, 'q2_loss': 3.610886335372925, 'cost_loss': 0.04994371831417084, 'penalty': 2.9421194625236167} | KL=None\n",
      "| penalty=2.9421194625236167 \n",
      "| global_step=57344.0 \n",
      "[safe_fqi] Epoch 015 | ep_cost_mean=15.50 | avg_ep_len=1024.00| ep_reward_mean=-8.65 | unsafe_steps=62 over ~4 eps | info={'q1_loss': 4.283995151519775, 'q2_loss': 4.34134578704834, 'cost_loss': 0.040415351092815396, 'penalty': 2.9837117825942086} | KL=None\n",
      "| penalty=2.9837117825942086 \n",
      "| global_step=61440.0 \n",
      "[safe_fqi] Epoch 016 | ep_cost_mean=87.25 | avg_ep_len=1024.00| ep_reward_mean=-0.91 | unsafe_steps=349 over ~4 eps | info={'q1_loss': 4.185956954956055, 'q2_loss': 4.280730247497559, 'cost_loss': 0.03024454601109028, 'penalty': 3.112493582567738} | KL=None\n",
      "| penalty=3.112493582567738 \n",
      "| global_step=65536.0 \n",
      "[safe_fqi] Epoch 017 | ep_cost_mean=27.25 | avg_ep_len=1024.00| ep_reward_mean=-0.44 | unsafe_steps=109 over ~4 eps | info={'q1_loss': 3.9767487049102783, 'q2_loss': 4.1026411056518555, 'cost_loss': 0.03871361799538135, 'penalty': 3.2008453756898967} | KL=None\n",
      "| penalty=3.2008453756898967 \n",
      "| global_step=69632.0 \n",
      "[safe_fqi] Epoch 018 | ep_cost_mean=18.75 | avg_ep_len=1024.00| ep_reward_mean=-1.60 | unsafe_steps=75 over ~4 eps | info={'q1_loss': 4.298773288726807, 'q2_loss': 4.416734218597412, 'cost_loss': 0.031220510229468347, 'penalty': 3.2325035477849506} | KL=None\n",
      "| penalty=3.2325035477849506 \n",
      "| global_step=73728.0 \n",
      "[safe_fqi] Epoch 019 | ep_cost_mean=97.00 | avg_ep_len=1024.00| ep_reward_mean=-0.42 | unsafe_steps=388 over ~4 eps | info={'q1_loss': 4.223576545715332, 'q2_loss': 4.313423156738281, 'cost_loss': 0.03322011046111584, 'penalty': 3.3781478764121378} | KL=None\n",
      "| penalty=3.3781478764121378 \n",
      "| global_step=77824.0 \n",
      "[safe_fqi] Epoch 020 | ep_cost_mean=16.50 | avg_ep_len=1024.00| ep_reward_mean=-1.33 | unsafe_steps=66 over ~4 eps | info={'q1_loss': 4.2939910888671875, 'q2_loss': 4.41304874420166, 'cost_loss': 0.029665203019976615, 'penalty': 3.4572756357148493} | KL=None\n",
      "| penalty=3.4572756357148493 \n",
      "| global_step=81920.0 \n",
      "[safe_fqi] Epoch 021 | ep_cost_mean=72.50 | avg_ep_len=1024.00| ep_reward_mean=-0.69 | unsafe_steps=290 over ~4 eps | info={'q1_loss': 4.14593505859375, 'q2_loss': 4.29832124710083, 'cost_loss': 0.03043060563504696, 'penalty': 3.56623451355517} | KL=None\n",
      "| penalty=3.56623451355517 \n",
      "| global_step=86016.0 \n",
      "[safe_fqi] Epoch 022 | ep_cost_mean=43.00 | avg_ep_len=1024.00| ep_reward_mean=-1.06 | unsafe_steps=172 over ~4 eps | info={'q1_loss': 4.1715803146362305, 'q2_loss': 4.326228141784668, 'cost_loss': 0.039407404512166976, 'penalty': 3.6681653552969} | KL=None\n",
      "| penalty=3.6681653552969 \n",
      "| global_step=90112.0 \n",
      "[safe_fqi] Epoch 023 | ep_cost_mean=27.25 | avg_ep_len=1024.00| ep_reward_mean=-0.80 | unsafe_steps=109 over ~4 eps | info={'q1_loss': 4.661041736602783, 'q2_loss': 4.8417277336120605, 'cost_loss': 0.03237260691821575, 'penalty': 3.7248701570706895} | KL=None\n",
      "| penalty=3.7248701570706895 \n",
      "| global_step=94208.0 \n",
      "[safe_fqi] Epoch 024 | ep_cost_mean=51.50 | avg_ep_len=1024.00| ep_reward_mean=-1.09 | unsafe_steps=206 over ~4 eps | info={'q1_loss': 7.670723915100098, 'q2_loss': 7.781984806060791, 'cost_loss': 0.035293974727392194, 'penalty': 3.806003848432547} | KL=None\n",
      "| penalty=3.806003848432547 \n",
      "| global_step=98304.0 \n",
      "[safe_fqi] Epoch 025 | ep_cost_mean=129.50 | avg_ep_len=1024.00| ep_reward_mean=-0.15 | unsafe_steps=523 over ~4 eps | info={'q1_loss': 3.883901834487915, 'q2_loss': 4.086843013763428, 'cost_loss': 0.027610548213124274, 'penalty': 4.028862643609483} | KL=None\n",
      "| penalty=4.028862643609483 \n",
      "| global_step=102400.0 \n",
      "[safe_fqi] Epoch 026 | ep_cost_mean=19.75 | avg_ep_len=1024.00| ep_reward_mean=-0.11 | unsafe_steps=79 over ~4 eps | info={'q1_loss': 4.64254093170166, 'q2_loss': 4.919101238250732, 'cost_loss': 0.02941091135144234, 'penalty': 4.140809219165332} | KL=None\n",
      "| penalty=4.140809219165332 \n",
      "| global_step=106496.0 \n",
      "[safe_fqi] Epoch 027 | ep_cost_mean=0.00 | avg_ep_len=1024.00| ep_reward_mean=0.51 | unsafe_steps=26 over ~4 eps | info={'q1_loss': 4.301607131958008, 'q2_loss': 4.569650173187256, 'cost_loss': 0.030796969681978224, 'penalty': 4.139549364710593} | KL=None\n",
      "| penalty=4.139549364710593 \n",
      "| global_step=110592.0 \n",
      "[safe_fqi] Epoch 028 | ep_cost_mean=61.50 | avg_ep_len=1024.00| ep_reward_mean=-0.67 | unsafe_steps=246 over ~4 eps | info={'q1_loss': 4.569667816162109, 'q2_loss': 4.755352020263672, 'cost_loss': 0.023046791180968286, 'penalty': 4.2138570165958225} | KL=None\n",
      "| penalty=4.2138570165958225 \n",
      "| global_step=114688.0 \n",
      "[safe_fqi] Epoch 029 | ep_cost_mean=10.25 | avg_ep_len=1024.00| ep_reward_mean=0.75 | unsafe_steps=41 over ~4 eps | info={'q1_loss': 4.438371181488037, 'q2_loss': 4.6105122566223145, 'cost_loss': 0.039086722582578656, 'penalty': 4.253857569117482} | KL=None\n",
      "| penalty=4.253857569117482 \n",
      "| global_step=118784.0 \n",
      "[safe_fqi] Epoch 030 | ep_cost_mean=48.25 | avg_ep_len=1024.00| ep_reward_mean=1.16 | unsafe_steps=193 over ~4 eps | info={'q1_loss': 3.9593677520751953, 'q2_loss': 4.138827800750732, 'cost_loss': 0.036824310570955275, 'penalty': 4.317190088360196} | KL=None\n",
      "| penalty=4.317190088360196 \n",
      "| global_step=122880.0 \n",
      "[safe_fqi] Epoch 031 | ep_cost_mean=46.50 | avg_ep_len=1024.00| ep_reward_mean=0.55 | unsafe_steps=186 over ~4 eps | info={'q1_loss': 4.230099201202393, 'q2_loss': 4.453276634216309, 'cost_loss': 0.02910524494946003, 'penalty': 4.404946882002117} | KL=None\n",
      "| penalty=4.404946882002117 \n",
      "| global_step=126976.0 \n",
      "[safe_fqi] Epoch 032 | ep_cost_mean=5.25 | avg_ep_len=1024.00| ep_reward_mean=-0.50 | unsafe_steps=50 over ~4 eps | info={'q1_loss': 4.37723970413208, 'q2_loss': 4.63803768157959, 'cost_loss': 0.022850032523274423, 'penalty': 4.428029557542415} | KL=None\n",
      "| penalty=4.428029557542415 \n",
      "| global_step=131072.0 \n",
      "[safe_fqi] Epoch 033 | ep_cost_mean=12.75 | avg_ep_len=1024.00| ep_reward_mean=2.65 | unsafe_steps=51 over ~4 eps | info={'q1_loss': 4.623215198516846, 'q2_loss': 4.8963518142700195, 'cost_loss': 0.026985342055559157, 'penalty': 4.430448350233587} | KL=None\n",
      "| penalty=4.430448350233587 \n",
      "| global_step=135168.0 \n",
      "[safe_fqi] Epoch 034 | ep_cost_mean=8.50 | avg_ep_len=1024.00| ep_reward_mean=-0.25 | unsafe_steps=34 over ~4 eps | info={'q1_loss': 4.69192361831665, 'q2_loss': 4.945899963378906, 'cost_loss': 0.035435570776462554, 'penalty': 4.42955439087903} | KL=None\n",
      "| penalty=4.42955439087903 \n",
      "| global_step=139264.0 \n",
      "[safe_fqi] Epoch 035 | ep_cost_mean=40.75 | avg_ep_len=1024.00| ep_reward_mean=0.62 | unsafe_steps=163 over ~4 eps | info={'q1_loss': 4.217270851135254, 'q2_loss': 4.410697937011719, 'cost_loss': 0.030134906992316246, 'penalty': 4.476682492232281} | KL=None\n",
      "| penalty=4.476682492232281 \n",
      "| global_step=143360.0 \n",
      "[safe_fqi] Epoch 036 | ep_cost_mean=20.75 | avg_ep_len=1024.00| ep_reward_mean=0.88 | unsafe_steps=83 over ~4 eps | info={'q1_loss': 3.5422816276550293, 'q2_loss': 3.767289876937866, 'cost_loss': 0.033033328503370284, 'penalty': 4.517363516224682} | KL=None\n",
      "| penalty=4.517363516224682 \n",
      "| global_step=147456.0 \n",
      "[safe_fqi] Epoch 037 | ep_cost_mean=15.25 | avg_ep_len=1024.00| ep_reward_mean=0.11 | unsafe_steps=61 over ~4 eps | info={'q1_loss': 3.291651487350464, 'q2_loss': 3.5000336170196533, 'cost_loss': 0.036998210847377776, 'penalty': 4.535460741296324} | KL=None\n",
      "| penalty=4.535460741296324 \n",
      "| global_step=151552.0 \n",
      "[safe_fqi] Epoch 038 | ep_cost_mean=27.50 | avg_ep_len=1024.00| ep_reward_mean=0.34 | unsafe_steps=110 over ~4 eps | info={'q1_loss': 4.192119598388672, 'q2_loss': 4.388628959655762, 'cost_loss': 0.04512593820691109, 'penalty': 4.567560469463334} | KL=None\n",
      "| penalty=4.567560469463334 \n",
      "| global_step=155648.0 \n",
      "[safe_fqi] Epoch 039 | ep_cost_mean=24.00 | avg_ep_len=1024.00| ep_reward_mean=0.00 | unsafe_steps=96 over ~4 eps | info={'q1_loss': 4.10402774810791, 'q2_loss': 4.381265163421631, 'cost_loss': 0.02839716002345085, 'penalty': 4.6033789977555} | KL=None\n",
      "| penalty=4.6033789977555 \n",
      "| global_step=159744.0 \n",
      "[safe_fqi] Epoch 040 | ep_cost_mean=5.25 | avg_ep_len=1024.00| ep_reward_mean=-1.33 | unsafe_steps=21 over ~4 eps | info={'q1_loss': 3.664134979248047, 'q2_loss': 3.8634867668151855, 'cost_loss': 0.03985136151313782, 'penalty': 4.6074241262621705} | KL=None\n",
      "| penalty=4.6074241262621705 \n",
      "| global_step=163840.0 \n",
      "[safe_fqi] Epoch 041 | ep_cost_mean=117.75 | avg_ep_len=1024.00| ep_reward_mean=1.88 | unsafe_steps=471 over ~4 eps | info={'q1_loss': 5.402142524719238, 'q2_loss': 5.56816291809082, 'cost_loss': 0.032999437302351, 'penalty': 4.7748089945900265} | KL=None\n",
      "| penalty=4.7748089945900265 \n",
      "| global_step=167936.0 \n",
      "[safe_fqi] Epoch 042 | ep_cost_mean=62.50 | avg_ep_len=1024.00| ep_reward_mean=1.21 | unsafe_steps=266 over ~4 eps | info={'q1_loss': 2.87251353263855, 'q2_loss': 3.0333168506622314, 'cost_loss': 0.031746494397521016, 'penalty': 4.9423934629734925} | KL=None\n",
      "| penalty=4.9423934629734925 \n",
      "| global_step=172032.0 \n",
      "[safe_fqi] Epoch 043 | ep_cost_mean=17.00 | avg_ep_len=1024.00| ep_reward_mean=-1.43 | unsafe_steps=68 over ~4 eps | info={'q1_loss': 2.9278676509857178, 'q2_loss': 3.0648446083068848, 'cost_loss': 0.03639870099723339, 'penalty': 5.000938824288851} | KL=None\n",
      "| penalty=5.000938824288851 \n",
      "| global_step=176128.0 \n",
      "[safe_fqi] Epoch 044 | ep_cost_mean=5.50 | avg_ep_len=1024.00| ep_reward_mean=-1.08 | unsafe_steps=22 over ~4 eps | info={'q1_loss': 3.5106632709503174, 'q2_loss': 3.6472935676574707, 'cost_loss': 0.039377549290657045, 'penalty': 5.002449460963654} | KL=None\n",
      "| penalty=5.002449460963654 \n",
      "| global_step=180224.0 \n",
      "[safe_fqi] Epoch 045 | ep_cost_mean=4.00 | avg_ep_len=1024.00| ep_reward_mean=-1.49 | unsafe_steps=16 over ~4 eps | info={'q1_loss': 3.3395743370056152, 'q2_loss': 3.4989473819732666, 'cost_loss': 0.024787047877907753, 'penalty': 4.989506274372336} | KL=None\n",
      "| penalty=4.989506274372336 \n",
      "| global_step=184320.0 \n",
      "[safe_fqi] Epoch 046 | ep_cost_mean=7.75 | avg_ep_len=1024.00| ep_reward_mean=-1.50 | unsafe_steps=31 over ~4 eps | info={'q1_loss': 3.941507577896118, 'q2_loss': 4.080687999725342, 'cost_loss': 0.0380650095641613, 'penalty': 4.980392156208599} | KL=None\n",
      "| penalty=4.980392156208599 \n",
      "| global_step=188416.0 \n",
      "[safe_fqi] Epoch 047 | ep_cost_mean=91.00 | avg_ep_len=1024.00| ep_reward_mean=-0.50 | unsafe_steps=364 over ~4 eps | info={'q1_loss': 3.5264627933502197, 'q2_loss': 3.6414713859558105, 'cost_loss': 0.021764545887708663, 'penalty': 5.106035468466603} | KL=None\n",
      "| penalty=5.106035468466603 \n",
      "| global_step=192512.0 \n",
      "[safe_fqi] Epoch 048 | ep_cost_mean=0.00 | avg_ep_len=1024.00| ep_reward_mean=-1.44 | unsafe_steps=0 over ~4 eps | info={'q1_loss': 4.043833255767822, 'q2_loss': 4.223998546600342, 'cost_loss': 0.03712403252720833, 'penalty': 5.153459844298306} | KL=None\n",
      "| penalty=5.153459844298306 \n",
      "| global_step=196608.0 \n",
      "[safe_fqi] Epoch 049 | ep_cost_mean=10.00 | avg_ep_len=1024.00| ep_reward_mean=0.22 | unsafe_steps=40 over ~4 eps | info={'q1_loss': 4.140402793884277, 'q2_loss': 4.283152103424072, 'cost_loss': 0.03001680001616478, 'penalty': 5.14988309984158} | KL=None\n",
      "| penalty=5.14988309984158 \n",
      "| global_step=200704.0 \n",
      "[safe_fqi] Epoch 050 | ep_cost_mean=10.50 | avg_ep_len=1024.00| ep_reward_mean=-1.89 | unsafe_steps=42 over ~4 eps | info={'q1_loss': 4.357587814331055, 'q2_loss': 4.558239459991455, 'cost_loss': 0.023272209241986273, 'penalty': 5.149859562961015} | KL=None\n",
      "| penalty=5.149859562961015 \n",
      "| global_step=204800.0 \n",
      "[safe_fqi] Epoch 051 | ep_cost_mean=24.75 | avg_ep_len=1024.00| ep_reward_mean=-0.65 | unsafe_steps=116 over ~4 eps | info={'q1_loss': 4.288805961608887, 'q2_loss': 4.459815979003906, 'cost_loss': 0.026574117690324785, 'penalty': 5.173030728839055} | KL=None\n",
      "| penalty=5.173030728839055 \n",
      "| global_step=208896.0 \n",
      "[safe_fqi] Epoch 052 | ep_cost_mean=36.50 | avg_ep_len=1024.00| ep_reward_mean=-0.10 | unsafe_steps=146 over ~4 eps | info={'q1_loss': 3.8765311241149902, 'q2_loss': 4.024336338043213, 'cost_loss': 0.026347381994128227, 'penalty': 5.226137089980496} | KL=None\n",
      "| penalty=5.226137089980496 \n",
      "| global_step=212992.0 \n",
      "[safe_fqi] Epoch 053 | ep_cost_mean=64.00 | avg_ep_len=1024.00| ep_reward_mean=-0.64 | unsafe_steps=256 over ~4 eps | info={'q1_loss': 3.681580066680908, 'q2_loss': 3.8882901668548584, 'cost_loss': 0.019721225276589392, 'penalty': 5.332990691465591} | KL=None\n",
      "| penalty=5.332990691465591 \n",
      "| global_step=217088.0 \n",
      "[safe_fqi] Epoch 054 | ep_cost_mean=7.00 | avg_ep_len=1024.00| ep_reward_mean=-2.40 | unsafe_steps=28 over ~4 eps | info={'q1_loss': 4.28216028213501, 'q2_loss': 4.347803115844727, 'cost_loss': 0.037386801466345786, 'penalty': 5.3720152978927995} | KL=None\n",
      "| penalty=5.3720152978927995 \n",
      "| global_step=221184.0 \n",
      "[safe_fqi] Epoch 055 | ep_cost_mean=11.25 | avg_ep_len=1024.00| ep_reward_mean=-2.11 | unsafe_steps=45 over ~4 eps | info={'q1_loss': 3.312230348587036, 'q2_loss': 3.478768825531006, 'cost_loss': 0.03240032345056534, 'penalty': 5.374453025384194} | KL=None\n",
      "| penalty=5.374453025384194 \n",
      "| global_step=225280.0 \n",
      "[safe_fqi] Epoch 056 | ep_cost_mean=9.00 | avg_ep_len=1024.00| ep_reward_mean=-1.28 | unsafe_steps=36 over ~4 eps | info={'q1_loss': 3.3938333988189697, 'q2_loss': 3.549699544906616, 'cost_loss': 0.013303673267364502, 'penalty': 5.373350307254786} | KL=None\n",
      "| penalty=5.373350307254786 \n",
      "| global_step=229376.0 \n",
      "[safe_fqi] Epoch 057 | ep_cost_mean=36.25 | avg_ep_len=1024.00| ep_reward_mean=-0.35 | unsafe_steps=145 over ~4 eps | info={'q1_loss': 3.6790835857391357, 'q2_loss': 3.799732208251953, 'cost_loss': 0.02729307599365711, 'penalty': 5.413663839954755} | KL=None\n",
      "| penalty=5.413663839954755 \n",
      "| global_step=233472.0 \n",
      "[safe_fqi] Epoch 058 | ep_cost_mean=24.25 | avg_ep_len=1024.00| ep_reward_mean=-1.59 | unsafe_steps=97 over ~4 eps | info={'q1_loss': 3.1543519496917725, 'q2_loss': 3.299203872680664, 'cost_loss': 0.027335334569215775, 'penalty': 5.456359982739948} | KL=None\n",
      "| penalty=5.456359982739948 \n",
      "| global_step=237568.0 \n",
      "[safe_fqi] Epoch 059 | ep_cost_mean=10.25 | avg_ep_len=1024.00| ep_reward_mean=-2.66 | unsafe_steps=41 over ~4 eps | info={'q1_loss': 3.369880437850952, 'q2_loss': 3.464715003967285, 'cost_loss': 0.023561898432672024, 'penalty': 5.469026714974713} | KL=None\n",
      "| penalty=5.469026714974713 \n",
      "| global_step=241664.0 \n",
      "[safe_fqi] Epoch 060 | ep_cost_mean=19.50 | avg_ep_len=1024.00| ep_reward_mean=-1.95 | unsafe_steps=78 over ~4 eps | info={'q1_loss': 3.763624906539917, 'q2_loss': 3.8979573249816895, 'cost_loss': 0.028915493190288542, 'penalty': 5.484685663351732} | KL=None\n",
      "| penalty=5.484685663351732 \n",
      "| global_step=245760.0 \n",
      "[safe_fqi] Epoch 061 | ep_cost_mean=0.00 | avg_ep_len=1024.00| ep_reward_mean=-0.73 | unsafe_steps=0 over ~4 eps | info={'q1_loss': 3.1490535736083984, 'q2_loss': 3.341383457183838, 'cost_loss': 0.01685298178344965, 'penalty': 5.475849835821038} | KL=None\n",
      "| penalty=5.475849835821038 \n",
      "| global_step=249856.0 \n",
      "[safe_fqi] Epoch 062 | ep_cost_mean=11.50 | avg_ep_len=1024.00| ep_reward_mean=-2.05 | unsafe_steps=46 over ~4 eps | info={'q1_loss': 3.3389155864715576, 'q2_loss': 3.3870420455932617, 'cost_loss': 0.016046494990587235, 'penalty': 5.470321735967856} | KL=None\n",
      "| penalty=5.470321735967856 \n",
      "| global_step=253952.0 \n",
      "[safe_fqi] Epoch 063 | ep_cost_mean=3.75 | avg_ep_len=1024.00| ep_reward_mean=-2.50 | unsafe_steps=15 over ~4 eps | info={'q1_loss': 4.0761566162109375, 'q2_loss': 4.161581516265869, 'cost_loss': 0.039937295764684674, 'penalty': 5.460451665472465} | KL=None\n",
      "| penalty=5.460451665472465 \n",
      "| global_step=258048.0 \n",
      "[safe_fqi] Epoch 064 | ep_cost_mean=0.00 | avg_ep_len=1024.00| ep_reward_mean=-0.58 | unsafe_steps=0 over ~4 eps | info={'q1_loss': 3.6778740882873535, 'q2_loss': 3.8137128353118896, 'cost_loss': 0.027690978720784187, 'penalty': 5.43912269727253} | KL=None\n",
      "| penalty=5.43912269727253 \n",
      "| global_step=262144.0 \n",
      "[safe_fqi] Epoch 065 | ep_cost_mean=21.50 | avg_ep_len=1024.00| ep_reward_mean=-0.96 | unsafe_steps=86 over ~4 eps | info={'q1_loss': 4.001325607299805, 'q2_loss': 4.0943284034729, 'cost_loss': 0.03242105953395367, 'penalty': 5.448483876754904} | KL=None\n",
      "| penalty=5.448483876754904 \n",
      "| global_step=266240.0 \n",
      "[safe_fqi] Epoch 066 | ep_cost_mean=151.75 | avg_ep_len=1024.00| ep_reward_mean=-1.10 | unsafe_steps=628 over ~4 eps | info={'q1_loss': 3.3866219520568848, 'q2_loss': 3.51870059967041, 'cost_loss': 0.023101060651242733, 'penalty': 5.6810327641039935} | KL=None\n",
      "| penalty=5.6810327641039935 \n",
      "| global_step=270336.0 \n",
      "[safe_fqi] Epoch 067 | ep_cost_mean=25.25 | avg_ep_len=1024.00| ep_reward_mean=-1.99 | unsafe_steps=101 over ~4 eps | info={'q1_loss': 4.362616539001465, 'q2_loss': 4.500914573669434, 'cost_loss': 0.03257664181292057, 'penalty': 5.817316788124117} | KL=None\n",
      "| penalty=5.817316788124117 \n",
      "| global_step=274432.0 \n",
      "[safe_fqi] Epoch 068 | ep_cost_mean=37.50 | avg_ep_len=1024.00| ep_reward_mean=-0.94 | unsafe_steps=150 over ~4 eps | info={'q1_loss': 3.6016435623168945, 'q2_loss': 3.7656748294830322, 'cost_loss': 0.022449539229273795, 'penalty': 5.881045919678784} | KL=None\n",
      "| penalty=5.881045919678784 \n",
      "| global_step=278528.0 \n",
      "[safe_fqi] Epoch 069 | ep_cost_mean=22.75 | avg_ep_len=1024.00| ep_reward_mean=-0.52 | unsafe_steps=106 over ~4 eps | info={'q1_loss': 4.045893669128418, 'q2_loss': 4.22872257232666, 'cost_loss': 0.02727922722697258, 'penalty': 5.924001810494752} | KL=None\n",
      "| penalty=5.924001810494752 \n",
      "| global_step=282624.0 \n",
      "[safe_fqi] Epoch 070 | ep_cost_mean=9.50 | avg_ep_len=1024.00| ep_reward_mean=-0.99 | unsafe_steps=51 over ~4 eps | info={'q1_loss': 3.6201894283294678, 'q2_loss': 3.77955961227417, 'cost_loss': 0.019114502333104612, 'penalty': 5.934496992855801} | KL=None\n",
      "| penalty=5.934496992855801 \n",
      "| global_step=286720.0 \n",
      "[safe_fqi] Epoch 071 | ep_cost_mean=0.00 | avg_ep_len=1024.00| ep_reward_mean=-2.10 | unsafe_steps=0 over ~4 eps | info={'q1_loss': 4.122448921203613, 'q2_loss': 4.282707691192627, 'cost_loss': 0.027407768368721008, 'penalty': 5.918578880147618} | KL=None\n",
      "| penalty=5.918578880147618 \n",
      "| global_step=290816.0 \n",
      "[safe_fqi] Epoch 072 | ep_cost_mean=13.50 | avg_ep_len=1024.00| ep_reward_mean=-0.88 | unsafe_steps=54 over ~4 eps | info={'q1_loss': 4.479525566101074, 'q2_loss': 4.62040901184082, 'cost_loss': 0.04056838303804398, 'penalty': 5.915675946783647} | KL=None\n",
      "| penalty=5.915675946783647 \n",
      "| global_step=294912.0 \n",
      "[safe_fqi] Epoch 073 | ep_cost_mean=5.75 | avg_ep_len=1024.00| ep_reward_mean=0.06 | unsafe_steps=45 over ~4 eps | info={'q1_loss': 4.195278644561768, 'q2_loss': 4.3181047439575195, 'cost_loss': 0.017974390462040902, 'penalty': 5.91051497427177} | KL=None\n",
      "| penalty=5.91051497427177 \n",
      "| global_step=299008.0 \n",
      "[safe_fqi] Epoch 074 | ep_cost_mean=0.00 | avg_ep_len=1024.00| ep_reward_mean=-0.10 | unsafe_steps=0 over ~4 eps | info={'q1_loss': 3.3582873344421387, 'q2_loss': 3.5434060096740723, 'cost_loss': 0.02457841970026493, 'penalty': 5.890885339365563} | KL=None\n",
      "| penalty=5.890885339365563 \n",
      "| global_step=303104.0 \n",
      "[safe_fqi] Epoch 075 | ep_cost_mean=33.75 | avg_ep_len=1024.00| ep_reward_mean=-1.57 | unsafe_steps=135 over ~4 eps | info={'q1_loss': 3.6657612323760986, 'q2_loss': 3.9394757747650146, 'cost_loss': 0.016827942244708537, 'penalty': 5.919794214582168} | KL=None\n",
      "| penalty=5.919794214582168 \n",
      "| global_step=307200.0 \n",
      "[safe_fqi] Epoch 076 | ep_cost_mean=31.25 | avg_ep_len=1024.00| ep_reward_mean=-0.76 | unsafe_steps=125 over ~4 eps | info={'q1_loss': 3.3175172805786133, 'q2_loss': 3.6459953784942627, 'cost_loss': 0.02413228414952755, 'penalty': 5.9710369810618324} | KL=None\n",
      "| penalty=5.9710369810618324 \n",
      "| global_step=311296.0 \n",
      "[safe_fqi] Epoch 077 | ep_cost_mean=2.00 | avg_ep_len=1024.00| ep_reward_mean=-2.18 | unsafe_steps=8 over ~4 eps | info={'q1_loss': 3.5099053382873535, 'q2_loss': 3.8525567054748535, 'cost_loss': 0.012940309569239616, 'penalty': 5.975964089494034} | KL=None\n",
      "| penalty=5.975964089494034 \n",
      "| global_step=315392.0 \n",
      "[safe_fqi] Epoch 078 | ep_cost_mean=2.75 | avg_ep_len=1024.00| ep_reward_mean=-1.82 | unsafe_steps=11 over ~4 eps | info={'q1_loss': 3.4544734954833984, 'q2_loss': 3.7918615341186523, 'cost_loss': 0.03545902147889137, 'penalty': 5.958962727005522} | KL=None\n",
      "| penalty=5.958962727005522 \n",
      "| global_step=319488.0 \n",
      "[safe_fqi] Epoch 079 | ep_cost_mean=19.50 | avg_ep_len=1024.00| ep_reward_mean=-2.26 | unsafe_steps=78 over ~4 eps | info={'q1_loss': 4.004456520080566, 'q2_loss': 4.59179162979126, 'cost_loss': 0.020548527128994465, 'penalty': 5.967325145070761} | KL=None\n",
      "| penalty=5.967325145070761 \n",
      "| global_step=323584.0 \n",
      "[safe_fqi] Epoch 080 | ep_cost_mean=0.00 | avg_ep_len=1024.00| ep_reward_mean=-1.29 | unsafe_steps=0 over ~4 eps | info={'q1_loss': 3.539954900741577, 'q2_loss': 4.157759666442871, 'cost_loss': 0.022530648671090604, 'penalty': 5.957927886195623} | KL=None\n",
      "| penalty=5.957927886195623 \n",
      "| global_step=327680.0 \n",
      "[safe_fqi] Epoch 081 | ep_cost_mean=4.00 | avg_ep_len=1024.00| ep_reward_mean=-0.08 | unsafe_steps=16 over ~4 eps | info={'q1_loss': 3.5351145267486572, 'q2_loss': 4.088423252105713, 'cost_loss': 0.028958485275506974, 'penalty': 5.940468664219915} | KL=None\n",
      "| penalty=5.940468664219915 \n",
      "| global_step=331776.0 \n",
      "[safe_fqi] Epoch 082 | ep_cost_mean=6.75 | avg_ep_len=1024.00| ep_reward_mean=-1.48 | unsafe_steps=30 over ~4 eps | info={'q1_loss': 4.3876543045043945, 'q2_loss': 5.071457386016846, 'cost_loss': 0.01075133252888918, 'penalty': 5.9294220034516325} | KL=None\n",
      "| penalty=5.9294220034516325 \n",
      "| global_step=335872.0 \n",
      "[safe_fqi] Epoch 083 | ep_cost_mean=8.00 | avg_ep_len=1024.00| ep_reward_mean=-1.79 | unsafe_steps=32 over ~4 eps | info={'q1_loss': 3.3106753826141357, 'q2_loss': 3.826500177383423, 'cost_loss': 0.0164787370711565, 'penalty': 5.92268844132934} | KL=None\n",
      "| penalty=5.92268844132934 \n",
      "| global_step=339968.0 \n",
      "[safe_fqi] Epoch 084 | ep_cost_mean=18.75 | avg_ep_len=1024.00| ep_reward_mean=-0.22 | unsafe_steps=75 over ~4 eps | info={'q1_loss': 6.777667999267578, 'q2_loss': 7.536355495452881, 'cost_loss': 0.011846411414444447, 'penalty': 5.9341617264075} | KL=None\n",
      "| penalty=5.9341617264075 \n",
      "| global_step=344064.0 \n",
      "[safe_fqi] Epoch 085 | ep_cost_mean=21.25 | avg_ep_len=1024.00| ep_reward_mean=-1.69 | unsafe_steps=85 over ~4 eps | info={'q1_loss': 4.139612674713135, 'q2_loss': 5.013665676116943, 'cost_loss': 0.016746986843645572, 'penalty': 5.958184909105968} | KL=None\n",
      "| penalty=5.958184909105968 \n",
      "| global_step=348160.0 \n",
      "[safe_fqi] Epoch 086 | ep_cost_mean=98.50 | avg_ep_len=1024.00| ep_reward_mean=0.54 | unsafe_steps=394 over ~4 eps | info={'q1_loss': 3.619091033935547, 'q2_loss': 4.125626564025879, 'cost_loss': 0.023594509251415728, 'penalty': 6.107290588055382} | KL=None\n",
      "| penalty=6.107290588055382 \n",
      "| global_step=352256.0 \n",
      "[safe_fqi] Epoch 087 | ep_cost_mean=14.25 | avg_ep_len=1024.00| ep_reward_mean=-2.27 | unsafe_steps=57 over ~4 eps | info={'q1_loss': 3.4297733306884766, 'q2_loss': 4.251989841461182, 'cost_loss': 0.02181309200823307, 'penalty': 6.184121047931936} | KL=None\n",
      "| penalty=6.184121047931936 \n",
      "| global_step=356352.0 \n",
      "[safe_fqi] Epoch 088 | ep_cost_mean=5.00 | avg_ep_len=1024.00| ep_reward_mean=-2.27 | unsafe_steps=20 over ~4 eps | info={'q1_loss': 4.265789985656738, 'q2_loss': 4.9346771240234375, 'cost_loss': 0.01984202116727829, 'penalty': 6.184407739061198} | KL=None\n",
      "| penalty=6.184407739061198 \n",
      "| global_step=360448.0 \n",
      "[safe_fqi] Epoch 089 | ep_cost_mean=22.75 | avg_ep_len=1024.00| ep_reward_mean=-2.71 | unsafe_steps=91 over ~4 eps | info={'q1_loss': 3.9619088172912598, 'q2_loss': 4.808474540710449, 'cost_loss': 0.02351020388305187, 'penalty': 6.20075593504771} | KL=None\n",
      "| penalty=6.20075593504771 \n",
      "| global_step=364544.0 \n",
      "[safe_fqi] Epoch 090 | ep_cost_mean=5.00 | avg_ep_len=1024.00| ep_reward_mean=-2.19 | unsafe_steps=20 over ~4 eps | info={'q1_loss': 3.964705467224121, 'q2_loss': 4.791101455688477, 'cost_loss': 0.021043716184794902, 'penalty': 6.202071035306971} | KL=None\n",
      "| penalty=6.202071035306971 \n",
      "| global_step=368640.0 \n",
      "[safe_fqi] Epoch 091 | ep_cost_mean=0.00 | avg_ep_len=1024.00| ep_reward_mean=-2.43 | unsafe_steps=0 over ~4 eps | info={'q1_loss': 4.286659240722656, 'q2_loss': 4.958093166351318, 'cost_loss': 0.017468255758285523, 'penalty': 6.182438329710352} | KL=None\n",
      "| penalty=6.182438329710352 \n",
      "| global_step=372736.0 \n",
      "[safe_fqi] Epoch 092 | ep_cost_mean=71.25 | avg_ep_len=1024.00| ep_reward_mean=-1.56 | unsafe_steps=285 over ~4 eps | info={'q1_loss': 3.699723720550537, 'q2_loss': 4.595488548278809, 'cost_loss': 0.016668184846639632, 'penalty': 6.2707865826608025} | KL=None\n",
      "| penalty=6.2707865826608025 \n",
      "| global_step=376832.0 \n",
      "[safe_fqi] Epoch 093 | ep_cost_mean=4.50 | avg_ep_len=1024.00| ep_reward_mean=-2.15 | unsafe_steps=33 over ~4 eps | info={'q1_loss': 4.216766357421875, 'q2_loss': 5.080532550811768, 'cost_loss': 0.027129750326275827, 'penalty': 6.309271250082222} | KL=None\n",
      "| penalty=6.309271250082222 \n",
      "| global_step=380928.0 \n",
      "[safe_fqi] Epoch 094 | ep_cost_mean=0.00 | avg_ep_len=1024.00| ep_reward_mean=-1.88 | unsafe_steps=0 over ~4 eps | info={'q1_loss': 6.497770309448242, 'q2_loss': 7.264989852905273, 'cost_loss': 0.026297695562243463, 'penalty': 6.29216430794549} | KL=None\n",
      "| penalty=6.29216430794549 \n",
      "| global_step=385024.0 \n",
      "[safe_fqi] Epoch 095 | ep_cost_mean=33.25 | avg_ep_len=1024.00| ep_reward_mean=-2.00 | unsafe_steps=143 over ~4 eps | info={'q1_loss': 4.115466117858887, 'q2_loss': 4.788983345031738, 'cost_loss': 0.018015182577073574, 'penalty': 6.320474763508096} | KL=None\n",
      "| penalty=6.320474763508096 \n",
      "| global_step=389120.0 \n",
      "[safe_fqi] Epoch 096 | ep_cost_mean=24.00 | avg_ep_len=1024.00| ep_reward_mean=-2.15 | unsafe_steps=96 over ~4 eps | info={'q1_loss': 4.089006423950195, 'q2_loss': 4.908361911773682, 'cost_loss': 0.02813931219279766, 'penalty': 6.359845577927607} | KL=None\n",
      "| penalty=6.359845577927607 \n",
      "| global_step=393216.0 \n",
      "[safe_fqi] Epoch 097 | ep_cost_mean=1.00 | avg_ep_len=1024.00| ep_reward_mean=-1.89 | unsafe_steps=4 over ~4 eps | info={'q1_loss': 4.536749839782715, 'q2_loss': 5.676555156707764, 'cost_loss': 0.01286041084676981, 'penalty': 6.357427547414941} | KL=None\n",
      "| penalty=6.357427547414941 \n",
      "| global_step=397312.0 \n",
      "[safe_fqi] Epoch 098 | ep_cost_mean=12.50 | avg_ep_len=1024.00| ep_reward_mean=-2.41 | unsafe_steps=50 over ~4 eps | info={'q1_loss': 7.904103755950928, 'q2_loss': 8.816343307495117, 'cost_loss': 0.027463584765791894, 'penalty': 6.354646817101095} | KL=None\n",
      "| penalty=6.354646817101095 \n",
      "| global_step=401408.0 \n",
      "[safe_fqi] Epoch 099 | ep_cost_mean=24.25 | avg_ep_len=1024.00| ep_reward_mean=-1.75 | unsafe_steps=97 over ~4 eps | info={'q1_loss': 4.303956985473633, 'q2_loss': 5.335580825805664, 'cost_loss': 0.01962446831166744, 'penalty': 6.378150294477616} | KL=None\n",
      "| penalty=6.378150294477616 \n",
      "| global_step=405504.0 \n",
      "[safe_fqi] Epoch 100 | ep_cost_mean=6.00 | avg_ep_len=1024.00| ep_reward_mean=-1.25 | unsafe_steps=24 over ~4 eps | info={'q1_loss': 3.9273743629455566, 'q2_loss': 4.860570430755615, 'cost_loss': 0.019257372803986074, 'penalty': 6.382603757959435} | KL=None\n",
      "| penalty=6.382603757959435 \n",
      "| global_step=409600.0 \n",
      "[safe_fqi] Epoch 101 | ep_cost_mean=53.50 | avg_ep_len=1024.00| ep_reward_mean=-1.41 | unsafe_steps=214 over ~4 eps | info={'q1_loss': 4.12800931930542, 'q2_loss': 5.060904026031494, 'cost_loss': 0.01931730266660452, 'penalty': 6.448681545561094} | KL=None\n",
      "| penalty=6.448681545561094 \n",
      "| global_step=413696.0 \n",
      "[safe_fqi] Epoch 102 | ep_cost_mean=12.50 | avg_ep_len=1024.00| ep_reward_mean=-1.55 | unsafe_steps=83 over ~4 eps | info={'q1_loss': 4.280649662017822, 'q2_loss': 5.465203285217285, 'cost_loss': 0.022611703351140024, 'penalty': 6.486267260756155} | KL=None\n",
      "| penalty=6.486267260756155 \n",
      "| global_step=417792.0 \n",
      "[safe_fqi] Epoch 103 | ep_cost_mean=10.75 | avg_ep_len=1024.00| ep_reward_mean=-1.72 | unsafe_steps=43 over ~4 eps | info={'q1_loss': 3.9450483322143555, 'q2_loss': 4.815011024475098, 'cost_loss': 0.029887601733207703, 'penalty': 6.4914784722414725} | KL=None\n",
      "| penalty=6.4914784722414725 \n",
      "| global_step=421888.0 \n",
      "[safe_fqi] Epoch 104 | ep_cost_mean=9.75 | avg_ep_len=1024.00| ep_reward_mean=-1.30 | unsafe_steps=39 over ~4 eps | info={'q1_loss': 4.066959857940674, 'q2_loss': 4.891276836395264, 'cost_loss': 0.025920262560248375, 'penalty': 6.491443704083115} | KL=None\n",
      "| penalty=6.491443704083115 \n",
      "| global_step=425984.0 \n",
      "[safe_fqi] Epoch 105 | ep_cost_mean=6.75 | avg_ep_len=1024.00| ep_reward_mean=-2.35 | unsafe_steps=27 over ~4 eps | info={'q1_loss': 4.839130878448486, 'q2_loss': 5.737588405609131, 'cost_loss': 0.023291503265500068, 'penalty': 6.4855816190972195} | KL=None\n",
      "| penalty=6.4855816190972195 \n",
      "| global_step=430080.0 \n",
      "[safe_fqi] Epoch 106 | ep_cost_mean=9.50 | avg_ep_len=1024.00| ep_reward_mean=-1.90 | unsafe_steps=38 over ~4 eps | info={'q1_loss': 4.51603889465332, 'q2_loss': 5.269113540649414, 'cost_loss': 0.022237338498234747, 'penalty': 6.481624568590643} | KL=None\n",
      "| penalty=6.481624568590643 \n",
      "| global_step=434176.0 \n",
      "[safe_fqi] Epoch 107 | ep_cost_mean=20.75 | avg_ep_len=1024.00| ep_reward_mean=-2.13 | unsafe_steps=83 over ~4 eps | info={'q1_loss': 3.8322737216949463, 'q2_loss': 4.672554016113281, 'cost_loss': 0.019373722746968268, 'penalty': 6.497484348932882} | KL=None\n",
      "| penalty=6.497484348932882 \n",
      "| global_step=438272.0 \n",
      "[safe_fqi] Epoch 108 | ep_cost_mean=11.50 | avg_ep_len=1024.00| ep_reward_mean=-2.33 | unsafe_steps=46 over ~4 eps | info={'q1_loss': 4.229565143585205, 'q2_loss': 4.937976837158203, 'cost_loss': 0.02810264825820923, 'penalty': 6.507727742624717} | KL=None\n",
      "| penalty=6.507727742624717 \n",
      "| global_step=442368.0 \n",
      "[safe_fqi] Epoch 109 | ep_cost_mean=12.75 | avg_ep_len=1024.00| ep_reward_mean=-2.29 | unsafe_steps=74 over ~4 eps | info={'q1_loss': 3.99708890914917, 'q2_loss': 4.938066482543945, 'cost_loss': 0.02419825866818428, 'penalty': 6.513336716672152} | KL=None\n",
      "| penalty=6.513336716672152 \n",
      "| global_step=446464.0 \n",
      "[safe_fqi] Epoch 110 | ep_cost_mean=20.75 | avg_ep_len=1024.00| ep_reward_mean=-0.44 | unsafe_steps=83 over ~4 eps | info={'q1_loss': 5.33876895904541, 'q2_loss': 6.165482044219971, 'cost_loss': 0.033311649784445764, 'penalty': 6.532105166319139} | KL=None\n",
      "| penalty=6.532105166319139 \n",
      "| global_step=450560.0 \n",
      "[safe_fqi] Epoch 111 | ep_cost_mean=9.00 | avg_ep_len=1024.00| ep_reward_mean=-1.17 | unsafe_steps=36 over ~4 eps | info={'q1_loss': 4.459436893463135, 'q2_loss': 5.091660499572754, 'cost_loss': 0.02454942762851715, 'penalty': 6.538609726564851} | KL=None\n",
      "| penalty=6.538609726564851 \n",
      "| global_step=454656.0 \n",
      "[safe_fqi] Epoch 112 | ep_cost_mean=5.25 | avg_ep_len=1024.00| ep_reward_mean=-1.20 | unsafe_steps=21 over ~4 eps | info={'q1_loss': 3.8027055263519287, 'q2_loss': 4.734567642211914, 'cost_loss': 0.022586798295378685, 'penalty': 6.530371853531338} | KL=None\n",
      "| penalty=6.530371853531338 \n",
      "| global_step=458752.0 \n",
      "[safe_fqi] Epoch 113 | ep_cost_mean=23.75 | avg_ep_len=1024.00| ep_reward_mean=-0.74 | unsafe_steps=95 over ~4 eps | info={'q1_loss': 3.6951866149902344, 'q2_loss': 4.554004192352295, 'cost_loss': 0.02012046929448843, 'penalty': 6.547816307495871} | KL=None\n",
      "| penalty=6.547816307495871 \n",
      "| global_step=462848.0 \n",
      "[safe_fqi] Epoch 114 | ep_cost_mean=22.50 | avg_ep_len=1024.00| ep_reward_mean=-1.13 | unsafe_steps=90 over ~4 eps | info={'q1_loss': 4.39054536819458, 'q2_loss': 5.195853233337402, 'cost_loss': 0.01635850705206394, 'penalty': 6.577622741768136} | KL=None\n",
      "| penalty=6.577622741768136 \n",
      "| global_step=466944.0 \n",
      "[safe_fqi] Epoch 115 | ep_cost_mean=50.25 | avg_ep_len=1024.00| ep_reward_mean=-0.51 | unsafe_steps=215 over ~4 eps | info={'q1_loss': 4.437655925750732, 'q2_loss': 5.118230819702148, 'cost_loss': 0.018778277561068535, 'penalty': 6.651530062759365} | KL=None\n",
      "| penalty=6.651530062759365 \n",
      "| global_step=471040.0 \n",
      "[safe_fqi] Epoch 116 | ep_cost_mean=0.00 | avg_ep_len=1024.00| ep_reward_mean=-1.70 | unsafe_steps=0 over ~4 eps | info={'q1_loss': 4.441143035888672, 'q2_loss': 5.324153900146484, 'cost_loss': 0.035098282247781755, 'penalty': 6.667732404756226} | KL=None\n",
      "| penalty=6.667732404756226 \n",
      "| global_step=475136.0 \n",
      "[safe_fqi] Epoch 117 | ep_cost_mean=58.50 | avg_ep_len=1024.00| ep_reward_mean=-0.58 | unsafe_steps=234 over ~4 eps | info={'q1_loss': 4.3183746337890625, 'q2_loss': 5.113317489624023, 'cost_loss': 0.015069111809134483, 'penalty': 6.738628515795063} | KL=None\n",
      "| penalty=6.738628515795063 \n",
      "| global_step=479232.0 \n",
      "[safe_fqi] Epoch 118 | ep_cost_mean=36.25 | avg_ep_len=1024.00| ep_reward_mean=3.52 | unsafe_steps=145 over ~4 eps | info={'q1_loss': 4.1526198387146, 'q2_loss': 4.837233543395996, 'cost_loss': 0.028509694337844848, 'penalty': 6.817572545304161} | KL=None\n",
      "| penalty=6.817572545304161 \n",
      "| global_step=483328.0 \n",
      "[safe_fqi] Epoch 119 | ep_cost_mean=7.75 | avg_ep_len=1024.00| ep_reward_mean=3.47 | unsafe_steps=31 over ~4 eps | info={'q1_loss': 4.23118257522583, 'q2_loss': 4.976517200469971, 'cost_loss': 0.030429900251328947, 'penalty': 6.837087680547724} | KL=None\n",
      "| penalty=6.837087680547724 \n",
      "| global_step=487424.0 \n",
      "[safe_fqi] Epoch 120 | ep_cost_mean=47.75 | avg_ep_len=1024.00| ep_reward_mean=2.33 | unsafe_steps=191 over ~4 eps | info={'q1_loss': 3.4323129653930664, 'q2_loss': 4.151915073394775, 'cost_loss': 0.021983988396823407, 'penalty': 6.896380181845404} | KL=None\n",
      "| penalty=6.896380181845404 \n",
      "| global_step=491520.0 \n",
      "[safe_fqi] Epoch 121 | ep_cost_mean=134.75 | avg_ep_len=1024.00| ep_reward_mean=-0.75 | unsafe_steps=539 over ~4 eps | info={'q1_loss': 3.2109899520874023, 'q2_loss': 3.897390842437744, 'cost_loss': 0.022780200839042662, 'penalty': 7.123373093405567} | KL=None\n",
      "| penalty=7.123373093405567 \n",
      "| global_step=495616.0 \n",
      "[safe_fqi] Epoch 122 | ep_cost_mean=14.50 | avg_ep_len=1024.00| ep_reward_mean=1.76 | unsafe_steps=58 over ~4 eps | info={'q1_loss': 3.207531213760376, 'q2_loss': 3.9558756351470947, 'cost_loss': 0.011664478667080402, 'penalty': 7.230825826130943} | KL=None\n",
      "| penalty=7.230825826130943 \n",
      "| global_step=499712.0 \n",
      "[safe_fqi] Epoch 123 | ep_cost_mean=49.25 | avg_ep_len=1024.00| ep_reward_mean=-0.54 | unsafe_steps=197 over ~4 eps | info={'q1_loss': 3.262111186981201, 'q2_loss': 3.850338935852051, 'cost_loss': 0.018750226497650145, 'penalty': 7.303774615800189} | KL=None\n",
      "| penalty=7.303774615800189 \n",
      "| global_step=503808.0 \n",
      "[safe_fqi] Epoch 124 | ep_cost_mean=60.25 | avg_ep_len=1024.00| ep_reward_mean=3.46 | unsafe_steps=241 over ~4 eps | info={'q1_loss': 3.2974839210510254, 'q2_loss': 3.924966335296631, 'cost_loss': 0.02394297793507576, 'penalty': 7.414734354201524} | KL=None\n",
      "| penalty=7.414734354201524 \n",
      "| global_step=507904.0 \n",
      "[safe_fqi] Epoch 125 | ep_cost_mean=28.75 | avg_ep_len=1024.00| ep_reward_mean=2.69 | unsafe_steps=115 over ~4 eps | info={'q1_loss': 3.531076431274414, 'q2_loss': 4.259357452392578, 'cost_loss': 0.02242315746843815, 'penalty': 7.486043023608507} | KL=None\n",
      "| penalty=7.486043023608507 \n",
      "| global_step=512000.0 \n",
      "[safe_fqi] Epoch 126 | ep_cost_mean=18.50 | avg_ep_len=1024.00| ep_reward_mean=4.00 | unsafe_steps=74 over ~4 eps | info={'q1_loss': 3.6500916481018066, 'q2_loss': 4.108515739440918, 'cost_loss': 0.03352318219840526, 'penalty': 7.5169962927766285} | KL=None\n",
      "| penalty=7.5169962927766285 \n",
      "| global_step=516096.0 \n",
      "[safe_fqi] Epoch 127 | ep_cost_mean=22.25 | avg_ep_len=1024.00| ep_reward_mean=1.93 | unsafe_steps=89 over ~4 eps | info={'q1_loss': 3.3933279514312744, 'q2_loss': 3.9965734481811523, 'cost_loss': 0.022567739337682725, 'penalty': 7.543936294759613} | KL=None\n",
      "| penalty=7.543936294759613 \n",
      "| global_step=520192.0 \n",
      "[safe_fqi] Epoch 128 | ep_cost_mean=13.25 | avg_ep_len=1024.00| ep_reward_mean=2.70 | unsafe_steps=70 over ~4 eps | info={'q1_loss': 5.939526081085205, 'q2_loss': 6.464014053344727, 'cost_loss': 0.033185144886374474, 'penalty': 7.5588088483847224} | KL=None\n",
      "| penalty=7.5588088483847224 \n",
      "| global_step=524288.0 \n",
      "[safe_fqi] Epoch 129 | ep_cost_mean=70.00 | avg_ep_len=1024.00| ep_reward_mean=8.95 | unsafe_steps=280 over ~4 eps | info={'q1_loss': 3.106069803237915, 'q2_loss': 3.654764413833618, 'cost_loss': 0.013433218374848366, 'penalty': 7.656688358296969} | KL=None\n",
      "| penalty=7.656688358296969 \n",
      "| global_step=528384.0 \n",
      "[safe_fqi] Epoch 130 | ep_cost_mean=55.00 | avg_ep_len=1024.00| ep_reward_mean=4.46 | unsafe_steps=220 over ~4 eps | info={'q1_loss': 2.984611988067627, 'q2_loss': 3.397125005722046, 'cost_loss': 0.015854626148939132, 'penalty': 7.775116134997702} | KL=None\n",
      "| penalty=7.775116134997702 \n",
      "| global_step=532480.0 \n",
      "[safe_fqi] Epoch 131 | ep_cost_mean=69.50 | avg_ep_len=1024.00| ep_reward_mean=5.38 | unsafe_steps=278 over ~4 eps | info={'q1_loss': 3.663973093032837, 'q2_loss': 4.308442115783691, 'cost_loss': 0.019105824269354345, 'penalty': 7.908080876001311} | KL=None\n",
      "| penalty=7.908080876001311 \n",
      "| global_step=536576.0 \n",
      "[safe_fqi] Epoch 132 | ep_cost_mean=46.50 | avg_ep_len=1024.00| ep_reward_mean=3.84 | unsafe_steps=186 over ~4 eps | info={'q1_loss': 3.9913902282714844, 'q2_loss': 4.598213195800781, 'cost_loss': 0.017567091807723045, 'penalty': 8.015401057799334} | KL=None\n",
      "| penalty=8.015401057799334 \n",
      "| global_step=540672.0 \n",
      "[safe_fqi] Epoch 133 | ep_cost_mean=47.75 | avg_ep_len=1024.00| ep_reward_mean=-4.02 | unsafe_steps=191 over ~4 eps | info={'q1_loss': 3.4490926265716553, 'q2_loss': 3.989682197570801, 'cost_loss': 0.019828814640641214, 'penalty': 8.107353933633414} | KL=None\n",
      "| penalty=8.107353933633414 \n",
      "| global_step=544768.0 \n",
      "[safe_fqi] Epoch 134 | ep_cost_mean=60.00 | avg_ep_len=1024.00| ep_reward_mean=1.13 | unsafe_steps=247 over ~4 eps | info={'q1_loss': 3.265845775604248, 'q2_loss': 3.8092920780181885, 'cost_loss': 0.020924513041973115, 'penalty': 8.218376932982121} | KL=None\n",
      "| penalty=8.218376932982121 \n",
      "| global_step=548864.0 \n",
      "[safe_fqi] Epoch 135 | ep_cost_mean=45.75 | avg_ep_len=1024.00| ep_reward_mean=6.19 | unsafe_steps=206 over ~4 eps | info={'q1_loss': 3.2039284706115723, 'q2_loss': 3.781205177307129, 'cost_loss': 0.021377287432551385, 'penalty': 8.316469304368214} | KL=None\n",
      "| penalty=8.316469304368214 \n",
      "| global_step=552960.0 \n",
      "[safe_fqi] Epoch 136 | ep_cost_mean=42.00 | avg_ep_len=1024.00| ep_reward_mean=5.46 | unsafe_steps=168 over ~4 eps | info={'q1_loss': 3.306147575378418, 'q2_loss': 3.8841094970703125, 'cost_loss': 0.011745926458388567, 'penalty': 8.398096700460707} | KL=None\n",
      "| penalty=8.398096700460707 \n",
      "| global_step=557056.0 \n",
      "[safe_fqi] Epoch 137 | ep_cost_mean=80.00 | avg_ep_len=1024.00| ep_reward_mean=6.02 | unsafe_steps=320 over ~4 eps | info={'q1_loss': 3.6860172748565674, 'q2_loss': 4.201657772064209, 'cost_loss': 0.022408602759242058, 'penalty': 8.536182481882717} | KL=None\n",
      "| penalty=8.536182481882717 \n",
      "| global_step=561152.0 \n",
      "[safe_fqi] Epoch 138 | ep_cost_mean=70.25 | avg_ep_len=1024.00| ep_reward_mean=8.18 | unsafe_steps=281 over ~4 eps | info={'q1_loss': 2.8658435344696045, 'q2_loss': 3.3742499351501465, 'cost_loss': 0.019442950189113618, 'penalty': 8.688560998176403} | KL=None\n",
      "| penalty=8.688560998176403 \n",
      "| global_step=565248.0 \n",
      "[safe_fqi] Epoch 139 | ep_cost_mean=63.75 | avg_ep_len=1024.00| ep_reward_mean=6.11 | unsafe_steps=266 over ~4 eps | info={'q1_loss': 3.2582015991210938, 'q2_loss': 3.784630537033081, 'cost_loss': 0.029405117407441138, 'penalty': 8.825218566827525} | KL=None\n",
      "| penalty=8.825218566827525 \n",
      "| global_step=569344.0 \n",
      "[safe_fqi] Epoch 140 | ep_cost_mean=70.50 | avg_ep_len=1024.00| ep_reward_mean=3.94 | unsafe_steps=282 over ~4 eps | info={'q1_loss': 4.080844879150391, 'q2_loss': 4.578373432159424, 'cost_loss': 0.030562032386660574, 'penalty': 8.967020394508523} | KL=None\n",
      "| penalty=8.967020394508523 \n",
      "| global_step=573440.0 \n",
      "[safe_fqi] Epoch 141 | ep_cost_mean=49.25 | avg_ep_len=1024.00| ep_reward_mean=8.70 | unsafe_steps=221 over ~4 eps | info={'q1_loss': 3.169522523880005, 'q2_loss': 3.57248592376709, 'cost_loss': 0.02316601201891899, 'penalty': 9.080047946682614} | KL=None\n",
      "| penalty=9.080047946682614 \n",
      "| global_step=577536.0 \n",
      "[safe_fqi] Epoch 142 | ep_cost_mean=49.50 | avg_ep_len=1024.00| ep_reward_mean=6.13 | unsafe_steps=217 over ~4 eps | info={'q1_loss': 2.5513758659362793, 'q2_loss': 2.881564140319824, 'cost_loss': 0.02400159537792206, 'penalty': 9.177052188458363} | KL=None\n",
      "| penalty=9.177052188458363 \n",
      "| global_step=581632.0 \n",
      "[safe_fqi] Epoch 143 | ep_cost_mean=49.25 | avg_ep_len=1024.00| ep_reward_mean=6.06 | unsafe_steps=197 over ~4 eps | info={'q1_loss': 3.6313514709472656, 'q2_loss': 4.038718223571777, 'cost_loss': 0.033919600769877434, 'penalty': 9.272594376901505} | KL=None\n",
      "| penalty=9.272594376901505 \n",
      "| global_step=585728.0 \n",
      "[safe_fqi] Epoch 144 | ep_cost_mean=67.75 | avg_ep_len=1024.00| ep_reward_mean=8.74 | unsafe_steps=275 over ~4 eps | info={'q1_loss': 5.485877513885498, 'q2_loss': 5.91096305847168, 'cost_loss': 0.020245364494621755, 'penalty': 9.397180486614522} | KL=None\n",
      "| penalty=9.397180486614522 \n",
      "| global_step=589824.0 \n",
      "[safe_fqi] Epoch 145 | ep_cost_mean=35.50 | avg_ep_len=1024.00| ep_reward_mean=5.31 | unsafe_steps=142 over ~4 eps | info={'q1_loss': 3.6544911861419678, 'q2_loss': 4.087538242340088, 'cost_loss': 0.025957425683736803, 'penalty': 9.485250486843423} | KL=None\n",
      "| penalty=9.485250486843423 \n",
      "| global_step=593920.0 \n",
      "[safe_fqi] Epoch 146 | ep_cost_mean=72.00 | avg_ep_len=1024.00| ep_reward_mean=10.31 | unsafe_steps=305 over ~4 eps | info={'q1_loss': 3.0796337127685547, 'q2_loss': 3.403563976287842, 'cost_loss': 0.031003794446587563, 'penalty': 9.606806319729158} | KL=None\n",
      "| penalty=9.606806319729158 \n",
      "| global_step=598016.0 \n",
      "[safe_fqi] Epoch 147 | ep_cost_mean=61.25 | avg_ep_len=1024.00| ep_reward_mean=7.90 | unsafe_steps=245 over ~4 eps | info={'q1_loss': 2.5054826736450195, 'q2_loss': 2.8160600662231445, 'cost_loss': 0.030958010256290434, 'penalty': 9.738299464716219} | KL=None\n",
      "| penalty=9.738299464716219 \n",
      "| global_step=602112.0 \n",
      "[safe_fqi] Epoch 148 | ep_cost_mean=32.25 | avg_ep_len=1024.00| ep_reward_mean=5.26 | unsafe_steps=129 over ~4 eps | info={'q1_loss': 4.359401226043701, 'q2_loss': 4.722997188568115, 'cost_loss': 0.02132926806807518, 'penalty': 9.817404269825602} | KL=None\n",
      "| penalty=9.817404269825602 \n",
      "| global_step=606208.0 \n",
      "[safe_fqi] Epoch 149 | ep_cost_mean=53.25 | avg_ep_len=1024.00| ep_reward_mean=6.33 | unsafe_steps=239 over ~4 eps | info={'q1_loss': 3.104973077774048, 'q2_loss': 3.3398866653442383, 'cost_loss': 0.025066529214382172, 'penalty': 9.906377857208543} | KL=None\n",
      "| penalty=9.906377857208543 \n",
      "| global_step=610304.0 \n",
      "[safe_fqi] Epoch 150 | ep_cost_mean=36.75 | avg_ep_len=1024.00| ep_reward_mean=7.20 | unsafe_steps=150 over ~4 eps | info={'q1_loss': 2.5469415187835693, 'q2_loss': 2.7448723316192627, 'cost_loss': 0.022636043652892113, 'penalty': 9.983995782227026} | KL=None\n",
      "| penalty=9.983995782227026 \n",
      "| global_step=614400.0 \n",
      "[safe_fqi] Epoch 151 | ep_cost_mean=25.25 | avg_ep_len=1024.00| ep_reward_mean=13.08 | unsafe_steps=114 over ~4 eps | info={'q1_loss': 2.4054994583129883, 'q2_loss': 2.643733263015747, 'cost_loss': 0.031889671459794044, 'penalty': 10.031481614896888} | KL=None\n",
      "| penalty=10.031481614896888 \n",
      "| global_step=618496.0 \n",
      "[safe_fqi] Epoch 152 | ep_cost_mean=53.25 | avg_ep_len=1024.00| ep_reward_mean=12.01 | unsafe_steps=213 over ~4 eps | info={'q1_loss': 2.456272840499878, 'q2_loss': 2.732539176940918, 'cost_loss': 0.02142045684158802, 'penalty': 10.113342809696862} | KL=None\n",
      "| penalty=10.113342809696862 \n",
      "| global_step=622592.0 \n",
      "[safe_fqi] Epoch 153 | ep_cost_mean=81.25 | avg_ep_len=1024.00| ep_reward_mean=14.90 | unsafe_steps=344 over ~4 eps | info={'q1_loss': 2.1960103511810303, 'q2_loss': 2.4098093509674072, 'cost_loss': 0.017034601792693137, 'penalty': 10.26094848046676} | KL=None\n",
      "| penalty=10.26094848046676 \n",
      "| global_step=626688.0 \n",
      "[safe_fqi] Epoch 154 | ep_cost_mean=39.00 | avg_ep_len=1024.00| ep_reward_mean=9.34 | unsafe_steps=156 over ~4 eps | info={'q1_loss': 2.064864158630371, 'q2_loss': 2.3232762813568115, 'cost_loss': 0.021317470446228982, 'penalty': 10.365362112653715} | KL=None\n",
      "| penalty=10.365362112653715 \n",
      "| global_step=630784.0 \n",
      "[safe_fqi] Epoch 155 | ep_cost_mean=42.75 | avg_ep_len=1024.00| ep_reward_mean=15.87 | unsafe_steps=171 over ~4 eps | info={'q1_loss': 2.5597193241119385, 'q2_loss': 2.8234190940856934, 'cost_loss': 0.022557116486132144, 'penalty': 10.444152342735299} | KL=None\n",
      "| penalty=10.444152342735299 \n",
      "| global_step=634880.0 \n",
      "[safe_fqi] Epoch 156 | ep_cost_mean=70.75 | avg_ep_len=1024.00| ep_reward_mean=11.16 | unsafe_steps=283 over ~4 eps | info={'q1_loss': 3.6085124015808105, 'q2_loss': 3.840649127960205, 'cost_loss': 0.019986749440431596, 'penalty': 10.567859418983105} | KL=None\n",
      "| penalty=10.567859418983105 \n",
      "| global_step=638976.0 \n",
      "[safe_fqi] Epoch 157 | ep_cost_mean=53.25 | avg_ep_len=1024.00| ep_reward_mean=10.99 | unsafe_steps=239 over ~4 eps | info={'q1_loss': 1.9629722833633423, 'q2_loss': 2.1740849018096924, 'cost_loss': 0.035207176581025124, 'penalty': 10.686002020432953} | KL=None\n",
      "| penalty=10.686002020432953 \n",
      "| global_step=643072.0 \n",
      "[safe_fqi] Epoch 158 | ep_cost_mean=60.00 | avg_ep_len=1024.00| ep_reward_mean=10.45 | unsafe_steps=240 over ~4 eps | info={'q1_loss': 2.186959743499756, 'q2_loss': 2.373199701309204, 'cost_loss': 0.020424484834074975, 'penalty': 10.802716915202643} | KL=None\n",
      "| penalty=10.802716915202643 \n",
      "| global_step=647168.0 \n",
      "[safe_fqi] Epoch 159 | ep_cost_mean=54.25 | avg_ep_len=1024.00| ep_reward_mean=12.94 | unsafe_steps=223 over ~4 eps | info={'q1_loss': 1.6736959218978882, 'q2_loss': 1.8830379247665405, 'cost_loss': 0.02079178299754858, 'penalty': 10.914720228516341} | KL=None\n",
      "| penalty=10.914720228516341 \n",
      "| global_step=651264.0 \n",
      "[safe_fqi] Epoch 160 | ep_cost_mean=39.25 | avg_ep_len=1024.00| ep_reward_mean=10.05 | unsafe_steps=171 over ~4 eps | info={'q1_loss': 1.8947057723999023, 'q2_loss': 2.027869701385498, 'cost_loss': 0.027909019961953163, 'penalty': 10.99874131209397} | KL=None\n",
      "| penalty=10.99874131209397 \n",
      "| global_step=655360.0 \n",
      "[safe_fqi] Epoch 161 | ep_cost_mean=77.00 | avg_ep_len=1024.00| ep_reward_mean=10.58 | unsafe_steps=308 over ~4 eps | info={'q1_loss': 1.816355586051941, 'q2_loss': 1.9693852663040161, 'cost_loss': 0.018664395809173583, 'penalty': 11.130417742804209} | KL=None\n",
      "| penalty=11.130417742804209 \n",
      "| global_step=659456.0 \n",
      "[safe_fqi] Epoch 162 | ep_cost_mean=59.75 | avg_ep_len=1024.00| ep_reward_mean=16.12 | unsafe_steps=239 over ~4 eps | info={'q1_loss': 1.7856473922729492, 'q2_loss': 1.9611167907714844, 'cost_loss': 0.019601013511419296, 'penalty': 11.26365451204486} | KL=None\n",
      "| penalty=11.26365451204486 \n",
      "| global_step=663552.0 \n",
      "[safe_fqi] Epoch 163 | ep_cost_mean=12.50 | avg_ep_len=1024.00| ep_reward_mean=14.70 | unsafe_steps=78 over ~4 eps | info={'q1_loss': 2.4319345951080322, 'q2_loss': 2.5624189376831055, 'cost_loss': 0.02357597164809704, 'penalty': 11.310585873002402} | KL=None\n",
      "| penalty=11.310585873002402 \n",
      "| global_step=667648.0 \n",
      "[safe_fqi] Epoch 164 | ep_cost_mean=37.00 | avg_ep_len=1024.00| ep_reward_mean=14.88 | unsafe_steps=148 over ~4 eps | info={'q1_loss': 2.283475399017334, 'q2_loss': 2.391951084136963, 'cost_loss': 0.02919522151350975, 'penalty': 11.358123914775481} | KL=None\n",
      "| penalty=11.358123914775481 \n",
      "| global_step=671744.0 \n",
      "[safe_fqi] Epoch 165 | ep_cost_mean=36.50 | avg_ep_len=1024.00| ep_reward_mean=13.50 | unsafe_steps=146 over ~4 eps | info={'q1_loss': 2.090596914291382, 'q2_loss': 2.2378664016723633, 'cost_loss': 0.027201354503631592, 'penalty': 11.421294259758337} | KL=None\n",
      "| penalty=11.421294259758337 \n",
      "| global_step=675840.0 \n",
      "[safe_fqi] Epoch 166 | ep_cost_mean=58.25 | avg_ep_len=1024.00| ep_reward_mean=13.67 | unsafe_steps=233 over ~4 eps | info={'q1_loss': 1.7177667617797852, 'q2_loss': 1.8421906232833862, 'cost_loss': 0.02125134114176035, 'penalty': 11.519808160083397} | KL=None\n",
      "| penalty=11.519808160083397 \n",
      "| global_step=679936.0 \n",
      "[safe_fqi] Epoch 167 | ep_cost_mean=34.75 | avg_ep_len=1024.00| ep_reward_mean=9.09 | unsafe_steps=152 over ~4 eps | info={'q1_loss': 1.8369113206863403, 'q2_loss': 1.9629874229431152, 'cost_loss': 0.03571287989616394, 'penalty': 11.598332531162766} | KL=None\n",
      "| penalty=11.598332531162766 \n",
      "| global_step=684032.0 \n",
      "[safe_fqi] Epoch 168 | ep_cost_mean=42.00 | avg_ep_len=1024.00| ep_reward_mean=5.28 | unsafe_steps=168 over ~4 eps | info={'q1_loss': 1.907349705696106, 'q2_loss': 2.017282485961914, 'cost_loss': 0.020854912325739862, 'penalty': 11.67110081269348} | KL=None\n",
      "| penalty=11.67110081269348 \n",
      "| global_step=688128.0 \n",
      "[safe_fqi] Epoch 169 | ep_cost_mean=78.00 | avg_ep_len=1024.00| ep_reward_mean=14.80 | unsafe_steps=312 over ~4 eps | info={'q1_loss': 2.09466814994812, 'q2_loss': 2.257416248321533, 'cost_loss': 0.020749961584806444, 'penalty': 11.805334817017467} | KL=None\n",
      "| penalty=11.805334817017467 \n",
      "| global_step=692224.0 \n",
      "[safe_fqi] Epoch 170 | ep_cost_mean=32.75 | avg_ep_len=1024.00| ep_reward_mean=10.77 | unsafe_steps=131 over ~4 eps | info={'q1_loss': 3.902449607849121, 'q2_loss': 4.032128810882568, 'cost_loss': 0.0210584556683898, 'penalty': 11.89664035254371} | KL=None\n",
      "| penalty=11.89664035254371 \n",
      "| global_step=696320.0 \n",
      "[safe_fqi] Epoch 171 | ep_cost_mean=46.25 | avg_ep_len=1024.00| ep_reward_mean=13.61 | unsafe_steps=185 over ~4 eps | info={'q1_loss': 3.714531898498535, 'q2_loss': 3.844480514526367, 'cost_loss': 0.024172888323664665, 'penalty': 11.975791578178567} | KL=None\n",
      "| penalty=11.975791578178567 \n",
      "| global_step=700416.0 \n",
      "[safe_fqi] Epoch 172 | ep_cost_mean=71.25 | avg_ep_len=1024.00| ep_reward_mean=14.13 | unsafe_steps=285 over ~4 eps | info={'q1_loss': 1.265455722808838, 'q2_loss': 1.4086531400680542, 'cost_loss': 0.02169044651091099, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=704512.0 \n",
      "[safe_fqi] Epoch 173 | ep_cost_mean=76.75 | avg_ep_len=1024.00| ep_reward_mean=12.71 | unsafe_steps=322 over ~4 eps | info={'q1_loss': 1.6768780946731567, 'q2_loss': 1.8054759502410889, 'cost_loss': 0.029242536053061485, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=708608.0 \n",
      "[safe_fqi] Epoch 174 | ep_cost_mean=84.50 | avg_ep_len=1024.00| ep_reward_mean=17.47 | unsafe_steps=338 over ~4 eps | info={'q1_loss': 1.4750850200653076, 'q2_loss': 1.5749956369400024, 'cost_loss': 0.01855279505252838, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=712704.0 \n",
      "[safe_fqi] Epoch 175 | ep_cost_mean=106.75 | avg_ep_len=1024.00| ep_reward_mean=15.65 | unsafe_steps=427 over ~4 eps | info={'q1_loss': 1.391268253326416, 'q2_loss': 1.507683277130127, 'cost_loss': 0.017223617434501647, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=716800.0 \n",
      "[safe_fqi] Epoch 176 | ep_cost_mean=83.00 | avg_ep_len=1024.00| ep_reward_mean=19.97 | unsafe_steps=332 over ~4 eps | info={'q1_loss': 1.8393054008483887, 'q2_loss': 1.9682395458221436, 'cost_loss': 0.018649319745600225, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=720896.0 \n",
      "[safe_fqi] Epoch 177 | ep_cost_mean=57.50 | avg_ep_len=1024.00| ep_reward_mean=13.50 | unsafe_steps=230 over ~4 eps | info={'q1_loss': 1.3842612504959106, 'q2_loss': 1.5222886800765991, 'cost_loss': 0.015521297790110111, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=724992.0 \n",
      "[safe_fqi] Epoch 178 | ep_cost_mean=83.75 | avg_ep_len=1024.00| ep_reward_mean=16.96 | unsafe_steps=335 over ~4 eps | info={'q1_loss': 1.2674845457077026, 'q2_loss': 1.3402544260025024, 'cost_loss': 0.02232600636780262, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=729088.0 \n",
      "[safe_fqi] Epoch 179 | ep_cost_mean=103.25 | avg_ep_len=1024.00| ep_reward_mean=18.79 | unsafe_steps=425 over ~4 eps | info={'q1_loss': 1.5581881999969482, 'q2_loss': 1.611415982246399, 'cost_loss': 0.032215343415737153, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=733184.0 \n",
      "[safe_fqi] Epoch 180 | ep_cost_mean=60.25 | avg_ep_len=1024.00| ep_reward_mean=18.37 | unsafe_steps=257 over ~4 eps | info={'q1_loss': 1.395699143409729, 'q2_loss': 1.4506224393844604, 'cost_loss': 0.01893935240805149, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=737280.0 \n",
      "[safe_fqi] Epoch 181 | ep_cost_mean=82.00 | avg_ep_len=1024.00| ep_reward_mean=18.16 | unsafe_steps=328 over ~4 eps | info={'q1_loss': 1.2498351335525513, 'q2_loss': 1.2987055778503418, 'cost_loss': 0.021315402537584304, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=741376.0 \n",
      "[safe_fqi] Epoch 182 | ep_cost_mean=26.25 | avg_ep_len=1024.00| ep_reward_mean=8.69 | unsafe_steps=105 over ~4 eps | info={'q1_loss': 2.795609474182129, 'q2_loss': 2.8145735263824463, 'cost_loss': 0.02627541311085224, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=745472.0 \n",
      "[safe_fqi] Epoch 183 | ep_cost_mean=30.25 | avg_ep_len=1024.00| ep_reward_mean=7.47 | unsafe_steps=121 over ~4 eps | info={'q1_loss': 1.15944242477417, 'q2_loss': 1.1920260190963745, 'cost_loss': 0.024521687626838685, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=749568.0 \n",
      "[safe_fqi] Epoch 184 | ep_cost_mean=43.75 | avg_ep_len=1024.00| ep_reward_mean=9.65 | unsafe_steps=185 over ~4 eps | info={'q1_loss': 1.1707954406738281, 'q2_loss': 1.2141751050949097, 'cost_loss': 0.029507090523838996, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=753664.0 \n",
      "[safe_fqi] Epoch 185 | ep_cost_mean=40.25 | avg_ep_len=1024.00| ep_reward_mean=10.48 | unsafe_steps=161 over ~4 eps | info={'q1_loss': 2.640333414077759, 'q2_loss': 2.70261287689209, 'cost_loss': 0.039666876569390296, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=757760.0 \n",
      "[safe_fqi] Epoch 186 | ep_cost_mean=67.50 | avg_ep_len=1024.00| ep_reward_mean=15.11 | unsafe_steps=270 over ~4 eps | info={'q1_loss': 2.531451940536499, 'q2_loss': 2.5747873783111572, 'cost_loss': 0.026099634543061256, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=761856.0 \n",
      "[safe_fqi] Epoch 187 | ep_cost_mean=81.00 | avg_ep_len=1024.00| ep_reward_mean=19.71 | unsafe_steps=324 over ~4 eps | info={'q1_loss': 1.1290736198425293, 'q2_loss': 1.175806999206543, 'cost_loss': 0.021184176951646806, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=765952.0 \n",
      "[safe_fqi] Epoch 188 | ep_cost_mean=72.25 | avg_ep_len=1024.00| ep_reward_mean=18.98 | unsafe_steps=303 over ~4 eps | info={'q1_loss': 3.683192014694214, 'q2_loss': 3.7542941570281982, 'cost_loss': 0.024992967396974562, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=770048.0 \n",
      "[safe_fqi] Epoch 189 | ep_cost_mean=70.00 | avg_ep_len=1024.00| ep_reward_mean=14.32 | unsafe_steps=280 over ~4 eps | info={'q1_loss': 1.2889671325683594, 'q2_loss': 1.335349202156067, 'cost_loss': 0.02778810281306505, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=774144.0 \n",
      "[safe_fqi] Epoch 190 | ep_cost_mean=42.00 | avg_ep_len=1024.00| ep_reward_mean=15.54 | unsafe_steps=188 over ~4 eps | info={'q1_loss': 1.2674285173416138, 'q2_loss': 1.330660104751587, 'cost_loss': 0.02799553982913494, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=778240.0 \n",
      "[safe_fqi] Epoch 191 | ep_cost_mean=43.00 | avg_ep_len=1024.00| ep_reward_mean=17.01 | unsafe_steps=172 over ~4 eps | info={'q1_loss': 3.5426955223083496, 'q2_loss': 3.60288667678833, 'cost_loss': 0.028218933567404746, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=782336.0 \n",
      "[safe_fqi] Epoch 192 | ep_cost_mean=64.50 | avg_ep_len=1024.00| ep_reward_mean=17.99 | unsafe_steps=258 over ~4 eps | info={'q1_loss': 1.2398262023925781, 'q2_loss': 1.311125636100769, 'cost_loss': 0.026523770391941072, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=786432.0 \n",
      "[safe_fqi] Epoch 193 | ep_cost_mean=45.75 | avg_ep_len=1024.00| ep_reward_mean=15.55 | unsafe_steps=193 over ~4 eps | info={'q1_loss': 2.9383373260498047, 'q2_loss': 2.983157157897949, 'cost_loss': 0.021709655225276948, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=790528.0 \n",
      "[safe_fqi] Epoch 194 | ep_cost_mean=40.25 | avg_ep_len=1024.00| ep_reward_mean=13.86 | unsafe_steps=161 over ~4 eps | info={'q1_loss': 1.1433794498443604, 'q2_loss': 1.2101154327392578, 'cost_loss': 0.021257520467042924, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=794624.0 \n",
      "[safe_fqi] Epoch 195 | ep_cost_mean=25.00 | avg_ep_len=1024.00| ep_reward_mean=16.45 | unsafe_steps=116 over ~4 eps | info={'q1_loss': 2.3553004264831543, 'q2_loss': 2.4166407585144043, 'cost_loss': 0.024161579459905623, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=798720.0 \n",
      "[safe_fqi] Epoch 196 | ep_cost_mean=24.50 | avg_ep_len=1024.00| ep_reward_mean=11.44 | unsafe_steps=98 over ~4 eps | info={'q1_loss': 1.2816015481948853, 'q2_loss': 1.3449276685714722, 'cost_loss': 0.023757075518369676, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=802816.0 \n",
      "[safe_fqi] Epoch 197 | ep_cost_mean=56.50 | avg_ep_len=1024.00| ep_reward_mean=18.22 | unsafe_steps=226 over ~4 eps | info={'q1_loss': 1.3198888301849365, 'q2_loss': 1.3685073852539062, 'cost_loss': 0.020221473649144173, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=806912.0 \n",
      "[safe_fqi] Epoch 198 | ep_cost_mean=44.75 | avg_ep_len=1024.00| ep_reward_mean=19.11 | unsafe_steps=179 over ~4 eps | info={'q1_loss': 2.0211408138275146, 'q2_loss': 2.047995090484619, 'cost_loss': 0.021734359487891198, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=811008.0 \n",
      "[safe_fqi] Epoch 199 | ep_cost_mean=53.00 | avg_ep_len=1024.00| ep_reward_mean=20.95 | unsafe_steps=212 over ~4 eps | info={'q1_loss': 1.4494463205337524, 'q2_loss': 1.4925493001937866, 'cost_loss': 0.0199179844930768, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=815104.0 \n",
      "[safe_fqi] Epoch 200 | ep_cost_mean=71.25 | avg_ep_len=1024.00| ep_reward_mean=18.39 | unsafe_steps=285 over ~4 eps | info={'q1_loss': 2.8437564373016357, 'q2_loss': 2.89302396774292, 'cost_loss': 0.024513354897499083, 'penalty': 12.0} | KL=None\n",
      "| penalty=12.0 \n",
      "| global_step=819200.0 \n"
     ]
    }
   ],
   "source": [
    "\n",
    "fqi = argparse.ArgumentParser()\n",
    "fqi.add_argument(\"--algo\", type=str, default=\"safe_fqi\")\n",
    "fqi.add_argument(\"--env-id\", type=str, default=\"SafetyPointGoal1-v0\")\n",
    "fqi.add_argument(\"--steps-per-epoch\", type=int, default=4096)\n",
    "fqi.add_argument(\"--epochs\", type=int, default=200)\n",
    "fqi.add_argument(\"--device\", type=str, default=device)\n",
    "fqi.add_argument(\"--seed\", type=int, default=0)\n",
    "fqi.add_argument(\"--cost-limit\", type=float, default=0.01)\n",
    "\n",
    "# ← run HybridAgent\n",
    "args_fqi, _ = fqi.parse_known_args()\n",
    "fqi_cost_curve, fqi_rew_curve = train(\n",
    "    algo=args_fqi.algo,\n",
    "    env_id=args_fqi.env_id,\n",
    "    steps_per_epoch=args_fqi.steps_per_epoch,\n",
    "    epochs=args_fqi.epochs,\n",
    "    device=args_fqi.device,\n",
    "    seed=args_fqi.seed,\n",
    "    cost_limit=args_fqi.cost_limit,)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "99f9a869",
   "metadata": {},
   "outputs": [],
   "source": [
    "# safefqi_cost = {\n",
    "# \"safe_fqi_cost_curve\":fqi_cost_curve,\n",
    "# \"safe_fqi_rew_curve\":fqi_rew_curve}\n",
    "\n",
    "\n",
    "# with open(\"safefqi_cost_07_015\", \"w\") as f:\n",
    "#     json.dump(safefqi_cost, f)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8079edd6",
   "metadata": {},
   "outputs": [],
   "source": [
    "plt.figure(figsize=(8,5))\n",
    "\n",
    "plt.plot(range(1, len(cost_curve)+1), cost_curve, label=\"CPO\")\n",
    "# plt.plot(range(1, len(act_cost_curve)+1), act_cost_curve, label=\"ActSafe\")\n",
    "# plt.plot(range(1, len(GP_cost_curve)+1), GP_cost_curve, label=\"LSEES(Ours)\")\n",
    "# plt.plot(range(1, len(hybrid_cost_curve)+1), hybrid_cost_curve, label=\"hybrid)\")\n",
    "plt.plot(range(1, len(fqi_cost_curve)+1), fqi_cost_curve, label=\"LSEES(Ours)\")\n",
    "plt.xlabel(\"Epoch\"); plt.ylabel(\"Mean episode cost\"); plt.legend(); plt.tight_layout()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "817c27df",
   "metadata": {},
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "86e228d0",
   "metadata": {},
   "outputs": [],
   "source": [
    "plt.figure(figsize=(8,5))\n",
    "plt.plot(range(1, len(cost_curve)+1), rew_curve, label=\"CPO\")\n",
    "# plt.plot(range(1, len(GP_cost_curve)+1), act_rew_curve, label=\"ActSafe\")\n",
    "# plt.plot(range(1, len(hybrid_rew_curve)+1), hybrid_rew_curve, label=\"hybrid)\")\n",
    "# plt.plot(range(1, len(GP_cost_curve)+1), GP_rew_curve, label=\"LSEES(Ours)\")\n",
    "plt.plot(range(1, len(fqi_rew_curve)+1), fqi_rew_curve, label=\"LSEES(Ours)\")\n",
    "plt.xlabel(\"Epoch\"); plt.ylabel(\"Mean episode reward\"); plt.legend(); plt.tight_layout()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ddbf55be",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "7f9f0e32",
   "metadata": {},
   "source": [
    "<!-- with open(\"safefqi_cost_08_02.json\", \"r\") as f:\n",
    "    loaded = json.load(f)\n",
    "    \n",
    "# cost_curve=loaded[\"CPO_cost_curve\"]\n",
    "# rew_curve=loaded[\"CPO_rew_curve\"]\n",
    "# act_cost_curve=loaded[\"ActSafe_cost_curve\"]\n",
    "# act_rew_curve=loaded[\"ActSafe_rew_curve\"] -->"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "id": "79c1c548",
   "metadata": {},
   "outputs": [],
   "source": [
    "with open(\"safefqi_cost_08_02\", \"r\") as f:\n",
    "    loaded = json.load(f)\n",
    "fqi_cost_curve=loaded[\"safe_fqi_cost_curve\"]\n",
    "fqi_rew_curve=loaded[\"safe_fqi_rew_curve\"]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "id": "eaa62416",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAjIAAAHHCAYAAACle7JuAAAAOnRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjEwLjUsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcvWftoOwAAAAlwSFlzAAAPYQAAD2EBqD+naQAAOQtJREFUeJzt3Qd8FNX+//9PIPTeCdK7dEVBFDRIl8sXhKs0pcgXBFFRRLxYINgoKhdRBLxXAb8qIFfAgqJSRQERKQEFpBcJgiBdQpv/43Puf+e3u9lUdrN7wuv5eAzJzs7OnpwMO++cc+ZMlOM4jgAAAFgoW7gLAAAAkFEEGQAAYC2CDAAAsBZBBgAAWIsgAwAArEWQAQAA1iLIAAAAaxFkAACAtQgyAADAWgQZAFaLiooyS8WKFcVGcXFx7s8wY8aMcBcHsA5BBtY7e/as/POf/5Tbb79dihUrJrlz55ZKlSrJ3/72N3n//fflwoULIX3/BQsWmJORLnv37k336xcvXixdu3aV8uXLm7KXLFlSGjVqJKNHj5b9+/eHpMwIvuXLl6cYqrwDS58+fSLm+ANsFx3uAgBX45dffpEOHTrI7t27fdbrB7ouCxculDp16kiDBg1CVgY9kcycOdN8Hxsbm+aWgYsXL0q/fv3k//7v/3zWHz161Cw//vij/PnnnzJx4sSQlDurWLlypfmqIdBGDzzwgLRs2dJ8X7169Uw7/oCsgiADax0/flzatWvntlqUKVNGnnzySalbt66cPn1aVqxYIdOnT5dI9fjjj7shJlu2bNK/f3/TiqQn5M2bN1+z3QzawpYvX740b9+0aVOxmbbE6ZKVaCuoHtPR0ZxikAn07teAjUaMGKF3bjdLoUKFnIMHDybZ5vfff3eOHTvmPk5MTHTGjh3r1K9f38mbN6+TJ08ep169es6YMWPMc942btzo/M///I9TokQJJzo62ilatKh53YMPPujs27fP2bNnj/v+gZZly5YlW/atW7c62bJlc7d94403kmxz5coVZ9u2bT7rlixZ4tx1111OsWLFnBw5cjhly5Z1evfu7fz6668+240aNcrd97///W8nLi7OKV26tFOgQAGnW7duzp9//mnq5b777nMKFizoFClSxPxcf/31l7sP75/vjjvucNauXevcfvvtps5iYmKcZ5991rl48aK7/ZkzZ5yBAwc6DRs2dEqWLGnKp/u+5ZZbTBm8+e97xYoVZrvcuXObnyct9e/h2U+FChV83iM9v2t9rWc/CQkJpl4KFy7s5M+f37n33nt9jqHk6O87ubL4/048P6P/+unTp4fk+EvrcaM2bdrkxMbGmvq67rrrzLHzzTffBCy7fu9Z/8UXXzhDhw41x1lUVJQpn/6f7Nu3r6l3fW/9OfRYa968uTN//vxk60/3+9FHHzk1a9Y05WjatKkTHx/vXL582Rk9erRTpkwZs75t27bO3r17U/3dIGsjyMBalStXdj/49MM2NefPnzcn4uQ++PU5zwnujz/+MCeQ5LbVD/arCTLPP/+8u13VqlWdS5cupVr+yZMnmxNEoPfSgKJBI9DJsUqVKkm21xNAo0aNkqx/5pln3H14/3x64suXL1+S7fWk6qEBIKX60BNQoH3rSUkDjPdJLC317xEoPKTnd+0fZLyPK8/Ss2fPTA0ywTz+0nPc7N692wQ4/+00QKUWZPzrTcu3evXqFMs4c+bMgPVXqVKlJGXWgNS/f/8k+7jttttS/d0gayPIwEqnT5/2+TDTvzhTo3+de7YvV66c8+GHHzqzZs1yypcv767XbdRnn33mruvevbs5cSxYsMB59dVXTQvC0qVLzcly5cqVTrt27dxtJ02aZNbpcuLEiWTL0qVLF/c1999/f6pl379/v5MzZ06zvbbkaGvIwoULnXvuucfdT61atUwrjv/JMXv27M748eOdOXPmmBOXZ722NmhLyZQpU9x1xYsXd9/T/0TZunVrUy8vvPCC2adnvf4Fr06ePGkCmv4l/fXXX5sT0+zZs51q1aq57+cJD/771jD3/vvvm7/q9S/1tNS/R6DwkJ7ftX+Q0dYmLctbb73l1rn+vCn9Pv1PxKktqQWZYB1/6T1u9L0867UVRX8Xr7/+umn9SC3I6PLoo486ixYtcqZNm2bCmP6etZ4//vhjZ/HixaaONLx4QpoeG8nVn7bkaFnr1q3rs15bYrVcpUqVctdt2bIl1f9DyLoIMrCSNll7f7hpV01q9IPZs72eKDy8Txr6l6fSD2PPuuHDh5sTgufD3p/3h3lKrTDeWrZs6b7mqaeeSnX7CRMmuNtrCPK4cOGC+UvV89yGDRuSnBx79Ojhbt++fXt3/XPPPeeur127trvec8L2DhvaNeN9ItcWCs9zGl6867JVq1YmEHmHHf/Q471vPcH6d6Glp/4DBZn0/K79g4x3l4e2XHnWa1dPZgWZYB1/6TlutNtGw6Zn3ebNm93t//GPf6QaZLyPM28zZsxwmjVrZlp6ArUMaQD2rz8Nn1oe9corr7jrdT8egwcPdtdryMO1i8uvYaVChQr5PD506FCqr/n111/d7xs3bux+r5c6+2/TrFkzqVatmvl+/PjxZjCmvqdeFfKvf/1Lrly5ErTyX03Zc+TIITfccEPA7QL9fEWLFnW/v+mmm9zvixcv7n5/4sSJJPuoWbOmT5m99+m5YmzevHnmCrJvvvlG/vjjD7l8+XKS/QTat9ZzjRo1fNZdbf2n53ft74477nC/18v5Uyp7ckqXLm2upvJe+vbtm+bXB+v4S89xc+TIETlz5ox5nDdvXnO1n0eTJk1SfS/93fvTaRH0UnP9+bX+/ps7fQWq14YNG5rBwldzzOLaQZCBlfLnzy+VK1d2H3///fcZ3pfO6+FPP8h1n88//7zceeed5sTkuRJqwIAB5uRyNerXr+9+v2bNmoAn/aspvzfvAOI5OaiCBQsG3D7QySYt7/nmm2+63+vJ6+uvvzYnsFatWrnrA52AS5UqlWn1n1pdqSJFirjfe191k5Z68ciVK5e5msp7Sc+VSaE+/lKri7TUU1p+j2+88Yb7/fDhw2XJkiXmmNArC1M6JkJxzCLrIsjAWjqJnMeECRMCtmzoX5l6mbb/HB1r1651v//hhx/c7z3b6AdjiRIl5LnnnjMfvgkJCablQQOUp/Uh0AdtWv9Svueee9zX7dixQ95+++0k22gZtm/fnmLZdS6aDRs2JCl/sGk5Tp06FbDOPIHyt99+8zmBaYC59dZbfdan9aSZnvoPJD2/60gUrOMvPceNTsRYoEAB9xL4rVu3us+vXr061TIH+j16fvfasjVu3DgTyrQlKLVjAkgPLvKHtYYNGyYffPCBmUdGm5a16VzXeeaR0ZlWdR4Z/arN0z169JD4+Hjz2sGDB5tt9MP3H//4h7vP7t27m6+rVq2SRx99VLp06WKa+LUZW1977tw583xiYmLAv+B1JuHs2bObJaX5TbSrZtCgQTJ58mTz+JFHHjFzx7Rv3978Nb9lyxZT9ubNm5sJ8f7+97/LU089ZU5AehIbNWqU3HLLLWYiND3JqVq1avm09ASTntg0OD788MOyadMmmT17tvtcx44dzdcKFSq4XRkjR46UNm3amHlydNLC9EpP/QeSnt91JArW8Zee40brR7uHPvzwQ7P+/vvvN0FK/3+9/vrrGfo59JjQoH7s2DEZO3as1KtXz+zL88cFEBThHqQDXI2ff/454OWy3otnAKxe5aGDBdNySa5e9ZHSPnUukkADSL2X1OiAS71iKaX3GTJkyFVffu09N0lyA0P1ShjPeh2I6z8gVwfD6pww/u/7v//7v+4+5s6dm+R5vaxa55Xxf0//eWT8paf+Aw32Tc/v2n+wb0YHcgfz8utgHn/BuPzae/B0coN9A9WP90Bdz6IDwWvUqJHkePOfR8ZD68SzXusqpXrDtYmuJVhN/5rUv1S1a0n/AtWWl5w5c0q5cuVMi4D+5anbKG3p0IGonr8M8+TJY2bR1RacMWPGmDEd+lpPU7v+Jat/vWrfv46V0Gb9m2++2bSi6HMeOhvvq6++KlWqVEnXTKY64PK9994z76tdTWXLljXvr83wN954o/lreOjQoe72Dz30kCm/zmasP6e+l85m3KtXL/npp59M2UJFp73X8Rk62FTrTcdsPP300zJlyhR3G/3rf9q0aaYFQetVy7No0SKfQaNplZ76DyQ9v+tIFMzjLz3Hjd6jzPN71vqKiYmRZ5991rSweY/fSc/s1S+++KJpmdHX6X6XLl1qjh8gWKI0zQRtbwCyDL1XlZ7YPFfyaBcdsj49JfiPd9EuOR3jovSPBg0oQKRgjAwAwKUDtIcMGWJaBZW2qk2aNMltRezcuXOYSwj4IsgAAHymA9DFn7bS6Lww2k0ERBLGyAAAXHoFnY4r0rlctAVGx9Po1VM6dkavAAMiDWNkAACAtWiRAQAA1iLIAAAAa2X5wb46ZbdOXa9Tb2fk/iEAACDz6cgXnZVbx2l534rjmgsyGmJ0cjQAAGCfAwcOmAlDr9kg47kJmlZEcndOBQAAkUVvVKsNEZ7z+DUbZDzdSRpiCDIAANgltWEhDPYFAADWIsgAAABrEWQAAIC1svwYGQBAZLh8+bJcvHgx3MVAhNBbYGTPnv2q90OQAQCEfD6Qw4cPy4kTJ8JdFESYwoULS+nSpa9qnjeCDAAgpDwhpmTJkpI3b14mJ4VouD137pwcOXLEPI6JicnwvggyAICQdid5QkyxYsXCXRxEkDx58pivGmb0+MhoNxODfQEAIeMZE6MtMYA/z3FxNWOnCDIAgJCjOwmhOi4IMgAAwFoEGQAAYC0G+wIAMl1cnB3vp1dcvfTSS7Jw4UL57bffzKDUBg0ayGOPPSYtWrSQihUryr59+9zxHjVq1JARI0bIPffc4+7j+PHj8vzzz8v8+fMlISFBihcvLm3btpW4uDgpX758sH7EaxYtMgAABLB3715p2LChLF26VF555RXZvHmzLFq0SJo3by6DBw92t9OQogFlw4YNcvPNN0vXrl1l1apVboi55ZZbZPHixTJ16lTZuXOnzJ4923zVbXfv3h3GnzBroEUGAIAAHnroITMYde3atZIvXz53fe3ateWBBx5wHxcoUMBM6qbL5MmT5f3335fPPvtMbr31VnnmmWfk0KFDJrjo80pbYb766iupVq2aCURffvllWH6+rIIWGQAA/GhLira+aNDwDjHeM9IGEh0dbabev3Dhgly5csW0vvTs2dMNMd5zqGhQ0kCj74WMo0UGiE9H53m9TO7YzyLjFjJ7PARwtbQFRWefrVmzZppfo+Hltddek5MnT8qdd94pR48eNZMBXn/99QG31/X6HvpejRo1CmLpry20yAAA4EcDRlo99dRTkj9/fjPYd9y4cTJ27Fhp3759hvaF9KNFBgAAPzp+RcfHbNu2LdVtn3zySenTp48JM6VKlXIneStRooTpgtq6dWvA1+l63bZq1apBL/+1hBYZAAD8FC1aVNq0aWMG7549ezbJ89538tbLqTWM+N/FOVu2bHLvvffKhx9+aC7j9vbXX3/JW2+9Zd5D3wsZR5ABACAADTF600sdv/Lxxx/Ljh07TCvKpEmTpEmTJmnax8svv2wCTqtWrczVSQcOHJBvv/3WBBi9v5C+B64OQQYAgAAqV64s69evN/PGPPHEE1KnTh0TSJYsWSJTpkxJ0z70jt9r1qwx+3jwwQelSpUqppVGv/7444/mPXB1opwsPgrp1KlTUqhQITOKvGDBguEuDiIRVy25uGoJwXb+/HnZs2ePVKpUSXLnzh3u4sCi4yOt529aZAAAgLUIMgAAwFoEGQAAYC2CDAAAsBZBBgAAWIsgAwAArEWQAQAA1iLIAAAAaxFkAACAtbj79TXIxtlb07Pv2GJp3zj2joyVBwAiyZIlS+Thhx+WLVu2SPbs2cNdHLlw4YJUr15d/vOf/8hNN90U0vciyAAAIvvWIMGQgduL9OnTx9zlesGCBUme27Rpkzz33HPmPko6lb7eGLJx48byxhtvSMmSJWXv3r1m2v1AVq9eLbfccovMmDFD+vbtm+T5XLlyman71dGjR2XkyJGycOFC+f3336VIkSJSv359s+62225zXzN8+HB59tlnfUKM3mF77NixMmvWLNm3b58UKFDA3PMpLi5OateuLaGUM2dOGTZsmDz11FMmZIUSQQYAgHTQcNGiRQv529/+Jl999ZUULlzYBJdPP/1Uzp4967Pt4sWLk4QGvZGkh95DaPv27T7PR0VFud936dLFtG7MnDnT3GBSw4wGg2PHjrnbfPfdd7Jr1y6zrUdiYqK0bNlS9u/fL6+99poJWfraMWPGmO+1XBqmMkrLpGElJT179jQ32/z5559DGpwIMgAApMP3339vbmT473//W6Kj/3sa1dYXbe3wp6FFW2uSo6Eluee1NWjlypWyfPlyueOO//aDV6hQQRo1auSz3ezZs81dub1vujhx4kTT8rNhwwbTguN57ccff2yCTL9+/Uw3lL5/bGysNGjQwLzGo1OnTiagaauRqlixonnNjh07TAtV586d5e2335ahQ4eaff75559SqlQpGThwoIwYMcK8RluPtNVIy/fCCy9IqDDYFwCAdNDgcenSJZk/f744jhOy98mfP79ZNDhoC0tyVq5cmWQcyocffmjCjSfEeGTLlk0ef/xx+eWXX0z3WHq8+uqrZn8ajrRbbdKkSaYV6qOPPjKtSh988IEJPN40dGn5QokgAwBAOmiXzNNPPy09evSQ4sWLS7t27eSVV14xXTf+br31VjeQeBZv2rLj/7zuT2lrj7aIaLeSto5o64a+b3x8vM8+9u3bJ2XKlPFZ9+uvv8r1118fsPye9bpNetx5552mq6hKlSpm0W6ratWqSdOmTU1rj37t3r27z2u0XFq+UCLIAACQTi+99JIcPnxYpk6dasZ/6NeaNWvK5s2bfbabM2eObNy40WfxpgNw/Z/XLisPHfdy6NAh0/LRtm1b08104403ul0+nkG93t1KHsFuLfJv9dHB0FreGjVqyKOPPipff/11ktfkyZNHzp07J6FEkAEAIAN0/Ms999xjuly2bt1qWh/0e2/lypWTqlWr+iz+XT3+z1933XU+22hI0W4i7c5ZtWqVCRCjRo1yny9evLgZo+JNL33WMgXiWa/beMrgH3ouXryY5HX58uXzeayBas+ePWb8i4ape++9V/7+97/7bHP8+HEpUaKEhBJBBgCAq6RX8Gh3i/9VS6FQq1Ytn/e54YYbzJgXb926dTNXJvmPg7ly5Yr885//NPvwjJ/RoJGQkOBuc/nyZTMQOC30qquuXbvKv/71L9P6pAN/Nbx46H60fKHEVUsAACRDx7D4dwdp95Fedq1hQVs1tDXjs88+ky+++EKmT5/us61eJq1dUN50vIunK0hf6/+80rlotJVFW3weeOABqVevnumGWrdunYwfP146duzobtumTRszjsabDuj95JNPpEOHDj6XX7/88sumRUZDjucybx37olcf6Vw1GsYmTJhgrphKjW4XExNjgoq26sydO9cMhNafz0MH+obyiiVFkAEAIBk6JsW/RUEvs9YuIB34euDAATOBnQ561bEt999/v8+2OpeLP52gTkOQ0sn0NAz40xYSvXxZA4i2oOg8Mdrdo11V/fv3N4N+vedrGT58uLlySMerKA1KS5cuNcFFt/WeEE8n8atTp477eg1K2nLTq1cvM8BYQ1CgS8n96f40VOkl2ToR380332zCnIYapZd/axD0724KtignlNeOpUIn5pk3b55s27bNDAjS0d3jxo1zfxFKZzfUg0WvQ9fLzzR5vvXWW+Z69bTQg6RQoUKmMrUJDNyi4KpuUZCB2UFtYuOxgcimn+E6jkLnWQk0IBXB8eSTT5rz3bRp0yRSaJeTdl95h670HB9pPX+HdYzMihUrZPDgwSYdfvPNNyZttm7d2qfvT5OhNtlpk5Vur6O3dSIeAADwX88884y5BFrHwEQCnfm3bt265hweamHtWlq0aJHPY72cTPsFf/rpJ7n99ttNCnvnnXfMxD7ah6e0/1GvgdfwczXTKwMAkFUULlw4xZaPcAx+1ns/ZYaIumpJg4sqWrSo+aqBRltpvPsY9Tr98uXLm743AABwbYuYwb7aHPbYY4+ZmQs9g5B0JLemOu8R0ErHxwQa5a10HI33VM7axwYAALKmiGmR0bEyer25Duq92gHEOjjIs+gIbwBAeIXxuhJk8eMiIoLMww8/LJ9//rksW7ZMypYt667X69F1wJD/9ex6LXxydwvVu25qF5Vn0UvjAADhkSNHDvM11NPUw06e48JznFjXtaRJ7JFHHjF3ENVr9fXyK28NGzY0P9ySJUvM/SaUXievN6pq0qRJwH3q9fy6AADCT+cX0eEBR44cMY/z5s3rTsSGa5fjOCbE6HGhx4ceJ1YGGe1O0iuSdPZBnVjHM+5Fu4R0Xhn92q9fPzPjoA4A1uvINfhoiOGKJQCwg6cF3RNmAA8NMcn1sFgRZKZMmWK+xsbG+qzXS6z1plhKZzTUWQK1RcZ7QjwAgB20BUZnr9XpNQLdjBDXphw5clxVS0zEdC2lRmf6mzx5slkAAPbSk1YwTlxAxA32BQAAyAiCDAAAsBZBBgAAWIsgAwAArEWQAQAA1iLIAAAAaxFkAACAtQgyAADAWgQZAABgLYIMAACwVlhvUYBrXHxcmjeNLRbSkgAALEWLDAAAsBZBBgAAWIsgAwAArEWQAQAA1iLIAAAAaxFkAACAtQgyAADAWgQZAABgLYIMAACwFkEGAABYiyADAACsRZABAADWIsgAAABrEWQAAIC1CDIAAMBa0eEuALKOuLj0bR9bLFQlAQBcK2iRAQAA1iLIAAAAaxFkAACAtQgyAADAWgQZAABgLYIMAACwFkEGAABYiyADAACsRZABAADWIsgAAABrEWQAAIC1CDIAAMBaBBkAAGAtggwAALAWQQYAAFgrOtwFALKquLhwlwAAsj5aZAAAgLUIMgAAwFoEGQAAYC2CDAAAsBZBBgAAWIsgAwAArEWQAQAA1iLIAAAAaxFkAACAtQgyAADAWgQZAABgLYIMAACwFkEGAABYiyADAACsRZABAADWig53AYBwWr4indvPC1VJAAAZQYsMAACwFkEGAABYiyADAACsRZABAADWIsgAAABrEWQAAIC1CDIAAMBaBBkAAGAtggwAALAWQQYAAFgrrEHm22+/lQ4dOkiZMmUkKipKFixY4PN8nz59zHrvpW3btmErLwAAiCxhDTJnz56V+vXry+TJk5PdRoNLQkKCu8yaNStTywgAACJXWG8a2a5dO7OkJFeuXFK6dOlMKxMAALBHxI+RWb58uZQsWVJq1KghgwYNkmPHjoW7SAAAIEKEtUUmNdqt1LlzZ6lUqZLs2rVLnn76adOCs3r1asmePXvA1yQmJprF49SpU5lYYgAAkJkiOsh069bN/b5u3bpSr149qVKlimmladGiRcDXjBkzRkaPHp2JpQSQmrg4O/cNIPJFfNeSt8qVK0vx4sVl586dyW4zYsQIOXnypLscOHAgU8sIAAAyT0S3yPg7ePCgGSMTExOT4uBgXQAAQNYX1iBz5swZn9aVPXv2yMaNG6Vo0aJm0S6iLl26mKuWdIzM8OHDpWrVqtKmTZtwFhsAAESIsAaZdevWSfPmzd3HQ4cONV979+4tU6ZMkfj4eJk5c6acOHHCTJrXunVreeGFF2hxAQAA4Q8ysbGx4jhOss9/9dVXmVoeAABgF6sG+wIAAHgjyAAAAGsRZAAAgLUIMgAAwFoEGQAAYC2CDAAAsBZBBgAAWIsgAwAArEWQAQAA1iLIAAAAa1l192tkvthicWnedvmxtG9rK+oDACILLTIAAMBaBBkAAGAtggwAALAWQQYAAFiLIAMAAK6tILN79+7glwQAACAzgkzVqlWlefPm8v7778v58+czsgsAAIDwBJn169dLvXr1ZOjQoVK6dGl58MEHZe3atVdfGgAAgFAHmQYNGsjrr78uhw4dknfffVcSEhKkadOmUqdOHZkwYYIcPXo0I7sFAADIvMG+0dHR0rlzZ5k7d66MGzdOdu7cKcOGDZNy5cpJr169TMABAACIyCCzbt06eeihhyQmJsa0xGiI2bVrl3zzzTemtaZjx47BKykAAEAw7rWkoWX69Omyfft2ueuuu+S9994zX7Nl+28uqlSpksyYMUMqVqyYkd0DAACELshMmTJFHnjgAenTp49pjQmkZMmS8s4772Rk9wAAAKELMjt27Eh1m5w5c0rv3r0zsnsAAIDQjZHRbiUd4OtP182cOTMjuwQAAMicFpkxY8bItGnTAnYnDRgwgJaYzBYfl84XpHd7AACyUIvM/v37zYBefxUqVDDPAQAARGyQ0ZaX+Pj4JOs3bdokxYoVC0a5AAAAQhNkunfvLo8++qgsW7ZMLl++bJalS5fKkCFDpFu3bhnZJQAAQOaMkXnhhRdk79690qJFCzO7r7py5YqZzffll1/OyC4BAAAyJ8jopdVz5swxgUa7k/LkySN169Y1Y2QAAAAiOsh4VK9e3SwAAADWBBkdE6O3IFiyZIkcOXLEdCt50/EyAAAAERlkdFCvBpn27dtLnTp1JCoqKvglAwAACEWQmT17tnz00UfmRpEAAABWXX6tg32rVq0a/NIAAACEOsg88cQT8vrrr4vjOBl5OQAAQPi6lr777jszGd6XX34ptWvXlhw5cvg8P2/evOCUDgAAINhBpnDhwnL33Xdn5KUAAADhDTLTp08PXgkAAAAyc4yMunTpkixevFimTZsmp0+fNusOHTokZ86cyeguAQAAQt8is2/fPmnbtq3s379fEhMTpVWrVlKgQAEZN26ceTx16tSM7BZe4uLSvm0sNxyPSLHF0vFLFJHlx9K3PQAggy0yOiHeTTfdJH/++ae5z5KHjpvR2X4BAAAitkVm5cqVsmrVKjOfjLeKFSvKb7/9FqyyAQAABL9FRu+tpPdb8nfw4EHTxQQAABCxQaZ169YyceJE97Hea0kH+Y4aNYrbFgAAgMjuWnrttdekTZs2UqtWLTl//rz06NFDduzYIcWLF5dZs2YFv5QAAADBCjJly5aVTZs2mZtHxsfHm9aYfv36Sc+ePX0G/wIAAERckDEvjI6W++67L7ilAQAACHWQee+991J8vlevXhnZLQAAQOiDjM4j4+3ixYty7tw5czl23rx5CTIAACByr1rSifC8Fx0js337dmnatCmDfQEAQOTfa8lftWrVZOzYsUlaawAAACI+yHgGAOuNIwEAACJ2jMynn37q89hxHElISJA333xTbrvttmCVDQAAIPhBplOnTj6PdWbfEiVKyJ133mkmywMAAIjYIKP3WgIAAMhSY2QAAAAivkVm6NChad52woQJGXkLAACA0ASZDRs2mEUnwqtRo4ZZ9+uvv0r27Nnlxhtv9Bk7AwAAEFFBpkOHDlKgQAGZOXOmFClSxKzTifH69u0rzZo1kyeeeCLY5QQAAAjOGBm9MmnMmDFuiFH6/YsvvshVSwAAILKDzKlTp+To0aNJ1uu606dPB6NcAAAAoQkyd999t+lGmjdvnhw8eNAsH3/8sfTr1086d+6ckV0CAABkzhiZqVOnyrBhw6RHjx5mwK/ZUXS0CTKvvPJKRnYJAACQOUEmb9688tZbb5nQsmvXLrOuSpUqki9fvozsDgAAIPMnxNP7K+mid77WEKP3XAIAAIjoIHPs2DFp0aKFVK9eXe666y4TZpR2LXHpNQAAiOgg8/jjj0uOHDlk//79ppvJo2vXrrJo0aI07+fbb781c9KUKVPGTJ63YMECn+e1hWfkyJESExMjefLkkZYtW8qOHTsyUmQAAJAFZSjIfP311zJu3DgpW7asz3rtYtq3b1+a93P27FmpX7++TJ48OeDz48ePl0mTJpnBxT/88IPpvmrTpo2cP38+I8UGAABZTIYG+2oA8W6J8Th+/LjkypUrzftp166dWQLR1piJEyfKs88+Kx07djTr3nvvPSlVqpRpuenWrVtGig4AAK71Fhm9DYGGCg/tFrpy5YppQWnevHlQCrZnzx45fPiw6U7yKFSokDRu3FhWr14dlPcAAADXYIuMBhYd7Ltu3Tq5cOGCDB8+XH7++WfTIvP9998HpWAaYpS2wHjTx57nAklMTDSL9yzEAAAga8pQkKlTp4652/Wbb75pbh555swZM6Pv4MGDzcDccNJ7QI0ePTpz3iw+Ln3b10vn9iESWywyyoGM/16WH+N3CAAZCjI6k2/btm3NANxnnnkmZLVYunRp8/X333/3CUf6uEGDBsm+bsSIETJ06FCfFply5cqFrJwAAMCiMTJ62XV8fLyEWqVKlUyYWbJkiU8o0auXmjRpkuzrdLBxwYIFfRYAAJA1ZWiw73333SfvvPPOVb+5dklt3LjRLJ4Bvvq9zk+jA4gfe+wxefHFF+XTTz+VzZs3S69evcycM506dbrq9wYAANfoGJlLly7Ju+++K4sXL5aGDRsmucfShAkT0rQfHSzsfZWTp0uod+/eMmPGDDOIWC/1HjBggJw4cUKaNm1qJtzLnTt3RooNAACu5SCze/duqVixomzZskVuvPFGs04H/XrTlpS0io2NTfH+TLqv559/3iwAAABXFWR05l69r9KyZcvcWxLozLv+l0gDAABE3BgZ/9aTL7/80nT9AAAAWDPY1yOlbiEAAICICjI6ZsV/DEx6xsQAAACEbYyMtsD06dPHvTGk3oV64MCBSa5amjdvXlALCQAAcNVBRi+L9p9PBgAAwIogM3369NCVBAAAIDMH+wIAAIQTQQYAAFiLIAMAAKxFkAEAANYiyAAAAGsRZAAAgLUIMgAAwFoEGQAAYC2CDAAAsBZBBgAAWIsgAwAArEWQAQAA1iLIAAAAaxFkAACAtQgyAADAWgQZAABgLYIMAACwFkEGAABYiyADAACsFR3uAiCw2GJxYhsbywwkJ87Sw9nWcgMZRYsMAACwFkEGAABYiyADAACsRZABAADWIsgAAABrEWQAAIC1CDIAAMBaBBkAAGAtggwAALAWQQYAAFiLIAMAAKxFkAEAANYiyAAAAGsRZAAAgLUIMgAAwFrR4S4AAFyNuLhwlwBAONEiAwAArEWQAQAA1iLIAAAAaxFkAACAtQgyAADAWgQZAABgLYIMAACwFkEGAABYiyADAACsRZABAADWIsgAAABrEWQAAIC1CDIAAMBaBBkAAGAtggwAALBWdLgLYLPlK9L5ghVxISoJAADXJlpkAACAtQgyAADAWgQZAABgLYIMAACwFkEGAABYiyADAACsRZABAADWIsgAAABrEWQAAIC1CDIAAMBaER1k4uLiJCoqymepWbNmuIsFAAAiRMTfa6l27dqyePFi93F0dMQXGQAAZJKITwUaXEqXLh3uYgAAgAgU0V1LaseOHVKmTBmpXLmy9OzZU/bv3x/uIgEAgAgR0S0yjRs3lhkzZkiNGjUkISFBRo8eLc2aNZMtW7ZIgQIFAr4mMTHRLB6nTp3KxBIDAIDMFNFBpl27du739erVM8GmQoUK8tFHH0m/fv0CvmbMmDEm8ABZWWyxuJDte/mx0O0bAK65riVvhQsXlurVq8vOnTuT3WbEiBFy8uRJdzlw4ECmlhEAAGQeq4LMmTNnZNeuXRITE5PsNrly5ZKCBQv6LAAAIGuK6CAzbNgwWbFihezdu1dWrVold999t2TPnl26d+8e7qIBAIAIENFjZA4ePGhCy7Fjx6REiRLStGlTWbNmjfkeAAAgooPM7Nmzw10EAAAQwSK6awkAACAlBBkAAGAtggwAALAWQQYAAFiLIAMAAKxFkAEAANYiyAAAAGsRZAAAgLUIMgAAwFoEGQAAYK2IvkUBACAyxMXZuW9kfbTIAAAAaxFkAACAtQgyAADAWgQZAABgLYIMAACwFkEGAABYiyADAACsRZABAADWIsgAAABrEWQAAIC1CDIAAMBaBBkAAGAtggwAALAWQQYAAFiLIAMAAKwVHe4CAIgsscXi0rzt8mNp3xaZI45fSabUBfUcOWiRAQAA1iLIAAAAaxFkAACAtQgyAADAWgQZAABgLYIMAACwFkEGAABYiyADAACsRZABAADWIsgAAABrEWQAAIC1CDIAAMBaBBkAAGAtggwAALAWQQYAAFiLIAMAAKxFkAEAANYiyAAAAGsRZAAAgLUIMgAAwFoEGQAAYC2CDAAAsBZBBgAAWIsgAwAArEWQAQAA1iLIAAAAaxFkAACAtQgyAADAWgQZAABgLYIMAACwFkEGAABYKzrcBQCAQGKLxaV52+XH0r4tIk8cvz6r6zkuzL8/WmQAAIC1CDIAAMBaBBkAAGAtggwAALAWQQYAAFiLIAMAAKxFkAEAANYiyAAAAGsRZAAAgLUIMgAAwFpWBJnJkydLxYoVJXfu3NK4cWNZu3ZtuIsEAAAiQMQHmTlz5sjQoUNl1KhRsn79eqlfv760adNGjhw5Eu6iAQCAMIv4IDNhwgTp37+/9O3bV2rVqiVTp06VvHnzyrvvvhvuogEAgDCL6CBz4cIF+emnn6Rly5buumzZspnHq1evDmvZAABA+EVLBPvjjz/k8uXLUqpUKZ/1+njbtm0BX5OYmGgWj5MnT5qvp06dCnr5zv71/94HuBYlJgb//1VG/n+FshxAICE4pYRcYqJddeE5bzuOY2+QyYgxY8bI6NGjk6wvV65cWMoDZG1jJTJESjlwrRjLIZdpdXH69GkpVKiQnUGmePHikj17dvn999991uvj0qVLB3zNiBEjzOBgjytXrsjx48elWLFiEhUVFdSkqOHowIEDUrBgwaDtF/8PdRx61HHoUcehRx1nzTrWlhgNMWXKlElxu4gOMjlz5pSGDRvKkiVLpFOnTm4w0ccPP/xwwNfkypXLLN4KFy4csjLqL5T/OKFFHYcedRx61HHoUcdZr45TaomxIsgobV3p3bu33HTTTdKoUSOZOHGinD171lzFBAAArm0RH2S6du0qR48elZEjR8rhw4elQYMGsmjRoiQDgAEAwLUn4oOM0m6k5LqSwkW7r3SSPv9uLAQPdRx61HHoUcehRx1f23Uc5aR2XRMAAECEiugJ8QAAAFJCkAEAANYiyAAAAGsRZAAAgLUIMhk0efJkqVixouTOnVsaN24sa9euDXeRrBUXF2dmXfZeatas6T5//vx5GTx4sJmdOX/+/NKlS5cksz3D17fffisdOnQwM2JqfS5YsMDneR3jr1MaxMTESJ48ecyNWHfs2OGzjc6I3bNnTzP5lU4q2a9fPzlz5kwm/yT21nGfPn2SHNdt27b12YY6Tvl2MzfffLMUKFBASpYsaSZF3b59u882afls2L9/v7Rv317y5s1r9vPkk0/KpUuXMvmnsbeOY2NjkxzHAwcOjKg6JshkwJw5c8xEfXop2vr166V+/frSpk0bOXLkSLiLZq3atWtLQkKCu3z33Xfuc48//rh89tlnMnfuXFmxYoUcOnRIOnfuHNbyRjqdNFKPSw3cgYwfP14mTZokU6dOlR9++EHy5ctnjmE9MXjoCfbnn3+Wb775Rj7//HNz4h4wYEAm/hR217HS4OJ9XM+aNcvneeo4efp/XUPKmjVrTP1cvHhRWrdubeo9rZ8NetNhPcFeuHBBVq1aJTNnzpQZM2aYEA9JUx2r/v37+xzH+vkRUXWsl18jfRo1auQMHjzYfXz58mWnTJkyzpgxY8JaLluNGjXKqV+/fsDnTpw44eTIkcOZO3euu27r1q06ZYCzevXqTCylvbSu5s+f7z6+cuWKU7p0aeeVV17xqedcuXI5s2bNMo9/+eUX87off/zR3ebLL790oqKinN9++y2TfwL76lj17t3b6dixY7KvoY7T58iRI6a+VqxYkebPhi+++MLJli2bc/jwYXebKVOmOAULFnQSExPD8FPYVcfqjjvucIYMGeIkJxLqmBaZdNLU+dNPP5mmeI9s2bKZx6tXrw5r2Wym3RraRF+5cmXzV6o2VSqta/0rwbu+tdupfPny1HcG7dmzx8yS7V2nej8T7SL11Kl+1a4OvTWIh26vx7q24CBtli9fbpraa9SoIYMGDZJjx465z1HH6XPy5EnztWjRomn+bNCvdevW9ZkJXlse9QaI2hKGlOvY44MPPjA3ca5Tp465MfO5c+fc5yKhjq2Y2TeS/PHHH6Ypzf8WCfp427ZtYSuXzfQEqk2R+mGvzZajR4+WZs2ayZYtW8wJV28e6n/jT61vfQ7p56m3QMew5zn9qidgb9HR0eYDjnpPG+1W0m6OSpUqya5du+Tpp5+Wdu3amQ/+7NmzU8fpoDcLfuyxx+S2224zJ1OVls8G/RroOPc8h5TrWPXo0UMqVKhg/tCMj4+Xp556yoyjmTdvXsTUMUEGYacf7h716tUzwUb/43z00UdmICpgo27durnf61+semxXqVLFtNK0aNEirGWzjY7j0D9svMfOIXPqeIDXmC09jvUCAT1+NZzr8RwJ6FpKJ21e07+m/EfG6+PSpUuHrVxZif6FVb16ddm5c6epU+3OO3HihM821HfGeeotpWNYv/oPXterEPQqG+o9Y7TbVD8/9LhW1HHa6H32dCD0smXLpGzZsu76tHw26NdAx7nnOaRcx4HoH5rK+zgOdx0TZNJJmzIbNmwoS5Ys8WmS08dNmjQJa9myCr38VNO+Jn+t6xw5cvjUtzZr6hga6jtjtKtDP2C861T7s3VchqdO9aueIHQcgsfSpUvNse75IEP6HDx40IyR0eNaUccp0zHUeoKdP3++qRc9br2l5bNBv27evNknMOrVOXq5e61ateRa56RSx4Fs3LjRfPU+jsNex5kypDiLmT17trnCY8aMGebKgwEDBjiFCxf2GbWNtHviiSec5cuXO3v27HG+//57p2XLlk7x4sXNCHo1cOBAp3z58s7SpUuddevWOU2aNDELknf69Glnw4YNZtH/5hMmTDDf79u3zzw/duxYc8x+8sknTnx8vLm6plKlSs5ff/3l7qNt27bODTfc4Pzwww/Od99951SrVs3p3r17GH8qe+pYnxs2bJi5ekaP68WLFzs33nijqcPz58+7+6COkzdo0CCnUKFC5rMhISHBXc6dO+duk9pnw6VLl5w6deo4rVu3djZu3OgsWrTIKVGihDNixIgw/VR21fHOnTud559/3tStHsf6eVG5cmXn9ttvj6g6Jshk0BtvvGH+A+XMmdNcjr1mzZpwF8laXbt2dWJiYkxdXnfddeax/gfy0JPrQw895BQpUsTJmzevc/fdd5v/bEjesmXLzMnVf9FLgj2XYD/33HNOqVKlTChv0aKFs337dp99HDt2zJxU8+fPby6l7Nu3rzlBI/U61hOBfrDrB7peIlyhQgWnf//+Sf7YoY6TF6hudZk+fXq6Phv27t3rtGvXzsmTJ4/5A0n/cLp48WIYfiL76nj//v0mtBQtWtR8TlStWtV58sknnZMnT0ZUHUf9/z8MAACAdRgjAwAArEWQAQAA1iLIAAAAaxFkAACAtQgyAADAWgQZAABgLYIMAACwFkEGQNDt3btXoqKi3OnMQ6FPnz7SqVOnkO0fgB0IMgCSBAQNIf5L27Zt07yPcuXKSUJCgtSpU0cind78rm/fvuZmebly5TL3m+nevbusW7cuKPuPi4uTBg0aBGVfAJKKDrAOwDVOQ8v06dN91ulJPq30DvE23F1Yw0qLFi1M4Jo2bZrUrFlTTp8+LZ988ok88cQTsmLFinAXEUAqaJEBkISGFg0i3kuRIkXc57WFZsqUKdKuXTvJkyePVK5cWf7zn/8k27X0559/Ss+ePaVEiRJm+2rVqvkEJb177p133mmeK1asmAwYMMDcBd3j8uXLMnToUClcuLB5fvjw4ebOvd70rtFjxowxLSq6n/r16/uUyZ++XluftCwrV66U9u3bS5UqVUzryahRo0yYSWv5li9fLo0aNZJ8+fKZMt52222yb98+mTFjhowePVo2bdrktmzpOgDBQ5ABkCHPPfecdOnSxZykNaR069ZNtm7dmuy2v/zyi3z55ZdmGw1BxYsXN8+dPXtW2rRpY4LSjz/+KHPnzpXFixfLww8/7L7+tddeMwHg3Xffle+++06OHz8u8+fP93kPDTHvvfeeTJ06VX7++Wd5/PHH5b777ku2VUVDlm6nLS/ZsiX9KNRAkpbyXbp0yYzVueOOOyQ+Pl5Wr15tgo6Glq5du5r9165d23S16aLrAARRpt2eEoAV9O7N2bNnd/Lly+ezvPTSS+42+tExcOBAn9c1btzYGTRokPl+z549ZpsNGzaYxx06dDB3dg7k7bffNncvPnPmjLtu4cKFTrZs2dy7Revd0cePH+8+r3fWLVu2rNOxY0fz+Pz58+bux6tWrfLZd79+/czdpQOZM2eOKeP69etTrI/Uyqd3sNb9LF++PODrR40a5dSvXz/F9wCQcYyRAZBE8+bNTauJt6JFi/o8btKkSZLHyV2lNGjQINN6s379emndurVpwbj11lvNc9pCo91A2i3joV0z2lW0fft2yZ07t2nJaNy4sft8dHS03HTTTW73kg7YPXfunLRq1crnfS9cuCA33HBDwDL5d00lJ7Xy3X777aaLSltt9P1btmwp9957r8TExKRp/wCuDl1LAJLQk3bVqlV9Fv8gkx46lkbHjGh3z6FDh8wA22HDhgWtvJ7xKgsXLjRhyrNod1Zy42SqV69uvm7btu2q31/H+2iXkoazOXPmmH2vWbPmqvcLIHUEGQAZ4n+i1sfXX399stvrQN/evXvL+++/LxMnTpS3337brNfX6DgbHYvi8f3335txKzVq1JBChQqZ1o0ffvjBfV7Hpfz000/u41q1apkByvv3708SwPRS8EB0UK++TsffaOuKvxMnTqSpfB7a8jNixAhZtWqVuQrqww8/NOtz5sxpBisDCA2CDIAkEhMT5fDhwz7LH3/84bONDnrVwbe//vqrucpn7dq1PgN0vY0cOdJcBaRdQDrA9vPPP3dDjw4U1u4jDTlbtmyRZcuWySOPPCL333+/lCpVymwzZMgQGTt2rCxYsMC0oDz00ENu0FAFChQwLTza4jNz5kzZtWuX6cZ64403zONAdDCutqRo+Zs1ayZffPGF7N692wzYfemll6Rjx45pKt+ePXtMgNEWGW11+vrrr2XHjh3uz1exYkWzjbYQaR1q3QIIoqsYXwMgiw721Y8G/6VGjRruNvp48uTJTqtWrZxcuXI5FStWNINnPfwH+77wwgvO9ddf7+TJk8cpWrSoGaS7e/dud/v4+HinefPmTu7cuc3z/fv3d06fPu0zuHfIkCFOwYIFncKFCztDhw51evXq5Q72VVeuXHEmTpxoypkjRw6nRIkSTps2bZwVK1ak+PNu377d7KtMmTJOzpw5nQoVKpgBwt6DgFMqnw747dSpkxmQ7Hn9yJEjncuXL7sDkbt06WLKrXUyffr0q/wNAfAWpf8EMxgByPq0NUMvf+YWAQDCja4lAABgLYIMAACwFvPIAEg3eqQBRApaZAAAgLUIMgAAwFoEGQAAYC2CDAAAsBZBBgAAWIsgAwAArEWQAQAA1iLIAAAAaxFkAACA2Or/A9uKqniiynsNAAAAAElFTkSuQmCC",
      "text/plain": [
       "<Figure size 640x480 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "plt.figure()\n",
    "plt.hist(cost_curve, bins=20, alpha=0.5, label='CPO', color='blue')\n",
    "# axes[1, 1].hist(act_cost_curve, bins=20, alpha=0.5, label='ActSafe', color='green')\n",
    "plt.hist(fqi_cost_curve, bins=20, alpha=0.5, label='LSEES(Ours)', color='orange')\n",
    "plt.title('Cost Comparsion Histogram', fontsize=12, fontweight='bold')\n",
    "plt.xlabel('Episode Cost')\n",
    "plt.ylabel('Frequency')\n",
    "plt.legend()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "id": "2f201285",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "C:\\Users\\17913\\AppData\\Local\\Temp\\ipykernel_1488\\37808932.py:49: UserWarning: Glyph 25104 (\\N{CJK UNIFIED IDEOGRAPH-6210}) missing from font(s) DejaVu Sans.\n",
      "  plt.tight_layout()\n",
      "C:\\Users\\17913\\AppData\\Local\\Temp\\ipykernel_1488\\37808932.py:49: UserWarning: Glyph 26412 (\\N{CJK UNIFIED IDEOGRAPH-672C}) missing from font(s) DejaVu Sans.\n",
      "  plt.tight_layout()\n",
      "C:\\Users\\17913\\AppData\\Local\\Temp\\ipykernel_1488\\37808932.py:49: UserWarning: Glyph 20998 (\\N{CJK UNIFIED IDEOGRAPH-5206}) missing from font(s) DejaVu Sans.\n",
      "  plt.tight_layout()\n",
      "C:\\Users\\17913\\AppData\\Local\\Temp\\ipykernel_1488\\37808932.py:49: UserWarning: Glyph 24067 (\\N{CJK UNIFIED IDEOGRAPH-5E03}) missing from font(s) DejaVu Sans.\n",
      "  plt.tight_layout()\n",
      "C:\\Users\\17913\\AppData\\Local\\Temp\\ipykernel_1488\\37808932.py:49: UserWarning: Glyph 30452 (\\N{CJK UNIFIED IDEOGRAPH-76F4}) missing from font(s) DejaVu Sans.\n",
      "  plt.tight_layout()\n",
      "C:\\Users\\17913\\AppData\\Local\\Temp\\ipykernel_1488\\37808932.py:49: UserWarning: Glyph 26041 (\\N{CJK UNIFIED IDEOGRAPH-65B9}) missing from font(s) DejaVu Sans.\n",
      "  plt.tight_layout()\n",
      "C:\\Users\\17913\\AppData\\Local\\Temp\\ipykernel_1488\\37808932.py:49: UserWarning: Glyph 22270 (\\N{CJK UNIFIED IDEOGRAPH-56FE}) missing from font(s) DejaVu Sans.\n",
      "  plt.tight_layout()\n",
      "e:\\Anacondda\\envs\\py310\\lib\\site-packages\\IPython\\core\\pylabtools.py:170: UserWarning: Glyph 25104 (\\N{CJK UNIFIED IDEOGRAPH-6210}) missing from font(s) DejaVu Sans.\n",
      "  fig.canvas.print_figure(bytes_io, **kw)\n",
      "e:\\Anacondda\\envs\\py310\\lib\\site-packages\\IPython\\core\\pylabtools.py:170: UserWarning: Glyph 26412 (\\N{CJK UNIFIED IDEOGRAPH-672C}) missing from font(s) DejaVu Sans.\n",
      "  fig.canvas.print_figure(bytes_io, **kw)\n",
      "e:\\Anacondda\\envs\\py310\\lib\\site-packages\\IPython\\core\\pylabtools.py:170: UserWarning: Glyph 20998 (\\N{CJK UNIFIED IDEOGRAPH-5206}) missing from font(s) DejaVu Sans.\n",
      "  fig.canvas.print_figure(bytes_io, **kw)\n",
      "e:\\Anacondda\\envs\\py310\\lib\\site-packages\\IPython\\core\\pylabtools.py:170: UserWarning: Glyph 24067 (\\N{CJK UNIFIED IDEOGRAPH-5E03}) missing from font(s) DejaVu Sans.\n",
      "  fig.canvas.print_figure(bytes_io, **kw)\n",
      "e:\\Anacondda\\envs\\py310\\lib\\site-packages\\IPython\\core\\pylabtools.py:170: UserWarning: Glyph 30452 (\\N{CJK UNIFIED IDEOGRAPH-76F4}) missing from font(s) DejaVu Sans.\n",
      "  fig.canvas.print_figure(bytes_io, **kw)\n",
      "e:\\Anacondda\\envs\\py310\\lib\\site-packages\\IPython\\core\\pylabtools.py:170: UserWarning: Glyph 26041 (\\N{CJK UNIFIED IDEOGRAPH-65B9}) missing from font(s) DejaVu Sans.\n",
      "  fig.canvas.print_figure(bytes_io, **kw)\n",
      "e:\\Anacondda\\envs\\py310\\lib\\site-packages\\IPython\\core\\pylabtools.py:170: UserWarning: Glyph 22270 (\\N{CJK UNIFIED IDEOGRAPH-56FE}) missing from font(s) DejaVu Sans.\n",
      "  fig.canvas.print_figure(bytes_io, **kw)\n"
     ]
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAABdIAAAPZCAYAAAAV4dheAAAAOnRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjEwLjUsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcvWftoOwAAAAlwSFlzAAAPYQAAD2EBqD+naQAAtR1JREFUeJzs3Qm8XOP5B/D3Zk9kKxJJCLHUVktqX4tWpahSXRQlVP8tVUXaIrZYWkFLtRV0UXRRqkUVpYpQRdVW2qL22CIJlVXWO//Pc9K55t7ce5KbO7kzc+/3+/kcmX3eOXPueOc3z3lOXaFQKCQAAAAAAKBZXZq/GAAAAAAACIJ0AAAAAADIIUgHAAAAAIAcgnQAAAAAAMghSAcAAAAAgByCdAAAAAAAyCFIBwAAAACAHIJ0AAAAAADIIUgHAAAAAIAc3fKuBABqz/PPP58WLFiwTLddc801U58+fdK0adOyZVkMGDAgDR06NHuOeK5lteGGG2b/Tpo0Kc2ZM2eZ7hPPE883ffr09MYbbyzTfeL1xOsKTz/99DKPb911103du3fPnieeb1msuuqq2dJaH/7wh9Pdd9+dnT7xxBPTueee2+Jt77jjjvS73/0u3X///en111/PxtarV680fPjwtOWWW6a999477bffftllHUFdXd0S5+N96d27d1p55ZXTWmutlUaOHJkOOOCAtN1227X4OLvuumu65557Gs6/+OKLacSIEanaTJw4Me22224N50ePHp2uvPLKhvOHHXZYuuqqqxrOx3YTr63WXkc1O+OMM9KZZ5651LG/9NJLae211250WaFQaPH6XXbZJVsvdGzxOfS3v/0tOx3b0emnn17pIQEAK0oBAOhQ1lprrUh2lmm5++67s/uMGzdume8zevTo7D4vvvjiMt+ndMqxyy67LPN9rrjiiuw+8e+y3icev6g144vXE+L1Let9Yr211nXXXddw/759+xamTp3a7O2eeuqpwlZbbbVM4zj++OMLldR0Wyh9D1qrNe/ZdtttV3j22WebfZym21nx/W2Lpn8nxe2zLeJvsLm/r6Km22Pxb7a9LOtrXtrrqGZNX2NLY2/uM29F/R3kfaZTXW699daG96ZPnz6FSZMmVXpIAMAKoiIdADqgK664IqtkzdOtW+NpwLJUT37xi19MCxcubHTZ0ip977vvvrTzzjs3umzcuHFZFWie9dZbr9H5qESOis883/rWt9Kf//znRpctrYL31Vdfzaq7Sy1LNe3uu++eWivW3Te/+c2G81/60pearWiP6saPfOQjafbs2Y0uX2eddbLK/vr6+mxvgGeffTa7PM53VHvuuWdWjR6V+E888USaOnVqw3UPPvhg2mKLLdKf/vSnJarTY3suXbcrrbRSqkaDBg1Kn/rUpxrOb7311qkWdZTX0RaxjZWugw984AMVHQ/t9xn1wQ9+MD322GPZ3lZjx45Nv/zlLys9LABgBRCkAwC0k9/+9reNfgw4/PDDl7jN22+/nfbZZ59GIfrqq6+efv7zn2ctYZr+iHHRRRdlrU86qksuuaThh5ooWP/973+fjjrqqDR58uTsspkzZ6Z99903/fvf/06rrLJKw/1KW3VUswhbY7uodR3ldbT1x4TOvg46q/jxNYL0cO2116bzzjsv+9wGADoWBxsFAGgnP/zhDxtOR5/vTTbZZInbRL/00qrr6PkeVfZNQ/QQ/Zi///3vZ5X4Tc2aNSt7vqicX2211VKPHj2yfvObbbZZ+trXvpaeeuqpZscYAf53v/vd9KEPfSgNHjw4u1/fvn2zPQJiz4Ljjz8+3Xzzzdlt40eB6GHetG909CaPy4tLuXp6x2NFP/jYy6C0wnzKlCnpO9/5TqPbxnOWjqHp3gzx+iOQjwC4X79+2R4aEcRvsMEG2XPEOn3uueey28beE/EYTcP5+CGk9DmKezHEnh2ll8feITHGY445JltXsU6L66S52y7NP/7xj6zyOYLb6I0fryFef3PHRogfIUofv6nia2v6Gsrxmpvz97//PduzJfasiPUe6yKOhbDXXntle9LMnz9/ifs099gzZsxIp512WvY4sQ5i74NPf/rTrTouQrkV/x7ytvtrrrkm+6Es9oKJcffs2TMNGzYsO95BrJfLLrssLVq0qNF79/LLLzd6jNLnaO49XZ51XHTrrbdm4477xbL99tunX/ziF0s8b9O9kGI7KL0+tp/4oS/eqwiU4++ruE289dZb6eyzz8624dh2hwwZkq2H4vEtPvGJT6Rf/epXze5p09zzxHsex0yIv4f4XNh2222z40qUHmci9vCJz7/4LIvPtttvv73Z19+az4VSBx54YOratWvDnkeXXnppi+sYAKhdKtIBANpBHMQ0Dhha9NGPfrTZ2/36179udL4YiOWJEKpp0BqhT9PwOILWJ598Mlsi6InQ/utf/3rD9fPmzctaojzyyCNL3C8C9jhQbLTq+ctf/pI+/vGPp0qJ9RHrJX5EKLr66qtzD9paKl5DrP+5c+cusTdALP/5z3+yyveBAwemr371q20eb6y3CEqjjVBbxbgmTJjQKDSPavwTTjgha3Fzyy23ZMFptYm9CWJb+973vrfEdbF3wR//+Mdsiff0pptuajhgcHNeeOGF7IeoCGpLt90IT++8886sMrgaDywb21K8d819NsTy6KOPpssvvzx9/vOfzwLf9l7H8WNMbEelon1SLPE30xrxHsQ44gePpuJ9a+mAnK+88kq2/OEPf8gC/Pg3b4+b+EyNcZcewPqhhx7KflSJdR0/GowZM6bRQWHj8yt+VLj++uuzvVnK8bkQPzrGj5TFqvTYM6G5HzgBgNomSAcAaAdNe7dHpWdzgWvTsDUCn9aYNm1aGjVqVHrzzTcbLouKyugl/tprr2Wha7Fq8hvf+EZWDXrwwQdnl0WwVBqiRyV73C/EfSMAi1YqTXtCR4gVAV1RVAdHIF+0InpFx3opDdIjfIv1lxfAFkU1bGlYFv2No0L4nXfeSa+//nr2OotVwWHjjTfOXmesu9JK/q222iqr1C9qKbyNCvpi2BYBcKyv5Q27o5VPrPeddtopG28xuCtuY2eddVZZAry2vuamvv3tby8R8MZ6X3nllbPgs7hdxY9A0XM6XldL6yiC0OIPKlHNHWFq8f2MdXLOOeekH//4x2l5RQV8BLFNlYa1rRXbVbQpKipWTse/EaLHtht7LTTdxuOy+Nsqfe7SPuzlWsd//etf00knndTovmussUa2HcSxCVq7PiOoLz7GpptumlWhFyu2i+KzJ7al973vfdk44rMrxvTuu+9m10fVeIThxx13XIvPE9XmEbTH30McRyF+JCyKHxUiSI9jLMQxFOIHmOKPi1HtHj8alAbprf1caGqHHXZo+Ht85plnss/yeP0AQMchSAcAaAcPP/xwo/PNhcul4XdRaytrL7jggkaPE2HdbbfdllVRhghZoyVG0Yknnpi1JejSpUujCt9oaxDBU7RbKIoQKQ6EGpWZpT2hI5wqbe/SHv2ymwvM43UvS5Be+jq/8IUvZFXApSI4i1C6GIJ99rOfzZZoI1Ha6uToo49eplYs4ZBDDkk/+clPGvYeiArq5RHhY1TOrrvuutn5H/3oR+nII49suP4HP/hBdrDDth5ctRyvuei///1vFm6Xij0IYrsr/ggS7TaKIWeE99GC5Mtf/nKLj1l6wOIIvnfbbbcWf7RqrWil0rSdSlvFayutio5wvOlBmKNFSexVUAy3i8F7fAaUjqe5v622ruPo6V3aSiXaz1x33XXZ9hp7o0TwXvwBY1nFZ0uMKT5bSrf597///dlnSPzb3N9wbNvFY0REK5y8ID3au8S6jNYtMf4Is+MzKkQoHn8HDzzwQBbmx48RcRDr+OEixBhKf3xr7edCU/EcTVvsCNIBoGPRIx0AoB0UD45ZWrW9LErDt9ZUghZF2FgM0UNUnUYVb1FUmkdLiVBaaRzVq1HRGWFcVLNGUBcVpRFUtTZIXRGa65/cXL/o5pS+zviR4fzzz8/6vkfldVSwxvqKiuSoYi2HqLiNytrSFjxN2/EsqwiyiyF6+NKXvtQokIz3LVpxVJMIH4tVxsUfd4oBb4iq329+85uN7hMtPVoSPbdPPfXUhvPFnt6l23S1Kd3mij9oRVAbxxOIaudihX0cv2B59lZoyzqOH8iiJU6paJNU3EYjjG7tXg7rr79+ViFfDNFD8fGiV3n8ncVrjarv+PuIqvL4+40fikoPtLy0nvfxA0qE6CGeq+mePtE7vRhwx4+CTa8v3Vba+rnQ9DO9uR9GAYDaJkgHAGgHEUSX6t+//xK3iVYqTTXtc740TW/ftEoyDp4X7RpKFSsxo2VEtB4pigMfRtuXCOWiPcQ666yT9QZu7ZhWhOYqhptbf82JELYY6kWIGZWzUYEb6yUC2fix4OKLL849KGNrRHuc0qC3LaIPc6kIH5vu3VDuauq2Wto2GTbffPNG50urg5uK8DW241IRzha19X0bPXp09gNW0yVvTEsT4X/pngNReR59/uNHgLgu9u6I0Le1Vd/lWMfRUqW0dUwE+RtttFHudrc0UW3ftJVL0W9+85vscyYOhvz4449nld7Raqo50a4lT9PX2fTvrOkBnZteX7pnSFs/F5p+pkdfdQCgYxGkAwC0g9Kq8NDcQfiixUDTVgC33nprq56naQX7slZph169emX9pqM9yIc//OFG4WQxeIvK6giGKx3WNl0vUXEby7KI/u3R9/nYY4/NgrbSgxlGSBatII455pj0uc99rixjLd0DoNKaBpbtUTXblm2yOdHzv6mWQttqEgf4jQOi7r///mno0KGNroswOwLm2DZvvPHGiq7j5u7b2sdraZuPv6+jjjqq0XYYPyLEcR3ih7xYSttJtfZztbQCPkS1+7Jq6+dC09C/Nc8NANQGQToAQDuIlgVNg7PmlLZjCNH+YWntDUqrKkt7lYfSg++FCLCKBxxt7j5xYL4Ii6LVQ1SKxkECo+dwtBApra6P/srlCkZbK8b/s5/9rNFlBx10UKtbT8SBO2P9RDVu9EqOVhel1d033HBDo0rf5X2dTcO9tmj6foam72dpi4qmbULi/SwNX+Mgk3nK8d4ubZsMEWDm3aejiBA9wvSoeJ41a1b65z//mR00t/hDQLwnsV229j1oyzqOliSlPfXj8+T5559vdNs4QGk5tvl//etfjSq1ozI9+rdHK5Xo/R490StpeT4XWvpMb/qZDwDUPkE6AEA72HLLLRudjwCtOdHDPCo0iyLM2X333dNdd921xG2jQjz6DJf2i/74xz/e6DZxoMjSSsnvfOc7DT2Zi5WjUWEeos1CHLyy9Ppo6bLNNttkvYFb6vke4Xup0vuXU4SMEWJFX+TSVhTR0qVp/+c8V155ZVbRXvwBItqERDV7rLum7S/yXmclenHHHgGlLUbiAKbFg7+Gvn37Nurh3LQyONr1FHvMx7bRXOBaqhyvOXpYlz5O9HCP6uvSx4ztslTT7bjWxfYaPcNL/+4jvI6ANg5EG3uDtHQ8hWV5D9qyjiPEjz1QSsVnSrFqPHqWlx6guC0WLFjQ6Hz80FOs/I5tMg6UW/q33Z6W93OhqOnf0tZbb72CRwwAtLfGzQUBAFghmgZVEXRFdWpTEVzHAUMjPC8edC9CsAjK4iCTcUDCCJyiYrQYoEYrgqI4QGhUi0+dOjU7H+0I1ltvvSwsj8eJitBS48ePb6gejSrL6OMcrRfiuaJiNcK+qCCNqvRSpT2UBw8enI27WGn67LPPZpWm8RhRTRu9oD/2sY8t13r7yle+kgWE0QonqmKLr6so2s/E+mqu3UdLonXG73//+6yFRLyOqByNMPG5555rVN0dQVrpgTxj3Zc6++yzs4NFFnsj//KXv2wUiK4Ib7zxRtavOn7ciD0GigeKLYq9CUqriz/60Y9mYyw9+Gy0GImwMg5MujTleM2xbZxwwglZcF8U/cDPO++8rP3F3//+90atjuI5Dz/88NSRRGuQCKdjie1tgw02yNqSzJ07N3v9pQfYbNqfPNZHHPCyKA6YGX3iI4CO0/E339Z1HP3Ab7nlloaD+F577bXZZ1TcLv7umguOl0e0TIkfe6IaP8SBjKMKPJ4n/vbiR6L4zGjtQZbLYXk/F4qiLVZRvL9N23QBALVPkA4A0A6isjEO2lkMpONgg+eff36zt42K4gi+Pv/5zzcKSiM8b9pyoWkbhQi1o03CJz/5yawtQbHlQDxfqQiIokL20EMPXeLxIsSK8CiW5kQoH+F4qSOOOKJRxWuEb8V2EHFAxeX1xz/+scXr4uB/v/jFL7KDoC6PCJMfeeSRFq+P0Lg0oN9jjz2yPvbF9RqVq3fccUejitYVLcLPq666qtk9FOLHmnHjxjW67Oijj86q1kt72hf7okef7h133DFrqdGScr3mGFe0lYmDNRY1/RGgGLRGK43iQR87ogilWwqmY3v71re+1eiy+FuLPTGKohVKLOVcx7EdxI9qEagXxTZT3G5iz5c4dkJLLYOWVYTU55xzTvZ4zX2uxcGMY2yVPAZDaz8Xin9TpRXpTffgAQA6Bq1dAADaSWl4FCFzS+1dQlRERphz++23Z/3JI/yKytIIwKPiOCo4Dz744HT11VdnwVTToDse+3vf+17WBiV6IEcVZVSCRiuJCFfj+UtDs7DTTjtlrT9Gjx6dVT1H0FpsvRCno0r+hz/8YdZXu7TqOUQoHwHgxhtvXPaq7Bh7VECPGDEifehDH8rWY1R/xjiWJ0SPquAIw/baa6+ssjSqeWO9RsgX1bHxA8bEiROzNjul4nVFgB0HGyxWq7a3+OEjXvc+++yTjTven9hWzj333OxHh6YBdFQ9x+0PO+ywrAVOvJfRQz3WYfTMLu393JxyveaoMo5tJ/aQ+MIXvpCt59iGYjwxrjjYZAT+Dz/8cPY+dzT9+vVLv/71r7M9BuKHsvhxIl5/bNvF9kmnnHJK9nfb9D2J7TQqxOOHo/gbXlHrOCraoyo9DroZzxNLVLzHuEs/u9p6AN1YB/HjTayH2Nsknidef+xJE+OvlOX9XAixjhYtWpSdjvc09uoBADqeukIl9psDAFaYCEiifUMEZ3niy/6f//znrFo4bh8BQSx5ojIy+uZGFWq0AYnWH7Erfl7wdd9996Wdd965YVf9eL7ic+aJdiQRbMTriOeL2zd3gLdSEeTGayq+jgiW7r777tyK6FdffTWrFi++juJ6W1qlbYTKETwv7XU07Q8cAU2x2nLMmDHpggsuWOb7A6woUeUeAXnTH0siII49IWLvj9LP2gj+WSxa7cQxJkL8wBktjwCAjkdrFwCAdhKVodH+5LOf/Wx2/sc//nF2cL2oGAeopDig6M0335ztxbL66qtnVfTRsiRa+ZT+iBlhe7RgYbE4QGkxRI/q9WiRAwB0TIJ0AOiA4oCETz/9dKv7wi7tPtOnT1+ipUf0to0D5rWk2Fu5VPTsXtpzRfV20/NLu088bnPPn3e/Yr/opq9zac8V62t5fOYzn8mCqqiUjwPuffe7383acgBUWvRYz+uZHwfRvP7667OD/LLYWWed1XA62mXFHk4AQMckSAeADujkk0/OltaIg1tGr+Wlif7ZTVuctNaECROypTVef/31ZRpf9PfNG++yuPHGG7NlaeJAjMujuQNFAlRS9FWPiurosR6ft//973+zvWjiAMYjR45M++23X9YrvyMfCHZ5PPjgg5UeAgDQTvRIBwAAAACAHF3yrgQAAAAAgM5OkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAACQQ5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAA1RKk33vvvWmfffZJw4YNS3V1denGG29c6n0mTpyYtthii9SzZ8+03nrrpSuvvLJdxgoAAB2BOTgAANRYkD579uy0+eabpwkTJizT7V988cW09957p9122y09/vjj6bjjjktf/OIX0+23377CxwoAAB2BOTgAALRdXaFQKFTkievq0g033JD222+/Fm9z4oknpltuuSX985//bLjsc5/7XHrnnXfSbbfd1k4jBQCAjsEcHAAAOmCP9AceeCDtvvvujS4bNWpUdjkAAFB+5uAAALCkbqmKTZ48Oa222mqNLovzM2bMSO+++27q3bv3EveZN29ethTV19ent99+O62yyipZBQ4AALSX2Plz5syZWX/yLl2quoalgTk4AAC1rLCC5uBVHaQvj/Hjx6czzzyz0sMAAIAGr7zySlpjjTVSR2UODgBAR5+DV3WQPmTIkPTmm282uizO9+/fv9lKmDB27Ng0ZsyYhvPTp09Pa665Zrbi4n4AANBeoop7+PDhqV+/fqlWmIMDAFDLZqygOXhVB+nbb799uvXWWxtddscdd2SXt6Rnz57Z0lRM4E3iAQCohFpqb2IODgBAR1BX5jl4uzZqnDVrVnr88cezJbz44ovZ6UmTJjVUshx66KENtz/yyCPTCy+8kE444YT09NNPp0suuST95je/Sccff3x7DhsAAGqWOTgAANRYkP7www+nD37wg9kSYvfPOH366adn5994442GCX1Ye+210y233JJVwGy++ebpggsuSD/96U/TqFGj2nPYAABQs8zBAQCg7eoKcRjTDt4TZ8CAAVmfRruVAgDQnjrrXLSzvm4AADruXLRdK9IBAAAAAKDWCNIBAAAAACCHIB0AAAAAAHII0gEAAAAAIIcgHQAAAAAAcgjSAQAAAAAghyAdAAAAAAByCNIBAAAAACCHIB0AAAAAAHII0gEAAAAAIIcgHQAAAAAAcgjSAQAAAAAghyAdAAAAAAByCNIBAAAAACCHIB0AAAAAAHII0gEAAAAAIIcgHQAAAAAAcgjSAQAAAAAghyAdAAAAAAByCNIBAAAAACCHIB0AAAAAAHII0gEAAAAAIIcgHQAAAAAAcgjSAQAAAAAghyAdAAAAAAByCNIBAAAAACCHIB0AAAAAAHII0gEAAAAAIIcgHQAAAAAAcgjSAQAAAAAghyAdAAAAAAByCNIBAAAAACCHIB0AAAAAAHII0gEAAAAAIIcgHQAAAAAAcgjSAQAAAAAghyAdAAAAAAByCNIBAAAAACCHIB0AAAAAAHII0gEAAAAAIIcgHQAAAAAAcgjSAQAAAAAghyAdAAAAAAByCNIBAAAAACCHIB0AAAAAAHII0gEAAAAAIIcgHQAAAAAAcgjSAQAAAAAghyAdAAAAAAByCNIBAAAAACCHIB0AAAAAAHII0gEAAAAAIIcgHQAAAAAAcgjSAQAAAAAghyAdAAAAAAByCNIBAAAAACCHIB0AAAAAAHII0gEAAAAAIIcgHQAAAAAAcgjSAQAAAAAghyAdAAAAAAByCNIBAAAAACCHIB0AAAAAAHII0gEAAAAAIIcgHQAAAAAAcgjSAQAAAAAghyAdAAAAAAByCNIBAAAAACCHIB0AAAAAAHII0gEAAAAAIIcgHQAAAAAAcgjSAQAAAACgmoL0CRMmpBEjRqRevXqlbbfdNj300EO5t7/ooovSBhtskHr37p2GDx+ejj/++DR37tx2Gy8AANQ6c3AAAKihIP3aa69NY8aMSePGjUuPPvpo2nzzzdOoUaPSlClTmr391VdfnU466aTs9k899VS6/PLLs8c4+eST23PYAABQs8zBAQCgxoL0Cy+8MP3f//1fOvzww9PGG2+cLrvsstSnT5/0s5/9rNnb33///WnHHXdMBx10UFZBs8cee6QDDzxwqRU0AADAYubgAABQQ0H6/Pnz0yOPPJJ233339568S5fs/AMPPNDsfXbYYYfsPsVJ+wsvvJBuvfXWtNdee7X4PPPmzUszZsxotAAAQGdkDg4AAOXRLbWTadOmpUWLFqXVVlut0eVx/umnn272PlEFE/fbaaedUqFQSAsXLkxHHnlk7m6l48ePT2eeeWbZxw8AALXGHBwAAGr0YKOtMXHixHTOOeekSy65JOvneP3116dbbrklnX322S3eZ+zYsWn69OkNyyuvvNKuYwYAgFpmDg4AABWsSF911VVT165d05tvvtno8jg/ZMiQZu9z2mmnpUMOOSR98YtfzM5vuummafbs2elLX/pSOuWUU7LdUpvq2bNntgAAQGdnDg4AADVWkd6jR4+05ZZbpjvvvLPhsvr6+uz89ttv3+x95syZs8REPb4IhNjNFAAAaJk5OAAA1FhFehgzZkwaPXp02mqrrdI222yTLrrooqy65fDDD8+uP/TQQ9Pqq6+e9VgM++yzT7rwwgvTBz/4wbTtttum5557LquQicuLk3kAAKBl5uAAAFBjQfoBBxyQpk6dmk4//fQ0efLkNHLkyHTbbbc1HPxo0qRJjapfTj311FRXV5f9+9prr6VBgwZlE/hvf/vb7TlsAACoWebgAADQdnWFDr5/5owZM9KAAQOygx7179+/0sMBAKAT6axz0c76ugEA6Lhz0XbrkQ4AAAAAALVIkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAACQQ5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAACQQ5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAACQQ5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAACQQ5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAACQQ5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAACQQ5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAACQQ5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAACQQ5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAACQQ5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAACQQ5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAACQQ5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAABQTUH6hAkT0ogRI1KvXr3Stttumx566KHc27/zzjvp6KOPTkOHDk09e/ZM66+/frr11lvbbbwAAFDrzMEBAKBtuqV2dO2116YxY8akyy67LJvAX3TRRWnUqFHpmWeeSYMHD17i9vPnz08f/ehHs+t++9vfptVXXz29/PLLaeDAge05bAAAqFnm4AAA0HZ1hUKhkNpJTNy33nrrdPHFF2fn6+vr0/Dhw9MxxxyTTjrppCVuH5P973znO+npp59O3bt3X67nnDFjRhowYECaPn166t+/f5tfAwAA1NJc1BwcAIDOZMYKmou2W2uXqGx55JFH0u677/7ek3fpkp1/4IEHmr3PTTfdlLbffvtst9LVVlstbbLJJumcc85JixYtaq9hAwBAzTIHBwCAGmvtMm3atGzyHZPxUnE+ql2a88ILL6S77rorHXzwwVlPxueeey595StfSQsWLEjjxo1r9j7z5s3LltJfIAAAoDMyBwcAgBo92GhrxG6n0Zvxxz/+cdpyyy3TAQcckE455ZRsd9OWjB8/PivdLy6x2yoAALBszMEBAKCCQfqqq66aunbtmt58881Gl8f5IUOGNHufoUOHpvXXXz+7X9FGG22UJk+enO2m2pyxY8dm/W+KyyuvvFLmVwIAALXBHBwAAGosSO/Ro0dW0XLnnXc2qnaJ89GDsTk77rhjtitp3K7oP//5Tza5j8drTs+ePbMm8qULAAB0RubgAABQg61dxowZk37yk5+kq666Kj311FPpqKOOSrNnz06HH354dv2hhx6aVbMUxfVvv/12OvbYY7PJ+y233JId6CgOfAQAACydOTgAANTQwUZD9FecOnVqOv3007NdQ0eOHJluu+22hoMfTZo0KXXp8l62H70Vb7/99nT88cenzTbbLK2++urZhP7EE09sz2EDAEDNMgcHAIC2qysUCoXUgc2YMSM74FH0arSLKQAA7amzzkU76+sGAKDjzkXbtbULAAAAAADUGkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAAVFOQPmHChDRixIjUq1evtO2226aHHnpome53zTXXpLq6urTffvut8DECAEBHYg4OAAA1FKRfe+21acyYMWncuHHp0UcfTZtvvnkaNWpUmjJlSu79XnrppfSNb3wj7bzzzu02VgAA6AjMwQEAoMaC9AsvvDD93//9Xzr88MPTxhtvnC677LLUp0+f9LOf/azF+yxatCgdfPDB6cwzz0zrrLNOew4XAABqnjk4AADUUJA+f/789Mgjj6Tdd9/9vSfv0iU7/8ADD7R4v7POOisNHjw4HXHEEcv0PPPmzUszZsxotAAAQGdkDg4AADUWpE+bNi2rbFlttdUaXR7nJ0+e3Ox97rvvvnT55Zenn/zkJ8v8POPHj08DBgxoWIYPH97msQMAQC0yBwcAgBo92OiymjlzZjrkkEOyCfyqq666zPcbO3Zsmj59esPyyiuvrNBxAgBAR2EODgAAzeuW2klMxLt27ZrefPPNRpfH+SFDhixx++effz47wNE+++zTcFl9fX32b7du3dIzzzyT1l133SXu17Nnz2wBAIDOzhwcAABqrCK9R48eacstt0x33nlno0l5nN9+++2XuP2GG26YnnzyyfT44483LJ/4xCfSbrvtlp22uygAAOQzBwcAgBqrSA9jxoxJo0ePTltttVXaZptt0kUXXZRmz56dDj/88Oz6Qw89NK2++upZj8VevXqlTTbZpNH9Bw4cmP3b9HIAAKB55uAAAFBjQfoBBxyQpk6dmk4//fTs4EYjR45Mt912W8PBjyZNmpS6dKnatu0AAFBzzMEBAKDt6gqFQiF1YDNmzEgDBgzIDnrUv3//Sg8HAIBOpLPORTvr6wYAoOPORZWeAAAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADkEKQDAAAAAEAOQToAAAAAAOQQpAMAAAAAQDUF6RMmTEgjRoxIvXr1Sttuu2166KGHWrztT37yk7Tzzjun973vfdmy++67594eAABYkjk4AADUUJB+7bXXpjFjxqRx48alRx99NG2++eZp1KhRacqUKc3efuLEienAAw9Md999d3rggQfS8OHD0x577JFee+219hw2AADULHNwAABou7pCoVBI7SSqX7beeut08cUXZ+fr6+uzifkxxxyTTjrppKXef9GiRVlVTNz/0EMPXabnnDFjRhowYECaPn166t+/f5tfAwAALKtqmIuagwMA0JnMWEFz0XarSJ8/f3565JFHsl1DG568S5fsfFS6LIs5c+akBQsWpJVXXnkFjhQAADoGc3AAACiPbqmdTJs2LatmWW211RpdHueffvrpZXqME088MQ0bNqzRF4Gm5s2bly2lv0AAAEBnZA4OAAA1erDR5XXuueema665Jt1www3ZQZJaMn78+Kx0v7jEbqsAAEDrmYMDAEA7B+mrrrpq6tq1a3rzzTcbXR7nhwwZknvf7373u9kk/k9/+lPabLPNcm87duzYrP9NcXnllVfKMn4AAKg15uAAAFBjQXqPHj3Slltume68886Gy+JAR3F+++23b/F+559/fjr77LPTbbfdlrbaaqulPk/Pnj2zJvKlCwAAdEbm4AAAUGM90sOYMWPS6NGjs8n4Nttsky666KI0e/bsdPjhh2fXH3rooWn11VfPdg0N5513Xjr99NPT1VdfnUaMGJEmT56cXd63b99sAQAA8pmDAwBAjQXpBxxwQJo6dWo2MY8J+ciRI7Mql+LBjyZNmpS6dHmvSP7SSy9N8+fPT5/+9KcbPc64cePSGWec0Z5DBwCAmmQODgAAbVdXKBQKqQObMWNGdsCj6NVoF1MAANpTZ52LdtbXDQBAx52LtluPdAAAAAAAqEWCdAAAAAAAyCFIBwAAAACAHIJ0AAAAAADIIUgHAAAAAIAcgnQAAAAAAMghSAcAAAAAgByCdAAAAAAAyCFIBwAAAACAHIJ0AAAAAADIIUgHAAAAAIAcgnQAAAAAAMghSAcAAAAAgByCdAAAAAAAyCFIBwAAAACAHIJ0AAAAAADIIUgHAAAAAIAcgnQAAAAAAMghSAcAAAAAgByCdAAAAAAAyCFIBwAAAACAHIJ0AAAAAADIIUgHAAAAAIAcgnQAAAAAAMghSAcAAAAAgByCdAAAAAAAyCFIBwAAAACAHIJ0AAAAAADIIUgHAAAAAIAcgnQAAAAAAMghSAcAAAAAgByCdAAAAAAAyCFIBwAAAACAHIJ0AAAAAADIIUgHAAAAAIAcgnQAAAAAAMghSAcAAAAAgByCdAAAAAAAyCFIBwAAAACAHIJ0AAAAAADIIUgHAAAAAIAcgnQAAAAAAMghSAcAAAAAgByCdAAAAAAAyCFIBwAAAACAHIJ0AAAAAADIIUgHAAAAAIAcgnQAAAAAAMghSAcAAAAAgByCdAAAAAAAyCFIBwAAAACAHIJ0AAAAAADIIUgHAAAAAIAcgnQAAAAAAMghSAcAAAAAgByCdAAAAAAAyCFIBwAAAACAHIJ0AAAAAADIIUgHAAAAAIAcgnQAAAAAAMghSAcAAAAAgByCdAAAAAAAyCFIBwAAAACAHIJ0AAAAAADIIUgHAAAAAIAcgnQAAAAAAMghSAcAAAAAgByCdAAAAAAAyCFIBwAAAACAHIJ0AAAAAADIIUgHAAAAAIAcgnQAAAAAAKimIH3ChAlpxIgRqVevXmnbbbdNDz30UO7tr7vuurThhhtmt990003Trbfe2m5jBQCAjsAcHAAAaihIv/baa9OYMWPSuHHj0qOPPpo233zzNGrUqDRlypRmb3///fenAw88MB1xxBHpscceS/vtt1+2/POf/2zPYQMAQM0yBwcAgLarKxQKhdROovpl6623ThdffHF2vr6+Pg0fPjwdc8wx6aSTTlri9gcccECaPXt2uvnmmxsu22677dLIkSPTZZddtkzPOWPGjDRgwIA0ffr01L9//zK+GgAAqP65qDk4AACdyYwVNBftltrJ/Pnz0yOPPJLGjh3bcFmXLl3S7rvvnh544IFm7xOXR/VMqaieufHGG1t8nnnz5mVLUayw4goEAID2VJyDtmPtSiPm4AAAdDYzVtAcvN2C9GnTpqVFixal1VZbrdHlcf7pp59u9j6TJ09u9vZxeUvGjx+fzjzzzCUuj6obAACohLfeeiurimlv5uAAAHRWb5V5Dt5uQXp7iWqb0gqad955J6211lpp0qRJFfnyQnX/OhVf7l555RW7HNOIbYOW2DZoiW2DlkRl9pprrplWXnnl1JGZg7OsfF7SEtsGLbFt0BLbBu09B2+3IH3VVVdNXbt2TW+++Wajy+P8kCFDmr1PXN6a24eePXtmS1MxgfdHRXNiu7Bt0BzbBi2xbdAS2wYtiXYqlWAOTrXyeUlLbBu0xLZBS2wbtNccvN1m9D169EhbbrlluvPOOxsuiwMdxfntt9++2fvE5aW3D3fccUeLtwcAAN5jDg4AADXY2iV29xw9enTaaqut0jbbbJMuuuiiNHv27HT44Ydn1x966KFp9dVXz3oshmOPPTbtsssu6YILLkh77713uuaaa9LDDz+cfvzjH7fnsAEAoGaZgwMAQI0F6QcccECaOnVqOv3007ODFY0cOTLddtttDQczih6KpSX3O+ywQ7r66qvTqaeemk4++eT0/ve/P914441pk002WebnjF1Mx40b1+yupnRutg1aYtugJbYNWmLboJq3DXNwqoltg5bYNmiJbYOW2DZo722jrlAoFMr6iAAAAAAA0IFU5qhHAAAAAABQIwTpAAAAAACQQ5AOAAAAAAA5BOkAAAAAANDRg/QJEyakESNGpF69eqVtt902PfTQQ7m3v+6669KGG26Y3X7TTTdNt956a7uNlerdNn7yk5+knXfeOb3vfe/Llt13332p2xKd53Oj6Jprrkl1dXVpv/32W+FjpDa2jXfeeScdffTRaejQodkRwddff33/X+mgWrttXHTRRWmDDTZIvXv3TsOHD0/HH398mjt3bruNl/Zx7733pn322ScNGzYs+//DjTfeuNT7TJw4MW2xxRbZZ8Z6662XrrzyylSLzMFpiTk4LTEHpyXm4LTEHJyqmoMXatw111xT6NGjR+FnP/tZ4V//+lfh//7v/woDBw4svPnmm83e/q9//Wuha9euhfPPP7/w73//u3DqqacWunfvXnjyySfbfexU17Zx0EEHFSZMmFB47LHHCk899VThsMMOKwwYMKDw6quvtvvYqa5to+jFF18srL766oWdd965sO+++7bbeKnebWPevHmFrbbaqrDXXnsV7rvvvmwbmThxYuHxxx9v97FTXdvGr371q0LPnj2zf2O7uP322wtDhw4tHH/88e0+dlasW2+9tXDKKacUrr/++kJMrW+44Ybc27/wwguFPn36FMaMGZPNRX/4wx9mc9PbbrutUEvMwWmJOTgtMQenJebgtMQcnGqbg9d8kL7NNtsUjj766IbzixYtKgwbNqwwfvz4Zm//2c9+trD33ns3umzbbbctfPnLX17hY6W6t42mFi5cWOjXr1/hqquuWoGjpFa2jdgedthhh8JPf/rTwujRo03iO6jWbhuXXnppYZ111inMnz+/HUdJLWwbcdsPf/jDjS6LSduOO+64wsdK5SzLJP6EE04ofOADH2h02QEHHFAYNWpUoZaYg9MSc3BaYg5OS8zBaYk5ONU2B6/p1i7z589PjzzySLb7X1GXLl2y8w888ECz94nLS28fRo0a1eLt6TzbRlNz5sxJCxYsSCuvvPIKHCm1sm2cddZZafDgwemII45op5FSC9vGTTfdlLbffvtst9LVVlstbbLJJumcc85JixYtaseRU43bxg477JDdp7jr6QsvvJDtbrzXXnu127ipTh1hLmoOTkvMwWmJOTgtMQenJebglFO55qLdUg2bNm1a9kEZH5yl4vzTTz/d7H0mT57c7O3jcjqO5dk2mjrxxBOzXktN/9DofNvGfffdly6//PL0+OOPt9MoqZVtIyZmd911Vzr44IOzCdpzzz2XvvKVr2QBwLhx49pp5FTjtnHQQQdl99tpp51i77+0cOHCdOSRR6aTTz65nUZNtWppLjpjxoz07rvvZv08q505OC0xB6cl5uC0xByclpiDU41z8JquSIcV5dxzz80OaHPDDTdkB7Sg85o5c2Y65JBDsgNhrbrqqpUeDlWmvr4+q5L68Y9/nLbccst0wAEHpFNOOSVddtlllR4aFRYHsonKqEsuuSQ9+uij6frrr0+33HJLOvvssys9NICqZQ5OkTk4eczBaYk5OCtaTVekx/9Qu3btmt58881Gl8f5IUOGNHufuLw1t6fzbBtF3/3ud7NJ/J///Oe02WabreCRUu3bxvPPP59eeuml7GjQpRO30K1bt/TMM8+kddddtx1GTjV+bgwdOjR17949u1/RRhttlP3aHbsi9ujRY4WPm+rcNk477bQsAPjiF7+Ynd90003T7Nmz05e+9KXsi17slkrn1NJctH///jVRjR7MwWmJOTgtMQenJebgtMQcnGqcg9f0FhQfjvHr45133tnof65xPvplNScuL719uOOOO1q8PZ1n2wjnn39+9kvlbbfdlrbaaqt2Gi3VvG1suOGG6cknn8x2KS0un/jEJ9Juu+2WnR4+fHg7vwKq6XNjxx13zHYlLX6xC//5z3+yyb0JfOfeNqLHb9OJevHL3uLj4dBZdYS5qDk4LTEHpyXm4LTEHJyWmINTTmWbixZq3DXXXFPo2bNn4corryz8+9//LnzpS18qDBw4sDB58uTs+kMOOaRw0kknNdz+r3/9a6Fbt26F7373u4WnnnqqMG7cuEL37t0LTz75ZAVfBdWwbZx77rmFHj16FH77298W3njjjYZl5syZFXwVVMO20dTo0aML++67bzuOmGrdNiZNmlTo169f4atf/WrhmWeeKdx8882FwYMHF771rW9V8FVQDdtGzC9i2/j1r39deOGFFwp/+tOfCuuuu27hs5/9bAVfBStCzBMee+yxbImp9YUXXpidfvnll7PrY7uI7aMotoc+ffoUvvnNb2Zz0QkTJhS6du1auO222wq1xByclpiD0xJzcFpiDk5LzMGptjl4zQfp4Yc//GFhzTXXzCZg22yzTeHBBx9suG6XXXbJ/odb6je/+U1h/fXXz27/gQ98oHDLLbdUYNRU27ax1lprZX98TZf4IKbjae3nRimT+I6ttdvG/fffX9h2222zCd4666xT+Pa3v11YuHBhBUZONW0bCxYsKJxxxhnZxL1Xr16F4cOHF77yla8U/vvf/1Zo9Kwod999d7Pzh+L2EP/G9tH0PiNHjsy2pfjcuOKKKwq1yByclpiD0xJzcFpiDk5LzMGppjl4XfynrLXyAAAAAADQgdR0j3QAAAAAAFjRBOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAACQQ5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAACQQ5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkEOQDgAAAAAAOQTpAAAAAFWmrq4uW0aMGJFq0RlnnNHwGq688spKDwegzQTpAFU62WxuGThw4BL3WbRoUfrFL36R9thjjzRo0KDUo0eP7N+PfvSj2YQ1rm8qJuPFx5w4cWI7vToAAFpj9uzZ6Xvf+1760Ic+lFZZZZXUq1evtPbaa6ePf/zj6Ze//GWaP3/+Cn3+G2+8MZufxvLSSy+1+v5//vOf0wEHHJDWXHPNbOyDBw9O22yzTTrzzDPTpEmTVsiYKb/4vpAX6pd+hznssMOqZvsDKLduZX9EANrNjBkz0ic/+cl01113Nbp82rRp2ReXWCJM//3vf58GDBiwXM8RX37+8Ic/pC5dlvzttb6+Pn3mM59JV111VcVuBwDQEf373/9O++yzT3rhhRcaXR6BYiy33HJL2mSTTdLIkSNX2BgiyCzOt3bddddlroxesGBBOuKII7Jij1JTp07Nlr///e/pv//9b7roootWyLg7ir/85S/Zv/EjRC36whe+kHbffffs9Prrr99u2x/AiiJIB6hSe+65Zzr55JMbXdatW+OP7fiCUgzRV1555XT66adnX6j+9a9/ZZU+b7/9drrnnnuy2/32t79drnFERftNN93UMAkuddttt2XVUJW8HQBARxNzuJgLFqu2hw0blr75zW+mTTfdNM2cOTOb311xxRWpWh1//PENIXoURfzf//1fVkUfgfCTTz7Zadt8xB4GK6200jLffqeddkq1LPZEiKUjib1AYptu+r0M6By0dgGoUrHra0yeS5ftttuu4fpHH320UTh+/fXXp2OPPTZ95CMfSV/72tey80W/+93vstsDAFD9vvvd7zaE6LFX4UMPPZSOO+64bJ633377Ze1e/vOf/zQKKSPgO++887IK9Qhr+/TpkzbffPN07rnnLtEC5h//+Efad999s/lm9+7ds7Yxcb8jjzwye96oeI82HaV7/+22227L1Brw6aefTpdeemnD+e9///vpsssuy4L0KJCIkP3xxx9PRx11VKP7RXHI3nvvnVZdddWsVeHw4cOzNiHPPvtsi21ELr/88qx4ZOjQoal///7pwAMPTO+88072Q8QhhxySrbsoNonXNXfu3IbHKL6+WKLSOSrkd9lll2ydxY8Wp512Wlq4cGGjADzGu9VWW6XVVlstG1889vbbb5+NoVTTx7733nuz2/Xu3TsdffTRy7T+i1pqp9Ka97q0pePkyZOz9fK+970v9evXL9sDNNZVe/dIL+f2t6zbTXjiiSeyx4n1tcYaa2TbTuzB21xbmjhdvPyPf/xj+vrXv55tZ/Fj0Kuvvppee+21rOI+1ns8d7yO2NY+/OEPZ5X0LbXGice97rrr0kYbbZSNY+edd85+XIo9bs8666y0+uqrZ5fHD2kvv/zyCnhXgLbwExpAjbrhhhsaTsekPib/peL8lltumR555JHsfLR32WKLLdp9nAAAtM61117bcDqC5wjXmooQsmjevHnZ8XIitG0aHMYSQeAdd9yRBY1vvfVWdiydaLFSFGFqLBFwfvrTn07rrbfeco89QsIIBUM8TtPAPESguMEGGzScv+SSS9JXv/rVVCgUGi6LsDKC1CgOufPOO9PWW2+9xOOMHz8+Pf/88w3nr7nmmoYgPX58KPrRj36UhZ3f+ta3lniMuH+EqxGWh3fffTe7Xayf+AEgxF4AxdOl7WsefPDBbIlQNfYMbSrC3FGjRjUK8Zdl/edVcbfmvW5qxx13bNQq6De/+U0WALfnnp7l3P5as928+OKL2fej2D5CvGcR9EcQvjTxHE1bLL3yyitL7BUS7YruvvvubIkxHHrooUs8VrxvP//5zxvGfN9992XvZ7Rx+slPftJoD9yDDz44ux6oHirSAapUTL6aHmy0tEoi+mYWtdQbs/TyaPcCAEB1mzVrVqPQLipWlyZ6jReD1ajIvfrqq9Ovf/3rhkA2rosq9vDAAw80hJhRwR2ha1TQRhV8BI1du3bNKm+jP3dUxRb94Ac/yC6L5YMf/GCLY4kwtCgqsePx8kQgGT8WRLAYLTNOPfXUrP97HA+nGGLHHLg0LC2KyuXzzz8/++EhKqyLAWTMk3/60582qoyPML05EbxGwBzH5jn77LMbxhu3j2A6RIVwVAtH8PynP/0pC0ojtH//+9+fXf+d73yn2QO/vv7661nlcwTVt956a7Y3wbKs/3K9103FjwQxlgigi0F7vI7p06enZRVV0k2/o0Rl97Iq1/bX2u3mlFNOaQjRN9tss6woKfaWiD07lib+HmOP39i2YruIbW3IkCHZHgCx529UtRfD80GDBmX3ae5Hm2KgH+OKsUarphB7CkSIPnbs2GxcsddD+Otf/+o7HFQZFekANXyg0aLihK2p0stLbw8AQHVqGmpGq5GliTC1KELSaKMS+vbtm1W6hghbTzzxxKwCuSiC2KgMj7A3AtFoX1EUbQVLq94j9FuWnt2l41+WsUerwmII/clPfjILs0NULUdoGiFjBOMR0DctHonWJNE7PkSVb4STIQLWOEZQuPjii7Mwctq0adnYoiVLqQjJIyCPy2O9RWuaX/3qVw17dEboGm1jIryNMPexxx7LKo/jeD6lP37E/eK2pSLgvfnmmxtV399+++3LtP7L8V43FbePMD/EsYgiGI7XET9ILEtldjmUa/v72c9+tszbTbwv8UNJUby/cVyp8MYbb2SBeJ6DDjooC91LRTuaCNPjh41ozRLbVumPPbE3Qnz/im2nVLzm+JEnto0YX3H7jR/MzjnnnOx0BPMTJkzITj/33HPpAx/4wDKtW2DFU5EOUKWiAqNYdVFcopKiqFh1E+KLQXNKd5ksVjYAAFC9mga9UdW8NKVVtdtuu23D6W222WaJ20RgV6ykjmruqGSO54x+3lEVW2zLUo7xt2XsEbiWVr43Vzlc+vqiP3Vp28OiaOlSVKxILrXhhhs2GnPpYxb3DIg2IRFSR/V0zLtLQ/S8x471XBqil2P9t+a9bqq0FWQEwXljb0mEx02/oxx++OHLfP9ybX+t2W6mTJmS/dhR/OGkGKIX95pYmuIPFKWi6j8qy+P1x/prbo+J5tZrtN6MEL0t2yxQOYJ0gBo62Ghx0hk23njjhtNRBbG0XWtL7wsAQHWKyuJ11lmn4Xy0d1heUeXbVASJ8ZjRqiQOjBjBaLTBuOeee9KXvvSlLNxsi9LK5ugf3lzo3JbxlyoNwIvhZGhaBVzUXNi5LM8ZVe1FEZ5Ge5cIUKP6uai5ALi5QpYVtf6Xtq5CHGS0qFu3bq1aL0U9e/Zc4jtKXk/39t7+lrYulmU9Lcv7+MMf/rDh9AknnJD1Y49totiupaVtYkVss0D7EaQD1KjibpnFLyl/+9vfGl0fE7mHH364YcL4+c9/vt3HCABA60XLkqILL7yw2cruqLKNAzSG9ddfv+Hy0oNsls4Pi7eJYC7a/5122mlZ+BetLaLyOgL8YvV1c0HfslYKR4/q4v2ivcWPf/zjJW4TY3jmmWdyxx4H84w2Kk3HX24xjtIWiKXrrPiDRhyYsjRAjQB9hx12aHT5soa2rVn/zWnNe12NyrX9tWa7iQKl4t68cVDZp556qlHP9qVp7n0svvdR2X/eeedlPwpEJfzStgmgtumRDlCjYve/6AcYB6QJn/jEJ9Lpp5+eNtpoo6wPZOlBf774xS82qmwCAKB6feMb38j6OE+aNClr7RCtK+KyqHaN6t2JEyemK664Ivs32kNED+figTGPPvro7DYR/p100kkNjxkHdgz3339/duDET33qU9kei9FGIu47Z86c7Pp58+Y1W8EcB6mMA0HGktcrPVqlHHXUUQ09no855phs78m99947q2b+5z//mY19t912y/pLf/rTn876eUcAGiHquHHj0nbbbZcduDFC1uKemCuqh3cEq/HDxVe/+tVsb844+GbRvvvum/271lprNbQSifn2qFGj0i9+8Yusx3VrtWb9N6c173U1Ktf215rtJtZPtGcp9pc/5JBDsiA//r6a9j5fVrFNxA9Fb731VtZjPfqwx2MVf9wCOiZBOkANiy8hcbCj+BIVVUnxBaCp+NJSuushAADVLcLxP/7xj1n4F9W6r776ajruuONavH1cFwfajD0SX3755SWC1A996EPZATiLFcGPPvpotjSn9L4RdkdFfHHeGUvxMfJE/+io8o6wOVq7XHrppdlSKh67ePDFCNRjHhtVx9Hyo1RUEl955ZXL1ZJjWQPRCHfjwJulohClePDQaDkS/dGLry2WXr16Zf2uH3nkkVY9X2vWf1vf62pUru2vtdvNt771rXTrrbdmP0zFe1bcuzfe4+IPE60R20TxQKFjx47N/o0fBaInfnFvC6Dj0doFoIZFj704qntUXuyxxx7ZbpJRpVE0evTodPPNN2fVPwAA1I6opo2AL4LEqMCNcL1Hjx5ZgBgV0TH/Kx4zJ+Z6EfQWK2N79+6dBb1RwT5+/Pisp3fct9jqIip5o3o3ej9Hr+xoq7H11ltnVeRxXdHHP/7x9N3vfjetu+66jXpqL00c8PHnP/959rzR6mWNNdbInj/aYGyxxRZZNfCYMWMabv+Vr3wlG/+ee+6Zvc54rmHDhqVDDz00Cz1jbCvKiBEjsv7ccbDLWG/Rs/vkk09uFPxH9fOPfvSjrII61muMJ4L30oNWLqvWrP/mtOa9rkbl3P5as92svfbaDe9zrK+hQ4emU089NdvDoLR/+7KKHysinI8fYuJ+8bh33XVXtv0AHVddwZELADqUhQsXZj36okolJtbxb1TLLK/44nDkkUem3XfffYnr4gtE7GYZS6VuBwAArfHSSy9lwWrYZZddsr076fgi/mq6Z0O0xIke5yF+tKrman6g8lSkA3QwUYnxm9/8JqvGePfdd7PdFt98881KDwsAAKBi4gCx0QM/+t3H8oMf/CBbintR7L///pUeIlDl9EgH6IBil8Kbbrop/eEPf8jOP/zww1mv9OUVYXxzu1NG9Xuxv2AlbwcAAJDnwQcfzJamoko9+t5HmxaAPFq7AAAAAJ2G1i6d09e+9rWsT3ocpHXOnDnZ8aW23377dOyxx6add9650sMDaoAgHQAAAAAAcuiRDgAAAAAAOQTpAAAAAADQmQ82Wl9fn15//fXUr1+/7AASAADQXqKL4syZM9OwYcNSly6dp4bFHBwAgI42B+/wQXpM4IcPH17pYQAA0Im98soraY011kidhTk4AAAdbQ7e4YP0qIIprrj+/fu3eyXO1KlTsyNBd6YKpGph/VdWp13/s2enNGzY4tOvv57SSitVZBiddv1XEe9BZVn/lWX9v2fGjBlZoFyck3YW5uCsSN7jjs973PF5jzs+73HHV1/F7/GKmoN3+CC9uCtpTOArMYmfO3du9rzVtkF1BtZ/ZXXa9d+163un4zOngkF6p1z/VcR7UFnWf2VZ/0vqbO1NzMFZkbzHHZ/3uOPzHnd83uOOr74G3uNyz8Gr81UCAAAAAECV6PAV6QDtqnv3lM4//73TAAAAANQ8QTpAOfXokdI3v1npUQAAAABQRoJ0AIBWWLRoUVqwYEGlh1H1/RJjHUXPxGrtl1gu3bt3T11Lj48BAACd4HtGfQXn/JWagwvSAcpp0aKUHn108ekttmh88FGgphUKhTR58uT0zjvvVHooNbGuYmI9c+bMTnGQzYEDB6YhQ4Z0itcKAEB51er3jEKF5/yVmIML0gHKae7clLbZZvHpWbNSWmmlSo8IKJPi5Hbw4MGpT58+QtOlTKoXLlyYunXr1qHXU7zOOXPmpClTpmTnhw4dWukhAQBQY2r1e0ahQnP+Ss7BBekAAMuwm2VxcrvKKqtUejhVr7ME6aF3797ZvzGRj+1DmxcAADrD94xCBef8lZqDd+ymlQAAZVDsVRgVItBUcbuopZ6WAABUnu8ZtTUHF6QDACyjjl5dzfKxXQAA0Bbmk7WxzgTpAAAAAACQQ5AOAAAAAAA5HGwUAKCDOuyww9JVV12VvvzlL6fLLrus0XVHH310uuSSS9Lo0aPTlVdemap17KVGjRqVbrvttobzn/jEJ9Ljjz+eHWTofe97X9p9993Teeedl4YNG9bi486dOzd9/etfT9dcc02aN29e9pixHlZbbbXs+rfeeisdfPDB6YknnshOx8GL9t1333TOOeek/v37r8BXDAAA7znjjOp/rsmTJ2fz71tvvTW99tpr2dx55MiR6bjjjksf+chH0ogRI9LLL7/c0NN8gw02SGPHjk2f+cxnGh7j7bffTmeddVa64YYb0htvvJFWXXXV9LGPfSydccYZac0110zVREU6QDl1757SuHGLlzgNUGHDhw/PQuN33323UZh89dVXV93EtKmYQMdkurj8+te/bnT9brvtln7zm9+kZ555Jv3ud79Lzz//fPr0pz+d+5jHH398+sMf/pCuu+66dM8996TXX3897b///g3Xd+nSJQvOb7rppvSf//wn+5Hhz3/+czryyCNX2OsEAIBa89JLL6Xtttsu3X333ek73/lOevLJJ7Oil5ijR9FOUYTkMZd/7LHH0tZbb50OOOCAdP/99zeE6PEYMd+Owp/nnnsu++4S/8ZtX3jhhVRNBOkA5dSjx+KfcmOJ0wAVtsUWW2Rh+vXXX99wWZyOEP2DH/xgo9vW19en8ePHp7XXXjv17t07bb755um3v/1tw/WLFi1KRxxxRMP1UVHy/e9/f4lK8k9+8pPpwgsvzCrDV1lllWwivWDBglaPvWfPnmnIkCENS1SdNw3FY+K91lprpR122CGddNJJ6cEHH2zxuaZPn54uv/zybGwf/vCH05ZbbpmuuOKKbCIf9wvxHEcddVTaaqutsseNSpqvfOUr6S9/+Uurxw8AAB3V0UcfnR3w829/+1v61Kc+ldZff/30gQ98II0ZM6Zhbh369euXzeXj+gkTJmTfI6KwJZxyyilZYUsE6XvuuWf2HeVDH/pQuv3221P37t0bBfLVQJAOALC8Zs9ueZk7d9lvW1Itnnvb5fSFL3whC4yLfvazn6XDDz98idtFiP7zn/88qwb517/+lQXVn//857PK7WLQvsYaa2TV3P/+97/T6aefnk4++eSsKrxUVKVE9chdd92VtWeJqu7S9jGxm2bs5rk0EydOzHYPjcA+wu1otdKSqGb51a9+lQXqMeluziOPPJKF7NECpmjDDTfMJuwPPPBAs/eJiX388LDLLrssdbwAANAZvP3221n1eey1udJKKy1x/cCBA5u9X7du3bK5+vz587PvFlF9Hm0VI2gvFWF7FLNEoB7PVS0E6QDlVF+f0r/+tXiJ00DH1rdvy8unPtX4toMHt3zbPfdsfNsImZu73XKKMPy+++7L+hPG8te//jW7rFT0C48+4BGyR9/wddZZJ6suj9v96Ec/ym4Tk94zzzwzq9aOqvSY9EYg3zRIj6ruqFSPkPrjH/942nvvvdOdd97ZcH30PVx33XWX2tYlQv24X/RdjDA/qlSiKr7UiSeemE3eo/J90qRJ6fe//31uD8cePXosMbGP/uhxXakDDzww6+O4+uqrZ73Rf/rTn+aOFwAAOovnnnsuFQqFrOBlWUV4HoU7sZdo7B06derU9M4776SNNtqo2dvH5fEc8VzVwsFGAcopqko32WTx6VmzUmrml1lS9j/MGTNmlO3xIuQaNGhQ2R4POpr4+4gwO6rCYzIapyPMLhUT1Dlz5qSPfvSjS0x4S1vAxO6YEbZHaB191+P6OKBQqdils2vXrg3nhw4dmvVMLPrqV7+aLXk+97nPNZzedNNN02abbZaF71GlHu1Wir75zW9m7WbiB4II+Q899NB08803Z7uZtsX3vve9NG7cuKxPehwQKXZRjYOSAgBAZ1coFJb5tlH4cuqpp2bHaerbt28699xzs+8jb775Zqsfq9IE6QC0e4h+1BcPSvNmtdyiobV69l0lXfrTq4XptL/4wawlJUFyZsqUlm/bpclOgi+9lMot2rsUw+sIw5ua9b/Xcsstt2RV2E17lYfY9fIb3/hGuuCCC9L222+f9TuMAwtFX8RSTVurRKgdu262RVTIR/gfgX9pkB6XxRI9F6NqJfrBR0/GGF9TsctoBP9R+VJalR6T+Ka7kxb7skdV/corr5x23nnndNppp2U/CgBknjhj+e+7WRvu2wnF4Yc643MDVKv3v//92Rz/mWeeWepto/Al9nSNED32BC0WvMT395iTP/XUU83eLy6P26633nqpWgjSAWhXUYkeIfrX9+mZhg/q3ebHe2Xqu+mCP7yVPa4gnXbXmr1OVtRtl1G0SokQOSaj0bqlqY033jgLzKPSvKV+4NESJnqQR7/Coueffz61h1dffTXrkZ4XZBfD+mhT05w4uGiE/NEuJg6IFGLyH6+5ueB9WR8XAAA6k5VXXjn7ThHHVjruuOOykLxUaeFKFL00F4Z36dIlffazn82Oc3TWWWc1KmyJPV9jb9B4jniuaiFIB6AiIkRfd/VyhYXCLViaaLVSrPYobbtSFNXlUW0eBxiN4HinnXbK+hdGeB7tk0aPHp1VnkTf8jjoT/RI/8UvfpH+/ve/Z6db4+KLL0433HBDo77pTavjo01LhN0xoY6w/oQTTsgm4MUfAaIKPp47xhk92eM2UTEe7V+Kofhrr72WVa/HmLfZZps0YMCArA1MtGmJCXm8rmOOOSa7/XbbbZfd59Zbb80q1LfeeuvsC0EcdDWqaHbcccdlOkAqAAB0BhdffHE2F992222zIDxaMS5cuDDdcccd6dJLL22x0rxUHKMpvhNEe8nzzz8/bbLJJunFF1/MWsEsWLCg2T1pK0mQDgDQSURwnOfss8/O9uyIgwC98MILWRXJFltskU4++eTs+i9/+cvpscceSwcccEBW2R4H5Izq9D/+8Y+tGse0adNyK9kj6H/iiSfSVVddlVWzDBs2LO2xxx7Z+IptZuJAoNdff33Wx3z27NlZpXpU3ceku3ibmHxHxXn0fi/tfR7VLxHSR4V5BPOlvc979+6dfvKTn2Q/KMT10Spm//33TyeddFKrXiMAAHRk66yzTlbcct5556Wvf/3r6Y033si+S8ReoBGkL4tVVlkla8sYQXx815g8eXJW8LLnnnumX/7yl2nNNddM1aSuUEsd3ZdD7Oof1UdRUbW0L4/lFtVcU6ZMSYMHD86+sNG+rP/K6rTrf/bslIq7NFXwYKPVvP4jPDvuS59JF31hYFkq0p9/bXY67mfvpIt+fF1WiVotqvk96AzKvf7jwDhRGRGV17169SrLGDuymF5GNUq3bt3afNDPWpC3fVRyLlpJ5uB0ivdYj/R2e4/1SO94qubvmBXGe9zxv2cUKjznr8Qc3JYMAAAAAAA5tHYBKKfu3VP6xjfeOw0AAABAzROkA5RTjx4pfec7lR4FAAAAAGWktQsAAAAAAORQkQ5QTvX1KU2atPh0HF3aQVWgQ+ngx2hnOdkuAACg4xOkA5TTu++mtPbai0/PmpXSSitVekRAGXT/3zEP5syZk3r37l3p4VBlYrso3U4AAICOR5AOALAUXbt2TQMHDkxTpkzJzvfp0yfV1dVVelhVXaG9cOHC1K1btw69nuJ1Roge20VsH7GdAAAAHZMgHQBgGQwZMiT7tximkx8w19fXpy5dunToIL0oQvTi9gEAAHRMgnQAgGUQgfDQoUPT4MGD04IFCyo9nKoWIfpbb72VVllllSxM78iinYtKdAAA6PgE6QAArRChqeB06UF6BMy9evXq8EE6AADQOQjSAQAAAACqyRNntN9zbdb65zr88MPTVVddtcTlzz77bFpvvfXSK6+8ksaNG5duu+22NG3atGzv3v322y+dfvrp2Z6rRbvuumsaOXJkuuiii1K1UyIEAAAAAECrjBo1Kr3++uvpjTfeaFjWXnvt9MILL6StttoqC9V//etfp+eeey5ddtll6c4770zbb799evvtt1MtUpEOUE7duqX0la+8dxoAAACgA+rRo0caMmRIdjypUkcffXR23Z/+9KfUu3fv7LI111wzffCDH0zrrrtuOuWUU9Kll16aak1FU5577703fec730mPPPJI9ovFDTfckJX4l3rqqafSiSeemO655560cOHCtPHGG6ff/e532coHqDo9e6Y0YUKlRwEAdDJnnNH5nvuss9p2/11XWf6B77pL254bADqqt99+O91+++3p29/+dkOIXhSh+8EHH5yuvfbadMkllywRwFe7irZ2mT17dtp8883ThBZCp+effz7ttNNOacMNN0wTJ05MTzzxRDrttNOyA1cBAAAAAFAZt956a+rXr1/q27dvtnzmM5/J2rkUCoW00UYbNXufuPy///1vmjp1aqo1Fa1I33PPPbOlJVHmv9dee6Xzzz+/4bIo/weoWoVCStOmLT696qop1divqwAAAADLYtddd81atBQry1daaaU0adKk7HSE6Xmi9UutqdqDjdbX16dbbrklrb/++lnj+sGDB6dtt9023XjjjZUeGkDL5sxJafDgxUucBgAAAOiA+vTpk9Zbb72GZejQodm/EaxHu+7mxOWDBg1KAwcOTLWmao+EN2XKlDRr1qx07rnnpm9961vpvPPOS7fddlvaf//9091335122aX5pnTz5s3LlqIZM2Y0BPOxtKd4vvj1pb2fl8Ws/8qqlvU/bdq0hs+Bcujfv39aNSrNW1Jf3/ALZfbaK/D64zVPnz49zZw5M1vK0XNsqa+7FWK7iDEVUl2qL7R9bPE42eNVwfZWjX8DnZX1X1nW/3usAwAAOpNVVlklffSjH816oB9//PGN+qRPnjw5/epXv8oORlqLulX7l4599903W+lh5MiR6f7770+XXXZZi0H6+PHj05lnnrnE5dF3Z+7cuam9X0OEWfFFskuXqi3+77Cs/8qqhvUfz3/pD7+bFsydWbbH7N6rXzrqmG+kAQMGNHt93Zw5abWSz53C7NmpMq95Vhq02tA09c03sqh5Rb/u1ohwf/iI96eZXVdKUxa2/ZgXM7vOTcNHzM4eN36ErRbV8DfQmVn/lWX9vyc+mwAAoDO5+OKL0w477JB1GYkC6bXXXjv961//St/85jez7iOnn356qkVVG6RH5WO3bt3SxhtvvERD+vvuu6/F+40dOzaNGTOm4XxUog4fPjzbZSAqKtv7S2RUScZzd/YvkZVg/VdWNaz/2KvlhacfTcd/vGcaPqjxkaKXxytT303fu3le6tq1a9ZuqlklwXm89rTSSqkSr/m4j/dKA4eslPptPDVF7fcKf92tHOMrLz2b+i0amAZ3a/v6mbVodnrlpXeyA5yUY3wd6W+gM7P+K8v6f0+vXm3/wRAAAGrJ+9///vT3v/89nXHGGemzn/1sVvQWRTbRaeQXv/hF1hKmFlVtkB4N57feeuv0zDPPNLr8P//5T1prrbVavF/Pnj2zpan4EleJL3LxJbJSz43139nXf7Hdx5qDeqV1V2/7h3QE0oXC3IbX1aySy7PbtPNrL33NfVfpmQZ365O61BVW/OtejjHG47Z1bO+Nb3G7mGr7W6/030BnZ/1XlvW/WGd//QAALKfNzkjV7IorrkgLFy5s8foRI0akK6+8suH8uHHj0oUXXpieeOKJtN122zVcPnHixFQrKhqkR1Xic88913D+xRdfTI8//nhaeeWV05prrpmV+x9wwAHpQx/6UNptt92yHul/+MMfamoFAwAAAAB0ZmeeeWYWrj/44INpm222qcmCk4oG6Q8//HAWkBcVW7KMHj06+8Xik5/8ZNYPPfqef+1rX0sbbLBB+t3vfpd22mmnCo4aAAAAAIDWOPzww1Mtq2iQvuuuu2a74+f5whe+kC0ANaFbt/g18L3TAAAAANQ8KQ9AOcUxGkp6gAEAAABQ+2qvGQ0AAAAAQAextI4dVMc6E6QDlFN8kM+evXjxP0IAqlAcf2jrrbdO/fr1S4MHD0777bdfeuaZZxrdZu7cuenoo49Oq6yySurbt2/61Kc+ld58882KjRkAoCPq3r179u+cOXMqPZSaM+d/66y4DtuD1i4A5RQf5H37Lj49a1ZKK61U6REBQCP33HNPFpJHmL5w4cJ08sknpz322CP9+9//Tiv97/9bxx9/fLrlllvSddddlwYMGJC++tWvpv333z/99a9/rfTwAQA6jK5du6aBAwemKVOmZOf79OmT6urqUq1UhC9cuDB169atXccczxsheqyzWHexDtuLIB0AADqR2267rdH5K6+8MqtMf+SRR9KHPvShNH369HT55Zenq6++On34wx/ObnPFFVekjTbaKD344INpu+22q9DIAQA6niFDhmT/FsP0WlEoFFJ9fX3q0qVLRcL/CNGL6669CNIBAKATi+A8rLzyytm/EagvWLAg7b777g232XDDDdOaa66ZHnjgAUE6AEAZRQg9dOjQrLAh5mC1or6+Pr311ltZK8AI09tTtHNpz0r0IkE6AAB0UvEF6Ljjjks77rhj2mSTTbLLJk+enHr06JFV+ZRabbXVsuuaM2/evGwpmjFjRsPjx9Ke4vmKFVK0j/Ze1cX3OKW2PXFbjmZT39ZD4dg+a+bvuAqG0CFV03vMiuE9Xr5APeZgtaK+vj5r6xJjbu8gvfj8y3NdWwjSAQCgk4pe6f/85z/Tfffd1+YDmJ555plLXD516tTswKXtKb44RZV9fHmvxJe6Sunfv3LP3d57ohff4/79I81e/vd4Ye/lX2lT3l3uu/7vAWpr9/321vTvuDNt351FZ/2s7ky8xx1ffRW/xzNnzlwhjytIBwCATigOIHrzzTene++9N62xxhoNl0evyfnz56d33nmnUVX6m2++2WIfyrFjx6YxY8Y0qkgfPnx4GjRoUOrfzglYfKmLiq547mr7Urci/W8ngIoYPDhV5D2eMWNQm4L0bt2Xf6UN7r3cd63MSqsxTf+OO9P23Vl01s/qzsR73PHVV/F73KtXrxXyuIJ0AADoRKJq6Jhjjkk33HBDmjhxYlp77bUbXb/llltmfSfvvPPO9KlPfSq77JlnnkmTJk1K22+/fbOP2bNnz2xpKr5UVeKLVXypq9Rzd0aVWM2LD2oWT7z8T96Ww6J1aesx1WybNfN37K3q+O8xK473uOOrq9L3eEWNR5AOUE5xsItPf/q90wBQhe1crr766vT73/8+9evXr6Hv+YABA1Lv3r2zf4844oiswjwOQBoV5RG8R4juQKMAAHRWgnSAcordh667rtKjAIAWXXrppdm/u+66a6PLr7jiinTYYYdlp7/3ve9llTxRkR4HER01alS65JJLKjJeAACoBoJ0AADoZK1dlqWv5IQJE7IFAABoS0M5AAAAAADoBATpAOU0e3YcbWPxEqcBAAAAqHmCdAAAAAAAyCFIBwAAAACAHIJ0AAAAAADIIUgHAAAAAIAcgnQAAAAAAMghSAcAAAAAgBzd8q4EoJW6dk1pr73eOw0AAABAzROkA5RTr14p3XJLpUcBAAAAQBlp7QIAAAAAADlUpAMAAFA5T5zRutsXUkrv9k+7rDIj1a2oMQEANKEiHaCcZs9OaaWVFi9xGgAAAICapyIdoNzmzKn0CAAAAAAoIxXpAAAAAACQQ5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkKNb3pUAtFKXLintsst7pwEAAACoeYJ0gHLq3TuliRMrPQoAAAAAyki5JAAAAAAA5BCkAwAAAABAtQbp9957b9pnn33SsGHDUl1dXbrxxhtbvO2RRx6Z3eaiiy5q1zECtMrs2SkNGrR4idMAAAAA1LyKBumzZ89Om2++eZowYULu7W644Yb04IMPZoE7QNWbNm3xAgAAAECHUNGDje65557Zkue1115LxxxzTLr99tvT3nvv3W5jAwAAAACAigfpS1NfX58OOeSQ9M1vfjN94AMfWKb7zJs3L1uKZsyY0fBYsbSneL5CodDuz8ti1n9lVcP6j+ePllCFVJfqC3Vtf7xUt/jx8l5XfX3Drj7Zbdr59Ze+5kKhHV/3co6xGsfXkf4GOjPrv7Ks//dYBwAA0DFUdZB+3nnnpW7duqWvfe1ry3yf8ePHpzPPPHOJy6dOnZrmzp2b2vuL0/Tp07Mvkl26OK5re7P+K6sa1v/MmTPT8BHvTzO7rpSmLOzV9sfrOjcNHzE7e9wpU6Y0e5u6OXPSaiWfO4V27pNefM2zuvZNCxetmgqpkLrUrfjXXe3vS2f9G+jMrP/Ksv7fE59NAABA7avaIP2RRx5J3//+99Ojjz6aVRouq7Fjx6YxY8Y0qkgfPnx4GjRoUOrfv39q7y+RMfZ47s7+JbISrP/Kqob1P2vWrPTKS8+mfosGpsHdVmr74y2anV556Z3Ur1+/NHjw4OZvVBKcx2tPK7X9eZfnNfdd9L7Ut2uvNKjbq6lLXWHFv+5qf1866d9AZ2b9V5b1/55evdr+gyEAAFB5VRuk/+Uvf8kqC9dcc82GyxYtWpS+/vWvp4suuii99NJLzd6vZ8+e2dJUfImrxBe5+BJZqefG+u/s67/Y7iOaiLQ1TM4eL+q7/9eWpMXXVHJ5dpt2fu2lr7mubvHrbutrX6bXXe3vSyf9G+jsrP/Ksv4X6+yvn87hjDPadv9dV2nd7WP2sLB3FX+ZBQA6pKqde0Rv9N13373RZaNGjcouP/zwwys2LoBcEZhstdV7pwEAAACoeRUN0mP3/ueee67h/Isvvpgef/zxtPLKK2eV6Kus0rg0oXv37mnIkCFpgw02qMBoAZZB794p/f3vlR4FAAAAAB0lSH/44YfTbrvt1nC+2Nt89OjR6corr6zgyAAAAAAAoAqC9F133TXra7usWuqLDgAAAAAAK4oGvgDlNGdOSiNGLF7iNAAAAAA1r2oPNgpQk2Ivm5dffu80AAAAADVPRToAAAAAAOQQpAMAAAAAQA5BOgAAAAAA5BCkAwAAAABADkE6AAAAAADk6JZ3JQCtVFeX0sYbv3caAAAAgJonSAcopz59UvrXvyo9CgAAAADKSGsXAAAAAADIIUgHAAAAAIAcgnSAcpozJ6UPfGDxEqcBAAAAqHl6pAOUU6GQ0r///d5pAAAAAGqeIB0AAABqxBlnpE6hf/+UZsyo9CgA4D1auwAAAAAAQA4V6dBJTJ06Nc0oc0lH//7906BBg1JnMm/+gvTyyy+3eH3dnDlpnf+dfuGFF1KhT5+lPmZnXI8AAAAAtUSQDp0kRD/qiwelebPeKuvj9uy7Srr0p1d3mhD4rRnz0wsvvpzOPf2Y1LNnz2Zv03PRovTb/50+4ZjPp3lduy71cTvbegQAAACoNYJ06ASiEj1C9K/v0zMNH9S7LI/5ytR30wV/eCt77M4SAM96d1Hq0WVhOv7jPdL6wwc2e5u6uYtSumfx6fMPGZgKvfKD9M64HgEAAABqjSAdOpEI0dddfaUyPuK81BmtMahXy+sxgvTVFv9YsU7cZilBemdejwAAAAC1QpAOUE4RnF/zkUqPAgAAAIAy6lLOBwMAAAAAgI5GkA4AAAAAADkE6QDlNG9RSkf+ZfESpwEAAACoeXqkA5RTfSGlZ6a/dxoAAACAmqciHQAAAAAAcgjSAQAAAAAghyAdAAAAAAByCNIBAAAAACCHIB0AAAAAAHJ0y7sSgOUwoEelRwAAAABAGQnSAcqpd7eUbtyj0qMAAAAAoIwE6QAAANAKE+9p4/2vL9dIAID2okc6AAAAAADkEKQDlNO8RSkdd//iJU4DAAAAUPO0dgEop/pCSv94+73TAAAAANS8ilak33vvvWmfffZJw4YNS3V1denGG29suG7BggXpxBNPTJtuumlaaaWVstsceuih6fXXX6/kkAEAAAAA6GQqGqTPnj07bb755mnChAlLXDdnzpz06KOPptNOOy379/rrr0/PPPNM+sQnPlGRsQIAAAAA0DlVtLXLnnvumS3NGTBgQLrjjjsaXXbxxRenbbbZJk2aNCmtueaa7TRKAAAAAAA6s5rqkT59+vSsBczAgQNbvM28efOypWjGjBnZv/X19dnSnuL5CoVCuz8vi1n/74n1EH87hVSX6gt15XnMVLf4MVtYx9Ww/sv9uuNxunTpkv94hbqGXX2y2yzleZe2HtvymguF8r3uFTXGahxfuVTD30BnZv1XlvX/HusAAAA6hpoJ0ufOnZv1TD/wwANT//79W7zd+PHj05lnnrnE5VOnTs0eo72/OEX4H18kI3yjfVn/75k5c2YaPuL9aWbXldKUhb3K85hd56bhI2Znjz1lypSqXP/lft2L+gxI62/cJc3psXaasrD5z6G6hQvSav87PXXhGqmwsHub1uPyvuZZXfumhYtWTYVUSF3amFWvqDGW630p9/jKpRr+Bjoz67+yrP/3xGcTAABQ+2oiSI8Dj372s5/NvoxdeumlubcdO3ZsGjNmTKOK9OHDh6dBgwblBvAr6ktkVEnGc3f2L5GVYP2/Z9asWemVl55N/RYNTIO7rVSex1w0O73y0jupX79+afDgwVW5/sv9urvOmZb+8+8nUp/59Wlwt1Wbv1G3hanQq2t2clC3V1Pq1q1N63F5X3PfRe9Lfbv2ysbQpa7QtsdcQWMs1/tS7vGVSzX8DXRm1n9lWf/v6dWrPD9gAwAAldWtVkL0l19+Od11111LDcN79uyZLU3Fl7hKfJGLL5GVem6s/6Ji24toptHWULXhMaPW+X8tOlpav5Ve/+V+3fE4WTiU93h9uqb0x8XHflhcCF5o83pc3tdcV7d4nG197StyjOV6X8o5vnKq9N9AZ2f9V5b1v1hnf/0AANBRdKuFEP3ZZ59Nd999d1pllVUqPSQAAAAAADqZigbpsXv/c88913D+xRdfTI8//nhaeeWV09ChQ9OnP/3p9Oijj6abb745LVq0KE2ePDm7XVzfo0ePCo4cAAAAAIDOoqL7mj788MPpgx/8YLaE6G0ep08//fT02muvpZtuuim9+uqraeTIkVmwXlzuv//+Sg4boGXzF6V00kOLlzgNAFXm3nvvTfvss08aNmxY1oLnxhtvbHT9YYcdll1eunzsYx+r2HgBACB19or0XXfdNetr25K86wCq0qJCSn+b8t5pAKgys2fPTptvvnn6whe+kPbff/9mbxPB+RVXXNFwvrljEAEAQGdS1T3SAQCA8tpzzz2zJU8E50OGDGm3MQEAQLWraGsXAACg+kycODENHjw4bbDBBumoo45Kb731VqWHBAAAFaUiHQAAaNTWJVq+rL322un5559PJ598clbB/sADD6SuXbs2e5958+ZlS9GMGTOyf+vr67OlPcXzRYvI9n5ell9hOW5fXGqX7XPp66dQFevJR8mK4bO64/Med3z1Vfwer6gxCdIBAIAGn/vc5xpOb7rppmmzzTZL6667blal/pGPfKTZ+4wfPz6deeaZS1w+derUNHfu3NTeX5ymT5+efbHr0qXz7IDbv3+qWQt7t27wEa8u6tEnO12XalP//v87pg4tqE99+kz/37td2b/jiy6qzPMedFDq0DrrZ3Vn4j3u+Oqr+D2eOXPmCnlcQToAANCiddZZJ6266qrpueeeazFIHzt2bBozZkyjivThw4enQYMGpf7tnPDGl7q6urrsuavtS92K9L+dAGpSt+6tG3yxEr3buzNqNkifMWNwpYdQ5aKSsC7NmDGo4kF6pQzu4JtIZ/2s7ky8xx1ffRW/x7169VohjytIBwAAWvTqq69mPdKHDh2ae3DSWJqKL1WV+GIVX+oq9dy0Xt1y3qe41Cbb5tLV/W89dc511Rk+vnxWd3ze446vrkrf4xU1HkE6QDn17pbS3R+v9CgAoEWzZs3KqsuLXnzxxfT444+nlVdeOVuiRcunPvWpNGTIkKxH+gknnJDWW2+9NGrUqIqOGwAAKkmQDgAAncjDDz+cdtttt4bzxZYso0ePTpdeeml64okn0lVXXZXeeeedNGzYsLTHHnuks88+u9mKcwAA6CwE6QAA0Insuuuu2UGhWnL77be363gAAKAWCNIBymn+opTOeXzx6ZNHptSja6VHBAAAAEAbVVcneIBat6iQ0j1vLF7iNAAAAAA1T5AOAAAAAAA5BOkAAAAAAJBDkA4AAAAAADkE6QAAAAAAkKNb3pUArHjz5i9IL7/8clkeKx5n4cKFZXksAAAAABYTpANU0Fsz5qcXXnw5nXv6Malnz55tfrzZc+alNye/kuYtGJj6lmWEAAAAAAjSAcqpV9eUbv3Ye6eXYta7i1KPLgvT8R/vkdYfPrDNT//gU/9N3/75wrRokap0AAAAgHIRpAOUU11dSr1b/9G6xqBead3VV2rz07/85rttfgwAAAAAGnOwUQAAAAAAyKEiHaCc5i9K6cInF58es2lKPZbe3gUAAACA6iZIByinRYWUbn918eljN6n0aAAAlsmuq5yx3Ped+Nby37ezasv6DtY5ALQ/rV0AAAAAACCHIB0AAAAAAHII0gEAAAAAIIcgHQAAAAAAcgjSAQAAAAAghyAdAAAAAABydMu7EoBW6tU1pRs++t5pAAAAAGqeIB2gnOrqUhrYs9KjAAAAAKCMtHYBAAAAAIByB+kvvPDC8twNoOObvyili55cvMRpACgTc3AAAKixIH299dZLu+22W/rlL3+Z5s6dW/5RAdSqRYWUfv/y4iVOA0CZmIMDAECNBemPPvpo2myzzdKYMWPSkCFD0pe//OX00EMPlX90AABAxhwcAABqLEgfOXJk+v73v59ef/319LOf/Sy98cYbaaeddkqbbLJJuvDCC9PUqVPLP1IAAOjEzMEBAKBGDzbarVu3tP/++6frrrsunXfeeem5555L3/jGN9Lw4cPToYcemk3u89x7771pn332ScOGDUt1dXXpxhtvbHR9oVBIp59+eho6dGjq3bt32n333dOzzz7bliEDAEBNa+scHAAAaOcg/eGHH05f+cpXsqA7qmBiAv/888+nO+64I6uU2XfffXPvP3v27LT55punCRMmNHv9+eefn37wgx+kyy67LP3tb39LK620Uho1apSekAAAdFptnYMDAACt12057pNN2K+44or0zDPPpL322iv9/Oc/z/7t0mVxLr/22munK6+8Mo0YMSL3cfbcc89saU5Uo1900UXp1FNPbfgyEM+z2mqrZZXrn/vc55Zn6AAAUJPKNQcHAADaKUi/9NJL0xe+8IV02GGHZZUwzRk8eHC6/PLL0/J68cUX0+TJk7N2LkUDBgxI2267bXrggQcE6QAAdCrtMQcHAADKGKQvS5/yHj16pNGjR6flFSF6iAr0UnG+eF1z5s2bly1FM2bMyP6tr6/PlvYUzxeV9e39vCxm/b8n1kMch6CQ6lJ9oa48j5nqFj9mC+u4GtZ/uV93PE5U/eU+Xo9uKV39kfdOL+V5l+kxl3OMhUL5HnP+gkXppZdeytZpW7388stp0aL6sr7mvG2xUtrjb2DatGkN/58rh/79+6dVV101dQTV8BnUmVn/7ynnOmiPOTgV9sQZbbhzW+4LAMAKCdJjl9K+ffumz3zmM40ujwMezZkzp6KT9/Hjx6czzzxzicunTp3a7r3V44vT9OnTsy+SxV1uaT/W/3tmzpyZho94f5rZdaU0ZWGv8jxm17lp+IjZ2WNPmTKlKtd/uV/3oj4D0vobd0lzeqydpizs3/INizlkZCf1ZXrMVo7x3R5rp3cWrZoKqZC6tDGrfn3erNSzz8J07c8vSd27d2/zGOfOW5B69x2Q3k5rpL4L+67wbbFSVvTfQDz2pT/8blowd2bZHrN7r37pqGO+ke0BVuuq4TOoM7P+3xOfTeVSzXNwAADo6Lotb1j9ox/9qNldSb/0pS+VZRI/ZMiQ7N8333yz0a6rcX7kyJEt3m/s2LFpzJgxDeejUm/48OFp0KBBWaVde3+JjCrJeO7O/iWyEqz/98yaNSu98tKzqd+igWlwt5XK85iLZqdXXnon9evXL/vbr8b1X+7X3XXOtPSffz+R+syvT4O7ladqt9yPWXy83vMLaWDXAWlQt1dTl7q2VZH/651p6YWnn0hH7rpBWn/4wDaP8W9PvZPG/+WZ1GvugrK85qVti5Wyov8GYvt+4elH0/Ef75mGD+rd5sd7Zeq76Xs3z0tdu3atqvW4vKrhM6gzs/7f06tXeX7Abq85OAAAUMYgfdKkSdnBjJpaa621suvKIR4/wvQ777yzITiPUPxvf/tbOuqoo1q8X8+ePbOlqfgSV4kvcvElslLPjfVfVGx7EU1O2hqqNjxm1Dr/r3VKS+u30uu/3K87HicLh/Ieb0F9Spc/vfj0ERum1L1L2x9zOcdYV7f4Mdv6uMXHHD6oR1pv9T5tHuOkN+eU/TUvbVuslBX5N1Dcvtcc1CutW4b3ZfF6nFuV63F5VfozqLOz/hcr5+tvjzk4AADQvOWa2UfVyxNPPLHE5f/4xz/SKqus0qpquscffzxbigcYjdPxRSC+fB133HHpW9/6VrrpppvSk08+mQ499NA0bNiwtN9++y3PsAFWvIX1KV37wuIlTgNAmZRrDg4AALRTRfqBBx6Yvva1r2W70X/oQx/KLrvnnnvSsccemz73uc8t8+M8/PDDabfddms4X2zJErulXnnllemEE05Is2fPznZVfeedd9JOO+2UbrvttrLuIgsAALWgXHNwAACgnYL0s88+O7300kvpIx/5SOrWbfFDxG76UTF+zjnnLPPj7Lrrrtlu6S2JqvSzzjorWwAAoDMr1xwcAABopyC9R48e6dprr80m87Erae/evdOmm26a9WcEAADKzxwcAABqLEgvWn/99bMFAABoH+bgAABQI0H6okWLsh7md955Z5oyZUq2S2mpu+66q1zjAwAAzMEBAKD2gvQ4oFFM4vfee++0ySabZL3MAQCAFcccHAAAaixIv+aaa9JvfvObtNdee5V/RAC1rGfXlH62y3unAaBMzMEBAKAGDza63nrrlX80ALWuS11Ka/er9CgA6IDMwQEAoHK6LM+dvv71r6fvf//7qVAolH9EAADAEszBAQCgxirS77vvvnT33XenP/7xj+kDH/hA6t69e6Prr7/++nKND6C2LKhP6VfPLj598PtT6r5cv1cCwBLMwQEAoMaC9IEDB6ZPfvKT5R8NQK1bWJ/SVf8L0g9YV5AOQNmYgwMAQI0F6VdccUX5RwIAALTIHBwAAGosSA8LFy5MEydOTM8//3w66KCDUr9+/dLrr7+e+vfvn/r27VveUQIAAObgVe6MM9p2/11XKddI6Oh2XWX5N7aJb7VxQwWATmq5gvSXX345fexjH0uTJk1K8+bNSx/96EezSfx5552Xnb/sssvKP1IAAOjEzMEBAKBylqt577HHHpu22mqr9N///jf17t274fLo2XjnnXeWc3wAAIA5OAAA1F5F+l/+8pd0//33px49ejS6fMSIEem1114r19gAAID/MQcHAIAaq0ivr69PixYtWuLyV199Ndu9FAAAKC9zcAAAqLEgfY899kgXXXRRw/m6uro0a9asNG7cuLTXXnuVc3wAtaVH15Qu3WnxEqcBoEzMwQEAoMZau1xwwQVp1KhRaeONN05z585NBx10UHr22WfTqquumn7961+Xf5QAtaJrXUobDqz0KDqdefMXZAfhK6f+/funQYMGlfUxAdrCHBwAAGosSF9jjTXSP/7xj3TNNdekJ554IquEOeKII9LBBx/c6MBHALCivTVjfnrhxZfTuacfk3r27Fm2x+3Zd5V06U+vFqYDVcMcHAAAaixIz+7YrVv6/Oc/X97RANS6BfUp/e7Fxac/tXZK3ZergxatMOvdRalHl4Xp+I/3SOsPL8/eAK9MfTdd8Ie30owZMwTpQFUxBwcAgBoK0n/+85/nXn/ooYcu73gAatvC+pR+9NTi0/uuJUhvR2sM6pXWXX2lMj7ivDI+FkDbmYMDAECNBenHHntso/MLFixIc+bMST169Eh9+vQxiQcAgDIzBwcAgMpZrlLJ//73v42W6M/4zDPPpJ122smBjgAAYAUwBwcAgMopW8+B97///encc89dolIGAABYMczBAQCgfXQp98GPXn/99XI+JAAAkMMcHAAAqrRH+k033dTofKFQSG+88Ua6+OKL04477liusQEAAP9jDg4AADUWpO+3336NztfV1aVBgwalD3/4w+mCCy4o19gAAID/MQcHAIAaC9Lr6+vLPxKAjqBH15S+t917pwGgTMzBAQCgxoJ0AFrQtS6lkatWehQAAAAAVDpIHzNmzDLf9sILL1yepwAAAEqYgwMAQI0F6Y899li2LFiwIG2wwQbZZf/5z39S165d0xZbbNGobyNAp7KwPqU/TFp8ep81U+rWpdIjAqCDMAcHAIAaC9L32Wef1K9fv3TVVVel/2/vTsDsqOqEcf96SWcjC5AOBBJI2MEoigoPIgoDw/KhA+gzIqJGxg8EUYGIYHRYMohBHRweGQbUbwT9jwg6Iy4IjIAQRXYQ2QMYCKCBJECSDkk66e76P6dCd7qz3Cxd3Xfp981T6br31j116pxbdU/97qlTW265Zf7c66+/HieeeGIceOCB8cUvfrHofAJUh5UdEd95bNX8EeMF0gEojDY4AACUz2ZFeC655JKYMWNGVwM+SfNf+9rX8tcAAIBiaYMDAECVBdIXL14c8+fPX+v59FxLS0sR+QIAALrRBgcAgCoLpB977LH5JaQ///nP46WXXsqn//mf/4lPf/rT8aEPfaj4XAIAwACnDQ4AAFU2RvqVV14ZZ511VnzsYx/Lb3aUJ9TYmDfiv/WtbxWdRwAAGPC0wQEAoMp6pA8bNiz+4z/+I1599dX405/+lE+vvfZa/tzw4cMLy1x7e3uce+65MWnSpBg6dGjsvPPOceGFF0aWZYWtAwAAqkF/tcEBAICCeqR3mjt3bj69733vywPdKcBdV1cXRfnGN74RV1xxRfzwhz+Mt7zlLfHAAw/kl7OOGjUqvvCFLxS2HgAAqBZ93QYHAAAKCqSnXjAf+chH4vbbb88b7c8880zstNNO+WWlW265ZVxyySVRhLvuuiuOPvroOOqoo/LHEydOjJ/85Cdx3333FZI+QOGa6iO+/u7V8wBQkP5qgwMAAGvbrCjPmWeeGYMGDYoXXnghv8S003HHHRc333xzFOU973lP3HbbbfH000/nj//85z/HnXfeGUceeWRh6wAoVEN9xP7brJrSPAAUpL/a4AAAQEE90n/729/G//7v/8b48eN7PL/rrrvGnDlzoihf/vKXY/HixbHHHntEQ0NDPmb6RRddFCeccMJ639Pa2ppPndL7k46OjnzqT2l96VLb/l4vGy7/BQsWdH02ijBy5MgYM2ZMVKrOS76zqIuOrJhLv1NaeZrrKeNK+PwXvd0pnfr6+sLLscg0u6eXZZW53ZWeXmeaK1a2x/PPP7/Z9+VI72tpacmn9Dks+jjRF5/vUvt0tamEY9BApvxXK7IM+qsNDgAAFBRIf+ONN3r0gumUbnY0ePDgKMpPf/rT+PGPfxzXXHNNPkb6ww8/HGeccUZst912MWXKlHW+Z8aMGTF9+vS1np8/f34sX748+vvEadGiRfmJZAryEBVR/um5Ky7711i5vKWwdQ0aMiJO/fxZ+fj9lSgF8iZM3DVaGobHvLYhxaTZsDwmTHwjT3vevHkV+fkvervbh42K3faqj6VNk2Je28h1L9TWHkN/90w+u+zvdo1obOh9mpuRx2VNk2Jh+5jIIov6XsZY+yqPlZpe8rfWJTF4WFtc96P/yHt/bp66aN5mXMx/ZW4epi76OFH053tD+3S1qYRj0ECm/FdL+1RR+qsNDgAAFBRIP/DAA+NHP/pRXHjhhfnj1IMtnTB985vfjIMPPjiK8qUvfSnvlf7Rj340f/zWt741722TguXrC6RPmzYtpk6d2vU49TqeMGFCNDc3570B+1Mqk1Q2ad0D/SSyHNZX/kuWLInZTz0UZ35gcExoHtrr9bw4f1n82w2t+VUTY8eOjUqUtvnF55+JEe2jY2zj8GLSbH8jXnx+YYwYMWKd210Jn/+it7th6YJ4+olHYtiKjhjbuJ6exSvbov5ff5fPjjh4cERjY+/T3Iw8Dl2RxeiGUdHc+FLU121ej+q+zmOlppc8vnBBzH7qkTjloN1jtwmjN7uHdwpyj9hrfrw0f2nhx4miP98b2qerTSUcgwYy5b/akCHF/IDdn21wAACgoEB6aqwfcsgh8cADD8SKFSvi7LPPjscffzzvDfPHP/4xirJ06dK1Tr5SEKLUJbKpN866euSkdMpxIpdOcMq1btZd/p1DF+zQPCR23n5Y79eR+vxmy7vWVYk6tznltbdB1Z7bnZXc7nJ//ove7pROHhwqlV635/NlNrDejUpzM/NYV7cqzd6m25d5rMT0uqc5obkpdtnM40QabmVe2+AY2zgs6qOj8ONEX3y+N7RPV5tyH4MGOuW/SpHbX1Qb/Pe//31861vfigcffDDmzp0b119/fRxzzDFdr6djwfnnnx/f//73Y+HChXHAAQfEFVdckQ8hAwAAA9VmtewnT56c3wD0ve99bxx99NH5ZaYf+tCH4k9/+lPsvPPOhWXugx/8YD4m+m9+85t8nNrUyP/2t78dxx57bGHrAACAalBUGzy9b++9947LL798vQH773znO3HllVfGvffeG8OHD4/DDz+834dJBACAqu6RvnLlyjjiiCPyhvVXv/rV6EuXXXZZnHvuufHZz342H681jY3+mc98Js4777w+XS8AAFSSItvgRx55ZD6tS+qNfumll8Y///M/58H6JA0ns80228QvfvGLriEXAQBgoNnkQHq66dojjzwS/SGN05oa8mkCAICBqr/a4M8991y8/PLLceihh3Y9l26SvN9++8Xdd9+93kB6a2trPnW/T1GShskqNSxjX0jrSz8I9Pd6i9C7gbo6Bsy6s24Tm6OjSvKYVUle+0YVHsIGzLGajaOOa19HBddxX+Vps8ZI//jHPx7/+Z//GRdffHHxOQIAAMrSBk9B9CT1QO8uPe58bV1mzJgR06dPX+v5+fPn9/uQMOnEadEzv4rs+aVRX7cZCUz82Gave+TI6JW2oZufwAHje9f5qC02f90jR87r1+1O4dX2plX3MNmcKh7oevtZeXTx5u8jG68jhg1b9GZtD8x7bczr3W5V8fJj9aJFeRBuoN9PpVap49rXUcF13NLSUjmB9La2tvjBD34Qt956a7zzne/Mx03sLo1jDgAAFKeS2+DTpk2LqVOn9uiRPmHChGhubo6RvY0ub6L8BtRzlkbz0MWbF0gfO3az1/1mR/zN1jiolwmUyeLFm19mm7PdnT3RG5ctFkivwvreOKknYV0sXtw8YAPpvTgUVYX8WF1Xl39PVFoAjmKo49rXUcF1PGTIkPIH0mfPnh0TJ06Mxx57LPbZZ5/8uXTDo+5SAQIMWE31Eefvs3oeAHqpP9vg2267bf73lVdeiXHjxnU9nx6//e1vX+/7Bg8enE9rSidV5TixSsWRguibFUgv44lg9Z5J1ff7dtd1m+hv/bWP1L25roHZpq6wmFSfSN9d5fqeoH+o49pXV6F13Ff52aRA+q677hpz586N22+/PX983HHHxXe+8521Lv0EGLAa6iMO2q7cuQCghvRnG3zSpEl5MP22227rCpyn3uX33ntvnHrqqYWvDwAAqsUmBdLTmDfd3XTTTfHGG28UnScAAKCP2uBLliyJZ599tscNRh9++OHYaqutYocddogzzjgjvva1r+UB/BRYP/fcc2O77baLY445plfbAQAA1WyzxkhfX6MeYMBr74j4w5s3Yztw21U91AGgQL1tgz/wwANx8MEHdz3uHNt8ypQpcfXVV8fZZ5+dB+pPPvnkWLhwYbz3ve+Nm2++uc/GmgQAgJoLpKdxb9Ycf9GY6ADdrOiImP7Qqvkbj4gYKpAOQO8U3QY/6KCDSgbjU9r/8i//kk8AAMBmDu3yqU99qutGQsuXL49TTjklhg8f3mO5n//855uSLAAAsB7a4AAAUGWB9HS5Z3cf//jHi84PAADQjTY4AABUWSD9qquu6rucAAAAa9EGBwCA8jN4LwAAAAAAlCCQDgAAAAAAJQikAwAAAABAUWOkA7ABg+ojztl79TwAAAAAVU8gHaBIjfURR0wody4AAAAAKJDukgAAAAAAUIIe6VSF+fPnx+LFizfpPVmWRUtLSyxZsiTq6uq6np8zZ060tbX1QS4pRz2XUpa6bu+IuG/+qvl9myMa/F4JAAAAUO0E0qmK4Oqp//dj0brk1U16XwqeT5i4a7z4/DN5UL3TG0tb45WXX4zWlaP6ILf0dz2XUpa6XtER8ZX7V83feETEUIF0AAAAgGonkE7FSz2UU3D1ix8cHBOah270+7Koi5aG4TGifXTUxepA+j1Pvh4X/agt2tv1Sq+Fei5FXQMAAABQBIF0qkYKru68/fCNXr4jq4t5bUNibOPwqK9bHUif88qyPsoh5ajnUtQ1AAAAAEUw5gAAAAAAAJQgkA4AAAAAACUIpAMAAAAAQAkC6QAAAAAAUIKbjQIUaVB9xBcmr54HAAAAoOoJpAMUqbE+4tiJ5c4FAAAAAAXSXRIAAAAAAErQIx2gSO1ZxKOvrpp/69YRDXXlzhEAAAAAvSSQDlCkFe0RZ96zav7GIyKGOswCAAAAVDtDuwAAAAAAQAkC6QAAAAAAUIJAOgAAAAAAlCCQDgAAAAAAJQikAwAAAABACQLpAAAAAABQQmOpFwHYRI31EZ/Zc/U8AAAAAFWv4gPpf/3rX+Occ86Jm266KZYuXRq77LJLXHXVVfGud72r3FkDWNug+oiP7lzuXAAAZXLQ1hfEQDMQtxlq2QX9tEuPHBmxeHEMuO0GqldFB9Jff/31OOCAA+Lggw/OA+nNzc3xzDPPxJZbblnurAEAAAAAMEBUdCD9G9/4RkyYMCHvgd5p0qRJZc0TQEntWcQzi1bN7zoqoqGu3DkCAAAAoJYD6b/61a/i8MMPj3/8x3+MmTNnxvbbbx+f/exn46STTlrve1pbW/Op0+I3rxPq6OjIp/6U1rdw4cJoaWmJurpigmkjR46MMWPGRJEWLFjQVU5FWLFiRTQ1NRWW3pw5c6K9vSOyqIuObOPLMS2bZWu/J6VTX1+/yemtT0on1W+WZYV+xoqsl80tw95sd3puU8okLZunV3Aei67rDabX2h71p96Zz3b85siIoY1ly+O6Pv+9TXMgpFdUmt2PQX1xnCh6n+mrY1m5bOoxiGIp/9WUAQAA1IaKDqTPnj07rrjiipg6dWp85Stfifvvvz++8IUv5EHaKVOmrPM9M2bMiOnTp6/1/Pz582P58uXRn1IQ/WfX/n/x8kuz8xBFEQYNGRGnfv6sGDVqVCHpLVq0KK647F9j5fKWQtJbubItXlnwWowbu3U0NDQUkuby1pUxdItR8VqMjy3attjo93VkEYvax0QWWdR3izG1DxsVu+1VH0ubJsW8tpG9zl9Lw/KYMPGN/AeTefPmRSXWy+aWYW+2OwUO0nakQEoKSG4wvZaWmDBx12hpGB7z2oYUksei63pj0qtrWxnbvDk/v218ZG2DypLHZU2TYuE6Pv/VUo7lTK+oNLsfg/riOFH0PtMXeSynTT0GUSzlv1rapwAAgOrXWOknYemmol//+tfzx+94xzviscceiyuvvHK9gfRp06blgfdOqUdvGh4mja+eenP394nTK3+dHR+e/ELs0Nz7IMeL85fFv93Qmgeox44dW0gelyxZErOfeijO/MDgmNA8tNfp3fvkwpgxc1Z85sDdY7cJowvJY57mH2bFkOUrY2zjxvfGTz0007/mxpeivm71DxkNSxfE0088EsNWdGxSeuuzpP2NePH5hTFixIjKrpfNKMPebHfaf1Pv1rTvbUwQJW3zi88/EyPaR8fYxuGF5LHout6o9BrbumbTZy8aG8uSx6ErshjdMGqtz3/VlGMZ0ysqze7HoKXtS/rkOFHkPtMXx7Jy2tRjEMVS/qsNGVLMj8MAAEB5VXQgfdy4cbHXXnv1eG7PPfeM//mf/1nvewYPHpxPa0oncf19Itd5iXwKou+y/bDep5f6NWbL83SL2pbuedy5gDy+8MrS/OR5QnNTIdvcPc20/ZsaEKyrW/We7u9L6Wxueuuvl6wq6qWobd7Y7e58bWPKpXObi85j0XW9wfS6PZ8vs4H19mUe1/X5r5pyLGN6RabZWQd9eZyo5GNZuW3KMYjiKf9VBvr2AwBArajolv0BBxwQs2bN6vHc008/HTvuuGPZ8gQAAAAAwMBS0YH0M888M+655558aJdnn302rrnmmvje974Xp512WrmzBgAAAADAAFHRgfR3v/vdcf3118dPfvKTmDx5clx44YVx6aWXxgknnFDurAEAAAAAMEBU9BjpyQc+8IF8AqgKjfURU3ZdPQ8AAABA1av4QDpAVRlUH/Gp3cudCwAAAAAKpLskAAAAAACUoEc6QJE6sog5S1bN77hFRH1duXMEAAAAQC8JpAMUqbU94p9mrpq/8YiIoQ6zAAAAANXO0C4AAAAAAFCCQDoAAAAAAJQgkA4AAAAAACUYvBcAAACgglxwQblzAMCa9EgHAAAAAIASBNIBAAAAAKAEQ7sAFKmxPuK4nVbPAwAAAFD1BNIBijSoPuKUvcqdCwAAAAAKpLskAAAAAACUoEc6QJE6soh5y1bNjx0aUV9X7hwBAAAA0EsC6QBFam2POP53q+ZvPCJiqMMsAAAAQLUT4YECtK5YGXPmzCksvZRWW1tbYekBAAAAAJtPIB166dXFK2L2c3Pi4vM+H4MHDy4kzTeWtsYrL78YrStHFZIeAAAAALD5BNKhl5Ysa4+m+rY48wNNsduE0YWkec+Tr8dFP2qL9na90gEAAACg3ATSoSDjm4fEztsPLyStOa+8ebNKAAAAAKDs6sudAQAAAAAAqGQC6QAAAAAAUIKhXQCK1FAXcfSOq+cBAAAAqHoC6QBFamqIOOOt5c4FAAAAAAUytAsAAAAAAJSgRzpAkbIsYtGKVfOjmiLqDO8CAAAAUO0E0gGKtLw94thbVs3feETEUIdZAOhvjz4W0bgsYrN+zp55wWav96CtN/utAABUOEO7AAAAAABACQLpAAAAAABQgkA6AAAAAACUIJAOAAAAAAAlCKQDAAAAAEAJAukAAAAAAFBCY6kXAdhEDXURh49fPQ8AAABA1RNIByhSU0PEl99e7lwAAAAAUCBDuwAAAAAAQK0E0i+++OKoq6uLM844o9xZAVi3LItY1rZqSvMAAAAAVL2qCaTff//98d3vfjfe9ra3lTsrAOu3vD3i/9y8akrzAAAAAFS9qgikL1myJE444YT4/ve/H1tuuWW5swMAAAAAwABSFTcbPe200+Koo46KQw89NL72ta+VXLa1tTWfOi1evDj/29HRkU/9KcuyfCiaLOqiI6vrfXpRFytWtsfzzz+fp12EOXPmRHt7R6F5rK+vLyy93qSZls2ytd9TdB4raZv7O4+lPo/puZaWlnxK+0F/fxbLVo5ZXdcvlPkyG1hvX+ZxXZ//3qY5ENIrKs3ux6BqOX4XncdkxYoV0dTUVFh6I0eOjDFjxmxwufSdn7ajv7/7WUX5r1atZXDBBRfE9OnTezy3++67x1NPPVW2PAEAQDlVfCD92muvjYceeigf2mVjzJgxY61GfzJ//vxYvnx59HdP+jFjx8WShuExr21wr9P7W+uSGDysLa770X/EoEGDCsnj8taVMXSLUfFajI8t2rbodXrtw0bFbnvVx9KmSTGvbWQhedzcNDuyiEXtYyKLLOrr+i6PlbTN/ZnHDX8e66J5m3Ex/5W5eYiuvz+L5SrHuraVsc2b8/PbxkfWNqgseVzWNCkWruPzX4ufx0rdB7sfg6rh+N0XeVy5si1eWfBajBu7dTQ0NBSS5qAhI+LUz58Vo0aN2mDwctGiRXkwN/0oQv9S/qulH5Sr1Vve8pa49dZbux43Nlb8qQMAAPSZim4Nv/jii3H66afHLbfcEkOGDNmo90ybNi2mTp3ao0f6hAkTorm5Oe/F1t8nTgvmzY0t2ufH2MZhvU7v8YULYvZTj8QpB+0eu00YXUge731yYcz4w6wYsnxljG3ccA+/DWlYuiCefuKRGLaio5D0epNm6qGZ/jU3vhT1dVmf5bGStrk/87ihz2Pq3drSMDxG7DU/9Y3u989i2cqxsa1rNn32YgNBh77K49AVWYxuGLXW578WP4+Vug92PwY9uXB+xR+/++w7Zuas+MyBxaT54vxl8W83tOZB+bFjx24wkJuuhknf/wM9kFsOyn+1jW3DVqIUON92223LnQ0AAKgIFR1If/DBB2PevHmxzz77dD3X3t4ev//97+Pf//3f8yFc1uzhNnjw4HxaUzqJ6+8TuXxYlzS8S94jtPeXyad00onphOam2GX73gfmkxdeWbrqZLfgPBaVXm/TrKtb9Z7u7ys6j5W2zf2dx/V9HlMQMV2JkX5E2ph1Fv1ZLFs5dns+X2YD6+3LPK7r81+Ln8dK3gc766Cajt99kcei0kx5zLLl+ffrxnyndy430AO55aL8V6nm7X/mmWdiu+22y38M2H///fMrP3fYYYeKH14xH1poo66Ho1p11q86LpeOflpHquHqHB6L6qzjKh2NrWIZ6q/2dVRwHfdVnio6kH7IIYfEo48+2uO5E088MfbYY48455xzCrtMHAAAWG2//faLq6++Oh8Xfe7cufnQiQceeGA89thjMWLEiIoeXjGdOLU3rfrxrpg7Z1BpUuhNHZfPAeMv7bc6bhi5tKuOH138sT5fL/2pI4YNW/RmbVfGj87z5pU7B7XFUH+1r6OC67ivhles6EB6aqRPnjy5x3PDhw+Prbfeeq3nASpCQ13E+8etngeAKnTkkUd2zb/tbW/LA+s77rhj/PSnP41Pf/rTFT28Yjqpa1ixNBqXLRZkrVGdPdHV8cCq48WLSw/rRrVJvUXrYvHi5ooJpG9g5EA2kaH+al9HBddxXw2vWNGBdICq09QQccE7y50LACjU6NGjY7fddotnn312na9X0vCKSV23idqkjgdiHVdWkIYi1L1Zr5VRtxUWB6wJhvqrfXUVWsd9lZ+qC6Tfcccd5c4CAAAMKEuWLIm//OUv8YlPfKLcWQEAgLKorJ8LAACAsjvrrLNi5syZ8fzzz8ddd90Vxx57bH5/ouOPP77cWQMAgLKouh7pABVtWVvE/7l51fyNR0QMdZgFoPq89NJLedD81Vdfzce9fO973xv33HNPPg8AAAORCA8AANDDtddeW+4sAABARTG0CwAAAAAAlCCQDgAAAAAAJQikAwAAAABACQLpAAAAAABQgkA6AAAAAACU0FjqRQA2UUNdxH5jV88DAAAAUPUE0gGK1NQQcfG+5c4FAAAAAAUytAsAAAAAAJQgkA4AAAAAACUIpAMUaVlbxJE3rZrSPAAAAABVzxjpAEVb3l7uHAAAAABQIIF0AAAAACiDCy4YmOuGamRoFwAAAAAAKEEgHQAAAAAAShBIBwAAAACAEgTSAQAAAACgBDcbBShSfV3E3lutngcAAACg6gmkAxRpcEPEpe8pdy4AAAAAKJChXQAAAAAAoASBdAAAAAAAKEEgHaBIy9oijvntqinNAwAAAFD1jJEOULRFK8qdAwAAAAAKpEc6AAAAAACUIJAOAAAAAAAlCKQDAAAAAEAJAukAAAAAAFCCQDoAAAAAAJTQWOpFADZRfV3E7qNWzwMAAABQ9QTSAYo0uCHiygPLnQsAAAAACiSQDgAAAFS0g7a+oFfvv+PV3r2f2neBj8iAKG/1TG8YIx0AAAAAAEoQSAco0vL2iI/etmpK8wAAAABUvYoPpM+YMSPe/e53x4gRI2Ls2LFxzDHHxKxZs8qdLYB1y7KIV5atmtI8AAAAAFWv4gPpM2fOjNNOOy3uueeeuOWWW2LlypVx2GGHxRtvvFHurAEAAAAAMABU/M1Gb7755h6Pr7766rxn+oMPPhjve9/7ypYvAAAAAAAGhooPpK9p0aJF+d+tttpqna+3trbmU6fFixfnfzs6OvKpP2VZFnV1dZFFXXRkdb1PL+qivr6+sPT6Is1KymNaNsvWfk8tb3Ml5XF95V9JeeyT9LK6rkt98mU2sN6+zOOmlH+58liJ6RWVZvd9oFLz2Jfp9VUeV6xsj+effz7/ji25bJZFS0tLPqXv4lJWrFgRTU1NUZSRI0fGmDFjYiBLba5UB/3d9qpEygAAAGpDY7WdiJxxxhlxwAEHxOTJk9c7pvr06dPXen7+/PmxfPny6E9LliyJMWPHxZKG4TGvbXCv02sfNip226s+ljZNinltIwvJY9FpVlIeO7KIRe1jIoss6usGxjZXUh7XV/6VlMe+SK+ubWVs8+b8/LbxkbUNKkselzVNioWbUP7lyGOlpldUmt33gfZhIysyj32ZXl+k+bfWJTF4WFtc96P/iEGDSu9bEXXRvM24mP/K3DwEvz4rV7bFKwtei3Fjt46GhoYowqAhI+LUz58Vo0aNioEqtdlS54cUTE8/pgxk6cccAACg+lVVID2Nlf7YY4/FnXfeud5lpk2bFlOnTu3RI33ChAnR3Nyc9xDr7xOnBfPmxhbt82Ns47Bep9ewdEE8/cQjMWxFR4xtLKanW9FpVlIeU+/H9K+58aWor8sGxDZXUh7XV/6VlMc+Sa+xrWs2bXs0NpYlj0NXZDG6YdRGl3858lip6RWVZvd9oGHp/IrMY1+m1xdpPr5wQcx+6pE45aDdY7cJozfYe72lYXiM2Gt+uj5jvcvd++TCmDFzVnzmwA2nuTFenL8s/u2G1jwon4aiG8iB9HQlQGp/DfRA+pAhQ8qdBQAAYCAF0j/3uc/FDTfcEL///e9j/Pjx611u8ODB+bSmdBLX3ydy+bAuaXiXvEdo1vv0YtUl0kWl1xdpVloe6+pWvaf7+2p9myspj+sq/0rLY+HppcPMjlusmk3zG1hvX+ZxU8q/XHmsxPSKTLOzDio5j32VXl/mcUJzU+yy/bAN/pCRrgZLP2SXWvcLryzd6DQ3No9ZtjxvAwz0AHJnGQz0chjo2w8AALWi4gPpKRD9+c9/Pq6//vq44447YtKkSeXOEsD6DWmIuPqgcucCAAAAgIEUSE/DuVxzzTXxy1/+MkaMGBEvv/xy/nwad3To0KHlzh4AAAAAADWu4q81veKKK/KbVR100EExbty4rum6664rd9YAAAAAABgAqmJoF4Cqsbw94pQ/rJq/8sBVQ70AAAAAUNUqPpAOUFXSj39zlqyeBwAAAKDqVfzQLgAAAAAAUE4C6QAAAAAAUIJAOgAAAAAAlCCQDgAAAAAAJQikAwAAAABACY2lXgRgE9XVRWwzdPU8AAAAAFVPIB2gSEMaIq49pNy5AAAAAKBAhnYBAAAAAIASBNIBAAAAAKAEgXSAIrW2R5zyh1VTmgcAAACg6hkjHaBIHVnErEWr5wEAAACoenqkAwAAAABACQLpAAAAAABQgkA6AAAAAACUIJAOAAAAAAAluNkoAECBWlesjDlz5hSa5siRI6O5uTkGkvnz58fixYsLS28gliEAAFAcgXSAoo1qKncOgDJ5dfGKmP3cnLj4vM/H4MGDC0t38BZbxxX/75oBEwhOQfRT/+/HonXJq4WlOdDKEAAAKJZAOkCRhjZG/OKwcucCKJMly9qjqb4tzvxAU+w2YXQhab44f1lc8utX897ZAyUInLY1BdG/+MHBMaF5aK/TG4hlCAAAFEsgHQCgYOObh8TO2w8vMMXWGIhSEL24chyYZQgAABTDzUYBAAAAAKAEgXSAIrW2R5xx16opzQMAAABQ9QztAlCkjiziz6+tngcAAAa0g7a+YLPfe8erm/9e2JAL+vjjNXJkuvdN366D8tb1yA3UcV9/xvqbHukAAAAAAFCCQDoAAAAAAJQgkA4AAAAAACUIpAMAAAAAQAkC6QAAAAAAUEJjqRcB2AxDGsqdAwAAAAAKJJAOUKShjRE3HVnuXAAAAABQIEO7AAAAAABACQLpAAAAAABQgkA6QJFWtEd8+b5VU5oHAAAAoOoZIx2gSO1ZxL3zVs8DAAAAUPX0SAcAAAAAgGoPpF9++eUxceLEGDJkSOy3335x3333lTtLAABQ07TBAQCgigLp1113XUydOjXOP//8eOihh2LvvfeOww8/PObNe3PoBAAAoFDa4AAAUGWB9G9/+9tx0kknxYknnhh77bVXXHnllTFs2LD4wQ9+UO6sAQBATdIGBwCAKgqkr1ixIh588ME49NBDu56rr6/PH999991lzRsAANQibXAAAFhbY1SwBQsWRHt7e2yzzTY9nk+Pn3rqqXW+p7W1NZ86LVq0KP+7cOHC6OjoiP7U0tISK1e2xZMvLomWpW29Tu8vc5dFFnUx68Vl0daxuJA8Fp1mZeWxLloaWmJue3pPNkC2uZLyuO7yr6w8Fp9eXWt77PTm/Oy/tEQ2uKFseVxYt/HlX648VmJ6xaW5eh+o3Dz2XXrlz+PGHYOqoRz/+uqyWLZ8ZTz++OOxeHExafZXO2ju3Lmb9d4XX3wxlq9YmbehFi9tL6QM29o78vJLbcL+1FlnWda7Y3F/qvY2eFrfkmXLo3FZa9T165rpL2lvagt1XMv6oo5bW/v3+N/dkmWrj4/VlO++1RHLly+O1tamSu/jSY3VcT83BStGt2Zav9bxwjKVd1+1weuyCm7V/+1vf4vtt98+7rrrrth///27nj/77LNj5syZce+99671ngsuuCCmT5/ezzkFAIDSPw6MHz8+qoE2OAAAteDFgtvgFd0jfcyYMdHQ0BCvvPJKj+fT42233Xad75k2bVp+Y6TuPVJee+212HrrraOurq7ff/2YMGFCXmkjR47s13Wj/MtN+ZeX8i8/dVBeyr+8lP9qqc9K6p2/3XbbRbXQBqfSqePap45rnzqufeq49i2u4DruqzZ4RQfSm5qa4p3vfGfcdtttccwxx3Q1ytPjz33uc+t8z+DBg/Opu9GjR0c5pQ9TpX2gBhLlX17Kv7yUf/mpg/JS/uWl/FcZNWpUVBNtcKqFOq596rj2qePap45r38gKreO+aINXdCA9ST1bpkyZEu9617ti3333jUsvvTTeeOONOPHEE8udNQAAqEna4AAAUGWB9OOOOy7mz58f5513Xrz88svx9re/PW6++ea1bn4EAAAUQxscAACqLJCepEtI13cZaSVLl7eef/75a13mSv9Q/uWl/MtL+ZefOigv5V9eyr82aINTqdRx7VPHtU8d1z51XPsGD8A6rsvS6OsAAAAAAMA61a/7aQAAAAAAIBFIBwAAAACAEgTSAQAAAACgBIH0PnL55ZfHxIkTY8iQIbHffvvFfffdV+4s1aQZM2bEu9/97hgxYkSMHTs2jjnmmJg1a1aPZZYvXx6nnXZabL311rHFFlvEhz/84XjllVfKludadvHFF0ddXV2cccYZXc8p/77317/+NT7+8Y/nZTx06NB461vfGg888EDX6+lWGOedd16MGzcuf/3QQw+NZ555pqx5rhXt7e1x7rnnxqRJk/Ky3XnnnePCCy/My7yT8i/O73//+/jgBz8Y2223XX6s+cUvftHj9Y0p69deey1OOOGEGDlyZIwePTo+/elPx5IlS/p5S2qzDlauXBnnnHNOfgwaPnx4vswnP/nJ+Nvf/tYjDXVAX9IGrx0XXHBBfpzpPu2xxx5dr2tjVh/f47VvQ3X8qU99aq39+ogjjuixjDqu/fjLCy+8EEcddVQMGzYsT+dLX/pStLW19fPWsLl1fNBBB621H59yyikDpo4F0vvAddddF1OnTs3vXPvQQw/F3nvvHYcffnjMmzev3FmrOTNnzswP0vfcc0/ccsst+Un8YYcdFm+88UbXMmeeeWb8+te/jp/97Gf58umE/kMf+lBZ812L7r///vjud78bb3vb23o8r/z71uuvvx4HHHBADBo0KG666aZ44okn4pJLLoktt9yya5lvfvOb8Z3vfCeuvPLKuPfee/MAVzompUYOvfONb3wjrrjiivj3f//3ePLJJ/PHqbwvu+yyrmWUf3HSsT19p6ZA2bpsTFmnE7PHH388/8644YYb8hO+k08+uR+3onbrYOnSpXm7J/24lP7+/Oc/zxve//AP/9BjOXVAX9EGrz1vectbYu7cuV3TnXfe2fWaNmb18T1e+zZUx0kKnHffr3/yk5/0eF0d13b8JXVESgHWFStWxF133RU//OEP4+qrr85/RKM66jg56aSTeuzH6fg9YOo4o3D77rtvdtppp3U9bm9vz7bbbrtsxowZZc3XQDBv3rzUDTSbOXNm/njhwoXZoEGDsp/97Gddyzz55JP5MnfffXcZc1pbWlpasl133TW75ZZbsve///3Z6aefnj+v/PveOeeck733ve9d7+sdHR3Ztttum33rW9/qei7Vy+DBg7Of/OQn/ZTL2nXUUUdl//RP/9TjuQ996EPZCSeckM8r/76TjiPXX3991+ONKesnnngif9/999/ftcxNN92U1dXVZX/961/7eQtqrw7W5b777suXmzNnTv5YHdCXtMFry/nnn5/tvffe63xNG7P6+R4fmO2EKVOmZEcfffR636OOaz/+cuONN2b19fXZyy+/3LXMFVdckY0cOTJrbW0tw1awKXWcdI/5rEut17Ee6QVLv7g8+OCD+WVonerr6/PHd999d1nzNhAsWrQo/7vVVlvlf1NdpF/QutdHuiR0hx12UB8FSr9Ypl8cu5dzovz73q9+9at417veFf/4j/+YXzL1jne8I77//e93vf7cc8/Fyy+/3KMORo0alV/urg567z3veU/cdttt8fTTT+eP//znP+e95Y488sj8sfLvPxtT1ulvukQ47TOd0vLpezr1fKNvvpfT5Z6p3BN1QF/RBq9NaViPNETETjvtlPdSTZeKJ9qYtcf3+MBxxx135Octu+++e5x66qnx6quvdr2mjms//pL+pmEAt9lmm65l0pUnixcvzq9EoLLruNOPf/zjGDNmTEyePDmmTZuWX5naqdbruLHcGag1CxYsyC9j6P6BSdLjp556qmz5Ggg6OjrysbnTMBdpZ05SY6ypqanrBL57faTX6L1rr702v3w6De2yJuXf92bPnp0PLZIuZf/KV76S18MXvvCFvNynTJnSVc7rOiapg9778pe/nDcIUgOxoaEhP/5fdNFF+cl+ovz7z8aUdfqbTty6a2xszBuG6qN46VL8NGb68ccfn49zmqgD+oo2eO1JAdR0KXgKtqXLxqdPnx4HHnhgPPbYY9qYNcj3+MCQhnVJw3yk+wv95S9/yc9fUgeUFHhLbWl1XPvxl/R3Xft552tUdh0nH/vYx2LHHXfMf+h+5JFH8vZ+Gs4xDes4EOpYIJ2a6hWdGtbdx06kb7344otx+umn52NnpZt6UZ4vt9Rj4+tf/3r+OPVIT/tBGlsyBdLpWz/96U/zX+OvueaafBzXhx9+OG9spEaF8mcgS72RPvKRj+Q3jks/9gFsqs6ru5J0D54UWE8n7um7N92IEqg+H/3oR7vmU4/VtG/vvPPOeS/1Qw45pKx5Y9OIvwzcOj652z0L0n6cbhCd9t/041jan2udoV0Kli5tSL+krnlX4vR42223LVu+at3nPve5/EYkt99+e4wfP77r+VTm6VLfhQsX9lhefRQjXbqVbuC1zz775D0F0pRuTpFuEpTm06+Oyr9vpS+tvfbaq8dze+65Z9elz53l7JjUN9Ldx1Ov9HRSkBoRn/jEJ/Ib7KS7nSfKv/9sTFmnv2vedDDdPf61115TH30QRJ8zZ07+Q2tnb/REHdBXtMFrX+rhuNtuu8Wzzz6rjV+DfI8PTGnYpnT8Tvt1oo5rP/6S/q5rP+98jcqu43VJP3Qn3ffjWq5jgfSCpctY3vnOd+Zj5nbvMZoe77///mXNWy1KPd3SDn799dfH7373u/wSse5SXQwaNKhHfaRLTlKQUX30XvrV8dFHH8174XZOqXd0Gtaic1759610mVUq0+7SeN2px1aS9on0ZdW9DtJQJGmMQXXQe2ksuDRmY3cpkJOO+4ny7z8bU9bpb2rYpx8BO6XvjlRfnQ1Aigmip3GNb7311th66617vK4O6Cva4LVvyZIleW+31IlAG7/2+B4fmF566aV8jPS0XyfquPbjL+lviiF0/8Gks+PFmh3EqLw6XpcU+0m678c1XcflvttpLbr22mvzu4tfffXV+V2nTz755Gz06NE97lhLMU499dRs1KhR2R133JHNnTu3a1q6dGnXMqecckq2ww47ZL/73e+yBx54INt///3zib6x5h2clX/fuu+++7LGxsbsoosuyp555pnsxz/+cTZs2LDsv/7rv7qWufjii/Nj0C9/+cvskUceyY4++uhs0qRJ2bJly8qa91owZcqUbPvtt89uuOGG7Lnnnst+/vOfZ2PGjMnOPvvsrmWUf3FaWlqyP/3pT/mUmjDf/va38/k5c+ZsdFkfccQR2Tve8Y7s3nvvze68885s1113zY4//vgyblXt1MGKFSuyf/iHf8jGjx+fPfzwwz2+l1tbW7vSUAf0FW3w2vLFL34xb+On79c//vGP2aGHHpp/x86bNy9/XRuz+vgeH9h1nF4766yzsrvvvjvfr2+99dZsn332yetw+fLlXWmo49qOv7S1tWWTJ0/ODjvssLy9ePPNN2fNzc3ZtGnTyrRVbEodP/vss9m//Mu/5HWb9uN0vN5pp52y973vfQOmjgXS+8hll12WHzyampqyfffdN7vnnnvKnaWalL6c1zVdddVVXcukhtdnP/vZbMstt8wDjMcee2x+IKB/AunKv+/9+te/zr+oUvBgjz32yL73ve/1eL2joyM799xzs2222SZf5pBDDslmzZpVtvzWksWLF+ef93S8HzJkSN6I+OpXv9ojaKj8i3P77bev85ifftDY2LJ+9dVX85OxLbbYIhs5cmR24okn5id29L4OUmN6fd/L6X2d1AF9SRu8dhx33HHZuHHj8rpMP1qnx+kEvpM2ZvXxPT6w6zgF4lJgLQXUBg0alO24447ZSSedtNaPneq49uMvzz//fHbkkUdmQ4cOzX8gTT+crly5sgxbxKbW8QsvvJAHzbfaaqv8OL3LLrtkX/rSl7JFixYNmDquS/+Vu1c8AAAAAABUKmOkAwAAAABACQLpAAAAAABQgkA6AAAAAACUIJAOAAAAAAAlCKQDAAAAAEAJAukAAAAAAFCCQDoAAAAAAJQgkA4AAAAAACUIpANUqeeffz7q6uri4Ycf7rN1fOpTn4pjjjmmz9IHAIBqog0OMHAJpAOUQWocpwb4mtMRRxyx0WlMmDAh5s6dG5MnT45K9+yzz8aJJ54Y48ePj8GDB8ekSZPi+OOPjwceeKCQ9C+44IJ4+9vfXkhaAADUJm1wbXCA3mjs1bsB2GypwX7VVVf1eC41cDdWQ0NDbLvttlHpUkP9kEMOyU82vvvd78Yee+wRLS0t8ctf/jK++MUvxsyZM8udRQAABghtcG1wgM2lRzpAmaQGe2qEd5+23HLLrtdT75grrrgijjzyyBg6dGjstNNO8d///d/rvaz09ddfjxNOOCGam5vz5XfdddceJwmPPvpo/N3f/V3+2tZbbx0nn3xyLFmypOv19vb2mDp1aowePTp//eyzz44sy3rkuaOjI2bMmJH3Zknp7L333j3ytKb0/tTzJ+XlD3/4Qxx11FGx88475z1Xzj///Lwhv7H5u+OOO2LfffeN4cOH53k84IADYs6cOXH11VfH9OnT489//nNXr6L0HAAArEkbXBscYHMJpANUsHPPPTc+/OEP5w3U1ED/6Ec/Gk8++eR6l33iiSfipptuypdJJwBjxozJX3vjjTfi8MMPz08S7r///vjZz34Wt956a3zuc5/rev8ll1ySN35/8IMfxJ133hmvvfZaXH/99T3WkRrwP/rRj+LKK6+Mxx9/PM4888z4+Mc/vt4eLekEIy2Xer3U16/9lZMa4xuTv7a2tnycyPe///3xyCOPxN1335038lOD/bjjjsvTf8tb3pJfZpum9BwAAGwObXBtcIB1ygDod1OmTMkaGhqy4cOH95guuuiirmXSIfqUU07p8b799tsvO/XUU/P55557Ll/mT3/6U/74gx/8YHbiiSeuc33f+973si233DJbsmRJ13O/+c1vsvr6+uzll1/OH48bNy775je/2fX6ypUrs/Hjx2dHH310/nj58uXZsGHDsrvuuqtH2p/+9Kez448/fp3rve666/I8PvTQQyXLY0P5e/XVV/N07rjjjnW+//zzz8/23nvvkusAAGBg0wbftPxpgwP0ZIx0gDI5+OCD8x4r3W211VY9Hu+///5rPe68jHRNp556at5z5qGHHorDDjss7z3ynve8J38t9Y5Jl4CmSzI7pcsy02Wis2bNiiFDhuS9SPbbb7+u1xsbG+Nd73pX16Wl6WZFS5cujb//+7/vsd4VK1bEO97xjnXmac3LUtdnQ/l73/vel1+emnrMpPUfeuih8ZGPfCTGjRu3UekDAECiDb6aNjjApjG0C0CZpAbrLrvs0mNasxG/KdI4jmm8wnSp59/+9rf85kJnnXVWYfntHCvxN7/5TX4i0TmlS1nXN0bjbrvtlv996qmner3+NNZkupw0nZhcd911edr33HNPr9MFAGDg0AbfNNrgAKsJpANUsDUbqenxnnvuud7l002OpkyZEv/1X/8Vl156aXzve9/Ln0/vSWM8pnEQO/3xj3/Mx0zcfffdY9SoUXnPknvvvbfr9TQm4oMPPtj1eK+99spvzvTCCy+sdfIxYcKEdeYn3dAovS+N/Zh6tqxp4cKFG5W/TqnXzbRp0+Kuu+6KyZMnxzXXXJM/39TUlN+oCQAAeksbXBscYF0E0gHKpLW1NV5++eUe04IFC3osk274k2489PTTT8f5558f9913X4+bE3V33nnnxS9/+cv88s90c6Ebbrihq8GfbpKULh1NDfzHHnssbr/99vj85z8fn/jEJ2KbbbbJlzn99NPj4osvjl/84hd575XPfvazXY3sZMSIEXnvmtTb5oc//GH85S9/yS9hveyyy/LH65JuRJR6saT8H3jggXHjjTfG7Nmz85sVXXTRRXH00UdvVP6ee+65vPGeesOkHj+//e1v45lnnunavokTJ+bLpN45qQxT2QIAwJq0wbXBATbbGmOmA9BPNzpKh+A1p913371rmfT48ssvz/7+7/8+Gzx4cDZx4sT8xkGd1rzR0YUXXpjtueee2dChQ7Otttoqv0HR7Nmzu5Z/5JFHsoMPPjgbMmRI/vpJJ52UtbS09Lix0emnn56NHDkyGz16dDZ16tTsk5/8ZNeNjpKOjo7s0ksvzfM5aNCgrLm5OTv88MOzmTNnltzeWbNm5Wltt912WVNTU7bjjjvmN0fqfgOkUvlLNzs65phj8psxdb7/vPPOy9rb27tuwvThD384z3cqk6uuuqqXNQQAQK3RBtcGB+iNuvTf5ofhAegrqSfJ9ddfn9+wCAAA6Hva4ACsj6FdAAAAAACgBIF0AAAAAAAowdAuAAAAAABQgh7pAAAAAABQgkA6AAAAAACUIJAOAAAAAAAlCKQDAAAAAEAJAukAAAAAAFCCQDoAAAAAAJQgkA4AAAAAACUIpAMAAAAAQAkC6QAAAAAAEOv3/wNEiiKaADXWLwAAAABJRU5ErkJggg==",
      "text/plain": [
       "<Figure size 1500x1000 with 4 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "成本统计信息 (Cost Statistics):\n",
      "==================================================\n",
      "CPO:     Mean=84.19, Std=48.47, Min=0.00, Max=253.60\n",
      "ActSafe: Mean=51.09, Std=26.57, Min=10.40, Max=249.80\n",
      "FQI:     Mean=53.03, Std=25.80, Min=0.00, Max=127.50\n"
     ]
    }
   ],
   "source": [
    "# 直方图 (Histogram) 绘制成本分布\n",
    "import matplotlib.pyplot as plt\n",
    "import numpy as np\n",
    "\n",
    "# 创建子图\n",
    "fig, axes = plt.subplots(2, 2, figsize=(15, 10))\n",
    "fig.suptitle('成本分布直方图 (Cost Distribution Histograms)', fontsize=16, fontweight='bold')\n",
    "\n",
    "# # 1. CPO 成本直方图\n",
    "# axes[0, 0].hist(cost_curve, bins=30, alpha=0.7, color='blue', edgecolor='black')\n",
    "# axes[0, 0].set_title('CPO 成本分布', fontsize=12, fontweight='bold')\n",
    "# axes[0, 0].set_xlabel('Episode Cost')\n",
    "# axes[0, 0].set_ylabel('Frequency')\n",
    "# axes[0, 0].grid(True, alpha=0.3)\n",
    "# axes[0, 0].axvline(np.mean(cost_curve), color='red', linestyle='--', \n",
    "#                    label=f'Mean: {np.mean(cost_curve):.2f}')\n",
    "# axes[0, 0].legend()\n",
    "\n",
    "# # 2. ActSafe 成本直方图\n",
    "# axes[0, 1].hist(act_cost_curve, bins=30, alpha=0.7, color='green', edgecolor='black')\n",
    "# axes[0, 1].set_title('ActSafe 成本分布', fontsize=12, fontweight='bold')\n",
    "# axes[0, 1].set_xlabel('Episode Cost')\n",
    "# axes[0, 1].set_ylabel('Frequency')\n",
    "# axes[0, 1].grid(True, alpha=0.3)\n",
    "# axes[0, 1].axvline(np.mean(act_cost_curve), color='red', linestyle='--', \n",
    "#                    label=f'Mean: {np.mean(act_cost_curve):.2f}')\n",
    "# axes[0, 1].legend()\n",
    "\n",
    "# 3. FQI 成本直方图\n",
    "axes[1, 0].hist(fqi_cost_curve, bins=30, alpha=0.7, color='orange', edgecolor='black')\n",
    "axes[1, 0].set_title('FQI 成本分布', fontsize=12, fontweight='bold')\n",
    "axes[1, 0].set_xlabel('Episode Cost')\n",
    "axes[1, 0].set_ylabel('Frequency')\n",
    "axes[1, 0].grid(True, alpha=0.3)\n",
    "axes[1, 0].axvline(np.mean(fqi_cost_curve), color='red', linestyle='--', \n",
    "                   label=f'Mean: {np.mean(fqi_cost_curve):.2f}')\n",
    "axes[1, 0].legend()\n",
    "\n",
    "# 4. 所有算法对比直方图\n",
    "axes[1, 1].hist(cost_curve, bins=20, alpha=0.5, label='CPO', color='blue')\n",
    "# axes[1, 1].hist(act_cost_curve, bins=20, alpha=0.5, label='ActSafe', color='green')\n",
    "axes[1, 1].hist(fqi_cost_curve, bins=20, alpha=0.5, label='FQI', color='orange')\n",
    "axes[1, 1].set_title('Cost Comparsion Histogram', fontsize=12, fontweight='bold')\n",
    "axes[1, 1].set_xlabel('Episode Cost')\n",
    "axes[1, 1].set_ylabel('Frequency')\n",
    "axes[1, 1].legend()\n",
    "axes[1, 1].grid(True, alpha=0.3)\n",
    "\n",
    "plt.tight_layout()\n",
    "plt.show()\n",
    "\n",
    "# 打印统计信息\n",
    "print(\"成本统计信息 (Cost Statistics):\")\n",
    "print(\"=\" * 50)\n",
    "print(f\"CPO:     Mean={np.mean(cost_curve):.2f}, Std={np.std(cost_curve):.2f}, Min={np.min(cost_curve):.2f}, Max={np.max(cost_curve):.2f}\")\n",
    "print(f\"ActSafe: Mean={np.mean(act_cost_curve):.2f}, Std={np.std(act_cost_curve):.2f}, Min={np.min(act_cost_curve):.2f}, Max={np.max(act_cost_curve):.2f}\")\n",
    "print(f\"FQI:     Mean={np.mean(fqi_cost_curve):.2f}, Std={np.std(fqi_cost_curve):.2f}, Min={np.min(fqi_cost_curve):.2f}, Max={np.max(fqi_cost_curve):.2f}\")\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "py310",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.18"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
