{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "67576132",
   "metadata": {},
   "outputs": [],
   "source": [
    "from math import inf\n",
    "import numpy as np\n",
    "import scipy\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "import torch.optim as optim\n",
    "import gymnasium as gym\n",
    "import pandas as pd\n",
    "from datetime import datetime\n",
    "from sklearn.base import BaseEstimator\n",
    "from realkd.boosting import WeightUpdateMethod\n",
    "from pandas import qcut\n",
    "from realkd.rules import SquaredLoss, AdditiveRuleEnsemble, Rule\n",
    "from realkd.search import Context\n",
    "\n",
    "import warnings"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "8b8f01e2",
   "metadata": {},
   "outputs": [],
   "source": [
    "# warnings.filterwarnings('ignore')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "db545637",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n"
     ]
    }
   ],
   "source": [
    "# CartPole-v1 environment, created with the rgb_array render mode.\n",
    "env = gym.make('CartPole-v1', render_mode='rgb_array')\n",
    "# Run torch models on the GPU when CUDA is reported as available, otherwise on the CPU.\n",
    "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "print(device)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "7aa6c889",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Column labels used whenever the 4-component state vectors are wrapped in a DataFrame.\n",
    "# NOTE(review): presumably cart position, cart velocity, pole angle, pole angular velocity - confirm.\n",
    "column_names = ['cp', 'cv', 'pa', 'pav']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "24f75485",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<torch._C.Generator at 0x7f33cbd05410>"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Seed NumPy's global RNG and torch's default generator.\n",
    "np.random.seed(753894)\n",
    "torch.manual_seed(3921840)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "84732b72",
   "metadata": {},
   "outputs": [],
   "source": [
    "def orthonormalization(Q):\n",
    "    \"\"\"\n",
    "    Column-by-column Gram-Schmidt orthonormalisation of a matrix.\n",
    "\n",
    "    Every column has its projection onto the previously produced columns removed and is\n",
    "    then divided by its L-2 norm plus 1e-6, so a zero column stays zero instead of\n",
    "    triggering a division by zero.\n",
    "    :param Q: 2-d array whose columns are to be orthonormalised\n",
    "    :return: array of the same shape holding the processed columns\n",
    "    \"\"\"\n",
    "    num_rows, num_cols = Q.shape\n",
    "    basis = np.zeros(shape=(num_rows, num_cols))\n",
    "    first = Q[:, 0]\n",
    "    basis[:, 0] = first / (norm(first) + 1e-6)\n",
    "    for col in range(1, num_cols):\n",
    "        done = basis[:, :col]\n",
    "        column = Q[:, col]\n",
    "        # Remove the part of the column that lies in the span of the finished columns.\n",
    "        residual = column - done @ (done.T @ column)\n",
    "        basis[:, col] = residual / (norm(residual) + 1e-6)\n",
    "    return basis"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "973f1f9b",
   "metadata": {},
   "outputs": [],
   "source": [
    "def softmax1(action, values, other_values, location):\n",
    "    all_values = np.insert(other_values, location, values, axis=1)\n",
    "    exps = np.exp(all_values)\n",
    "    res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
    "    return res\n",
    "\n",
    "def norm(x):\n",
    "    \"\"\"\n",
    "    Calculate the L-2 norm of a vector\n",
    "    :param x: the vector whose L-2 norm is to be calculated\n",
    "    :return: the L-2 norm of the vector\n",
    "    \"\"\"\n",
    "    return (x * x).sum() ** 0.5\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "5b0af6ac",
   "metadata": {},
   "outputs": [],
   "source": [
    "class PiLoss:\n",
    "    _instance = None\n",
    "\n",
    "    def __new__(cls):\n",
    "        if cls._instance is None:\n",
    "            cls._instance = super(PiLoss, cls).__new__(cls)\n",
    "        return cls._instance\n",
    "\n",
    "    @staticmethod\n",
    "    def __call__(action, values, advantage, other_values, current):\n",
    "        \"\"\"\n",
    "        :param action: the action chosen\n",
    "        :param values: the values provided by current model\n",
    "        :param other_values: the output by other models\n",
    "        :param current: the action represented by the current model\n",
    "        \"\"\"\n",
    "        sm = softmax1(action, values, other_values, current)+1e-6\n",
    "        return -np.log(sm) * advantage\n",
    "\n",
    "    @staticmethod\n",
    "    def g(action, values, advantage, other_values, current):\n",
    "        return np.where(action == current, -advantage * (1 - softmax1(current, values, other_values, current)),\n",
    "                        advantage * softmax1(current, values, other_values, current))\n",
    "\n",
    "    @staticmethod\n",
    "    def h(action, values, advantage, other_values, current):\n",
    "        sm = softmax1(current, values, other_values, current)\n",
    "        return advantage * sm * (1 - sm)\n",
    "\n",
    "    @staticmethod\n",
    "    def __repr__():\n",
    "        return 'pi_loss'\n",
    "\n",
    "    @staticmethod\n",
    "    def __str__():\n",
    "        return 'pi_loss'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "67942365",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Registry that maps string identifiers to loss objects.\n",
    "loss_functions = dict(pi_loss=PiLoss())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "693287f4",
   "metadata": {},
   "outputs": [],
   "source": [
    "def loss_function(loss):\n",
    "    \"\"\"Provides loss functions from string representation.\n",
    "\n",
    "    :param loss: string identifier of loss function loss function\n",
    "    :return: loss function matching corresponding to input string (or unchanged input if was already loss function)\n",
    "    \"\"\"\n",
    "    if callable(loss):\n",
    "        return loss\n",
    "    else:\n",
    "        return loss_functions[loss]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "ae0af97c",
   "metadata": {},
   "outputs": [],
   "source": [
    "def calc_risk(loss, action, rules, states, reg, advantage, others, current):\n",
    "    weights = np.array([rule.y for rule in rules])\n",
    "    risk = sum(loss(action, rules(states), advantage, others, current)) + reg * sum(weights * weights) / 2\n",
    "    return risk"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "d06dc96b",
   "metadata": {},
   "outputs": [],
   "source": [
    "class FullyCorrectiveA2C:\n",
    "    def __init__(self, loss='pi_loss', reg=1.0, solver='L-BFGS-B'):\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        self.solver = solver\n",
    "\n",
    "    @staticmethod\n",
    "    def get_risk(loss, action, q_mat, reg, advantage, others, current):\n",
    "        def sum_loss(weights):\n",
    "            return sum(loss(action, q_mat.dot(weights), advantage, others, current)) + reg * sum(weights * weights) / 2\n",
    "\n",
    "        return sum_loss\n",
    "\n",
    "    @staticmethod\n",
    "    def get_gradient(g, action, q_mat, reg, advantage, other, current):\n",
    "        def gradient(weights):\n",
    "            grad_vec = g(action, q_mat.dot(weights), advantage, other, current)\n",
    "            return q_mat.T.dot(grad_vec) + reg * weights\n",
    "\n",
    "        return gradient\n",
    "\n",
    "    @staticmethod\n",
    "    def get_hessian(h, action, q_mat, reg, advantage, other, current):\n",
    "        def hessian(weights):\n",
    "            h_vec = h(action, q_mat.dot(weights), advantage, other, current)\n",
    "            return q_mat.T.dot(np.diag(h_vec)).dot(q_mat) + np.diag([reg] * len(weights))\n",
    "\n",
    "        return hessian\n",
    "\n",
    "    def calc_weight(self, data, action, rules, advantage, other, current):\n",
    "        g = self.loss.g\n",
    "        h = self.loss.h\n",
    "        loss = self.loss\n",
    "        y = np.array(action)\n",
    "        q_mat = np.column_stack(\n",
    "            [rules[i].q(data) + np.zeros(len(data)) for i in range(len(rules))])\n",
    "        sum_loss = self.get_risk(loss, y, q_mat, self.reg, advantage, other, current)\n",
    "        gradient = self.get_gradient(g, y, q_mat, self.reg, advantage, other, current)\n",
    "        hessian = self.get_hessian(h, y, q_mat, self.reg, advantage, other, current)\n",
    "        if self.solver == 'GD':  # Gradient descent\n",
    "            w = np.array([r.y for r in rules])\n",
    "            old_w = np.ones_like(w) * (1.0 if len(w) - sum(w) > 1e-5 else 2.0)\n",
    "            i = 0\n",
    "            while norm(old_w - w) > 1e-3 and i < 50:\n",
    "                old_w = np.array(w)\n",
    "                if norm(gradient(w)) == 0:\n",
    "                    break\n",
    "                p = -gradient(w) / norm(gradient(w))\n",
    "                w += GoldenRatioSearch(sum_loss, old_w, p, gradient).run() * p\n",
    "                i += 1\n",
    "        elif self.solver == 'Line':\n",
    "            w = np.array([r.y for r in rules])\n",
    "            if norm(gradient(w)) != 0:\n",
    "                p = -gradient(w) / norm(gradient(w))\n",
    "                distance = GoldenRatioSearch(sum_loss, w, p, gradient).run()\n",
    "                w += distance * p\n",
    "        else:\n",
    "            w = np.array([r.y for r in rules])\n",
    "            w = scipy.optimize.minimize(sum_loss, w, method=self.solver, jac=gradient,  # hess=hessian,\n",
    "                                        options={'disp': False}).x\n",
    "\n",
    "        return w"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "2d0c04a8",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ObjectFunction:\n",
    "    \"\"\"\n",
    "    Base class of rule-search objectives built from per-sample loss derivatives.\n",
    "\n",
    "    On construction the first derivative g and the second derivative h (offset by 1e-6)\n",
    "    of the loss are evaluated; data, target, g and h are stored sorted by descending g / h.\n",
    "    Subclasses supply ``__call__`` (value of an extent) and ``bound``.\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, data, target, predictions, loss, reg, advantage, other_values, current, rules=None):\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        if predictions is None:\n",
    "            predictions = np.zeros_like(target)\n",
    "        grad = np.array(self.loss.g(target, predictions, advantage, other_values, current))\n",
    "        hess = np.array(self.loss.h(target, predictions, advantage, other_values, current)) + 1e-6\n",
    "        # Positions of the samples from the largest to the smallest ratio g / h.\n",
    "        ranking = np.argsort(grad / hess)[::-1]\n",
    "        self.g = grad[ranking]\n",
    "        self.h = hess[ranking]\n",
    "        self.data = data.iloc[ranking].reset_index(drop=True)\n",
    "        self.target = target.iloc[ranking].reset_index(drop=True)\n",
    "        self.n = len(target)\n",
    "\n",
    "    def __call__(self, ext):\n",
    "        raise NotImplementedError()\n",
    "\n",
    "    def bound(self, ext):\n",
    "        raise NotImplementedError()\n",
    "\n",
    "    def search(self, method='greedy', verbose=False, **search_params):\n",
    "        \"\"\"\n",
    "        Run a realkd search for a query on the stored (sorted) data.\n",
    "        :param method: key into realkd's ``search_methods``\n",
    "        :param verbose: verbosity; from 2 on the size of the search context is printed\n",
    "        :param search_params: passed both to ``Context.from_df`` and to the search method\n",
    "        :return: result of the search's ``run()``\n",
    "        \"\"\"\n",
    "        from realkd.search import search_methods\n",
    "        ctx = Context.from_df(self.data, **search_params)\n",
    "        if verbose >= 2:\n",
    "            print(f'Created search context with {len(ctx.attributes)} attributes')\n",
    "        searcher = search_methods[method](ctx, self, self.bound, verbose=verbose, **search_params)\n",
    "        return searcher.run()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "eaec4413",
   "metadata": {},
   "outputs": [],
   "source": [
    "class OrthogonalBoostingObjective(ObjectFunction):\n",
    "    \"\"\"\n",
    "    Search objective that scores a query by |sum of gradients| relative to the norm of the\n",
    "    part of the query that is orthogonal to the already selected rules.\n",
    "\n",
    "    Samples are stored sorted by descending gradient. When rules already exist, the\n",
    "    orthonormal basis of their outputs must be passed as keyword ``orth_basis`` (one row per\n",
    "    sample); the gradient is then projected onto the orthogonal complement of that basis.\n",
    "    :param epsilon: constant added to the orthogonal norm in the denominator of the objective\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, data, target, advantage, other_values, current, predictions=None, loss=SquaredLoss, reg=1.0,\n",
    "                 rules=None,\n",
    "                 epsilon=1e-4, **kwargs):\n",
    "        super().__init__(data, target, predictions, loss, reg, advantage, other_values, current, rules)\n",
    "        self.rules = [] if rules is None else rules\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        self.epsilon = epsilon\n",
    "        predictions = np.zeros_like(\n",
    "            target) if predictions is None else predictions\n",
    "        g = np.array(self.loss.g(target, predictions, advantage, other_values, current))\n",
    "        # Same offset as in the base class; recomputed so that h can follow this class's ordering.\n",
    "        h = np.array(self.loss.h(target, predictions, advantage, other_values, current)) + 1e-6\n",
    "        self.n = len(target)\n",
    "        order = np.argsort(g)[::-1]\n",
    "        self.g = g[order]\n",
    "        # The base class stored h sorted by g / h; re-store it in the ordering used here so that\n",
    "        # self.h[ext] refers to the same samples as self.g[ext] and the rows of self.data.\n",
    "        self.h = h[order]\n",
    "        self.data = data.iloc[order].reset_index(drop=True)\n",
    "        self.target = target.iloc[order].reset_index(drop=True)\n",
    "        # Use the normalised self.rules: the raw argument may be None.\n",
    "        if len(self.rules) != 0:\n",
    "            orth_basis = kwargs['orth_basis']\n",
    "            self.orth_basis = orth_basis[order]\n",
    "            # Project g onto the orthogonal complement of the basis; the parentheses avoid\n",
    "            # forming the n x n matrix basis @ basis.T.\n",
    "            self.g = self.g - self.orth_basis @ (self.orth_basis.T @ self.g)\n",
    "        else:\n",
    "            self.orth_basis = np.zeros(self.n)\n",
    "\n",
    "    def __call__(self, ext):\n",
    "        \"\"\"\n",
    "        Objective value of an extent.\n",
    "        :param ext: indices (into the sorted data) of the samples selected by a query\n",
    "        :return: -inf for an empty extent; |sum g| / sqrt(sum h) while there are no rules;\n",
    "                 otherwise |sum g| / (orthogonal norm + epsilon), or 0 if that norm is at most 1e-4\n",
    "        \"\"\"\n",
    "        if len(ext) == 0:\n",
    "            return -inf\n",
    "        g_q = self.g[ext]\n",
    "        if len(self.rules) == 0:\n",
    "            h_q = self.h[ext]\n",
    "            # NOTE(review): np.sqrt yields nan if h_q.sum() is negative - confirm that the loss's\n",
    "            # second derivative cannot make the sum negative here.\n",
    "            return abs(g_q.sum()) / np.sqrt(h_q.sum())\n",
    "        length = self.fast_orth_norm(ext)\n",
    "        if length > 1e-4:\n",
    "            obj = abs(g_q.sum()) / (length + self.epsilon)\n",
    "        else:\n",
    "            obj = 0\n",
    "        return obj\n",
    "\n",
    "    def fast_orth_norm(self, ext):\n",
    "        \"\"\"\n",
    "        Norm of the indicator vector of ``ext`` after removing its projection onto the basis.\n",
    "        :return: sqrt(| len(ext) - sum over basis columns of (column sum over ext) ** 2 |)\n",
    "        \"\"\"\n",
    "        deltas = self.orth_basis[ext]\n",
    "        length = len(ext)\n",
    "        okqi = abs(np.sum(deltas, axis=0))\n",
    "        q_para_norms = (okqi ** 2).sum()\n",
    "        q_orth_norms_sq = np.abs(length - q_para_norms)\n",
    "        return np.sqrt(q_orth_norms_sq)\n",
    "\n",
    "    def fast_para_norms_prefix(self, ext):\n",
    "        \"\"\"\n",
    "        Same quantity as ``fast_orth_norm``, computed for every prefix of ``ext`` via cumulative sums.\n",
    "        :return: array with one orthogonal norm per prefix ext[:1], ext[:2], ...\n",
    "        \"\"\"\n",
    "        deltas = self.orth_basis[ext]\n",
    "        length = len(ext)\n",
    "        okqi = np.cumsum(deltas, axis=0)\n",
    "        q_para_norms = (okqi ** 2).sum(axis=1)\n",
    "        q_orth_norms_sq = np.abs(np.arange(1, length + 1) - q_para_norms)\n",
    "        q_orth_norms = np.sqrt(q_orth_norms_sq)\n",
    "        return q_orth_norms\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "626cceb7",
   "metadata": {},
   "outputs": [],
   "source": [
    "class GeneralRuleBoostingEstimator(BaseEstimator):\n",
    "    \"\"\"\n",
    "    Boosting estimator that grows an additive rule ensemble one rule at a time.\n",
    "\n",
    "    Each round instantiates the objective, searches a query with it, appends the query as a\n",
    "    rule and lets the weight update method recompute the weights of all rules.\n",
    "    :param num_rules: number of rules at which fitting stops\n",
    "    :param objective_function: class instantiated every round to search for the next query\n",
    "    :param weight_update_method: object whose ``calc_weight`` returns the weights of all rules\n",
    "    :param loss: loss object or string identifier (resolved with ``loss_function``)\n",
    "    :param reg: regularisation strength, also set on the weight update method\n",
    "    :param search: name of the search method handed to the objective's ``search``\n",
    "    :param max_col_attr: value used for 'max_col_attr' in the default search parameters\n",
    "    :param search_params: keyword arguments for the search; defaults are built when None\n",
    "    :param verbose: when true, every newly found rule is printed\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, num_rules, objective_function, weight_update_method, loss='squared', reg=1.0,\n",
    "                 search='greedy', max_col_attr=10,\n",
    "                 search_params=None, verbose=False):\n",
    "        if search_params is None:\n",
    "            search_params = {'order': 'bestboundfirst', 'apx': 1.0, 'max_depth': None, 'discretization': qcut,\n",
    "                             'max_col_attr': max_col_attr}\n",
    "        self.num_rules = num_rules\n",
    "        # Upper limit for the component count accumulated in fit.\n",
    "        self.num_components = 500\n",
    "        self.objective = objective_function\n",
    "        self.objective_function = objective_function\n",
    "        self.max_col_attr = max_col_attr\n",
    "        self.weight_update_method = weight_update_method\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        # Hand over the resolved loss object: the weight update calls loss.g, which a raw\n",
    "        # string identifier would not provide.\n",
    "        self.weight_update_method.loss = self.loss\n",
    "        self.weight_update_method.reg = reg\n",
    "        self.verbose = verbose\n",
    "        self.search = search\n",
    "        self.rules_ = AdditiveRuleEnsemble([])\n",
    "        self.search_params = search_params\n",
    "        self.history = []\n",
    "        self.time = []\n",
    "\n",
    "    def set_reg(self, reg):\n",
    "        \"\"\"Set the regularisation strength on the estimator, the objective and the weight update method.\"\"\"\n",
    "        self.reg = reg\n",
    "        self.objective.reg = reg\n",
    "        self.weight_update_method.reg = reg\n",
    "\n",
    "    def fit(self, data, target, advantage, other_values, current, has_origin_rules=False, verbose=False):\n",
    "        \"\"\"\n",
    "        Add rules until ``num_rules`` rules exist or the component limit is reached.\n",
    "        :param data: DataFrame of states\n",
    "        :param target: actions taken\n",
    "        :param advantage: advantages passed on to objective and weight update\n",
    "        :param other_values: outputs of the other models\n",
    "        :param current: action index of this model\n",
    "        :param has_origin_rules: when false the ensemble, history and timings are reset first;\n",
    "            when true the existing rules are kept and their outputs are orthonormalised\n",
    "        :param verbose: verbosity passed to the search\n",
    "        :return: self\n",
    "        \"\"\"\n",
    "        if not has_origin_rules:\n",
    "            self.history = []\n",
    "            self.time = []\n",
    "            self.rules_.members = []\n",
    "            orth_basis = np.array([])\n",
    "        else:\n",
    "            q_mat = np.column_stack(\n",
    "                [self.rules_[i].q(data) + np.zeros(len(data)) for i in range(len(self.rules_))])\n",
    "            orth_basis = orthonormalization(q_mat)\n",
    "        num_components = 0\n",
    "        while len(self.rules_) < self.num_rules and num_components < self.num_components:\n",
    "            start_time = datetime.now()\n",
    "            # Search for a rule\n",
    "            scores = self.rules_(data)\n",
    "            obj = self.objective(data, target, advantage, other_values, current, predictions=scores,\n",
    "                                 loss=self.loss, reg=self.reg, rules=self.rules_, orth_basis=orth_basis)\n",
    "            q = obj.search(method=self.search, verbose=verbose,\n",
    "                           **self.search_params)\n",
    "            if hasattr(self.objective, 'opt_weight') and callable(getattr(self.objective, 'opt_weight')):\n",
    "                y = obj.opt_weight(q)\n",
    "            else:\n",
    "                y = 1.0  # placeholder; replaced by the weight update below\n",
    "            q_vec = q(data)\n",
    "            num_components += (1 + len(q))\n",
    "            # Extend the orthonormal basis by the output of the new query.\n",
    "            if len(orth_basis) == 0:\n",
    "                basis = q_vec / norm(q_vec)\n",
    "                orth_basis = np.array([basis]).T\n",
    "            else:\n",
    "                basis = q_vec - orth_basis.dot(orth_basis.T.dot(q_vec))\n",
    "                basis = basis / (norm(basis) + 1e-6)\n",
    "                orth_basis = np.hstack((orth_basis, np.array([basis]).T))\n",
    "            rule = Rule(q, y)\n",
    "            if self.verbose:\n",
    "                print(rule)\n",
    "            self.rules_.append(rule)\n",
    "            # Calculate weights\n",
    "            weights = self.weight_update_method.calc_weight(\n",
    "                data, target, self.rules_, advantage, other_values, current)\n",
    "            for i in range(len(self.rules_)):\n",
    "                self.rules_[i].y = weights[i]\n",
    "            # Keep a snapshot of the ensemble after this round.\n",
    "            self.history.append(AdditiveRuleEnsemble(\n",
    "                [Rule(q=rule.q, y=rule.y) for rule in self.rules_.members]))\n",
    "            end_time = datetime.now()\n",
    "            self.time.append(str(end_time - start_time))\n",
    "        return self\n",
    "\n",
    "    def predict(self, data):\n",
    "        \"\"\"\n",
    "        Predictions derived from the ensemble scores.\n",
    "        The loss must provide a ``predictions`` method; it is applied to the scores.\n",
    "        \"\"\"\n",
    "        loss = loss_function(self.loss)\n",
    "        return loss.predictions(self.rules_(data))\n",
    "\n",
    "    def decision_function(self, data):\n",
    "        \"\"\"Raw ensemble scores for ``data``.\"\"\"\n",
    "        return self.rules_(data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "b50ce787",
   "metadata": {},
   "outputs": [],
   "source": [
    "# class Actor(nn.Module):\n",
    "#     def __init__(self, action_space, node=16):\n",
    "#         super(Actor, self).__init__()\n",
    "#         self.fc1 = nn.Linear(4, node)  \n",
    "# #         self.fc1_ = nn.Linear(node, node)\n",
    "#         self.fc2 = nn.Linear(node, action_space)\n",
    "\n",
    "#     def forward(self, state):\n",
    "#         x = F.relu(self.fc1(state))\n",
    "# #         x = F.relu(self.fc1_(x))\n",
    "#         x = self.fc2(x)\n",
    "#         return x"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "84b0ee0a",
   "metadata": {},
   "outputs": [],
   "source": [
    "def copy_rules(origin_rules):\n",
    "    \"\"\"\n",
    "    Copy an ensemble rule by rule.\n",
    "    :param origin_rules: indexable ensemble whose members have a query ``q`` and a weight ``y``\n",
    "    :return: new AdditiveRuleEnsemble made of new Rule objects with the same q and y\n",
    "    \"\"\"\n",
    "    members = (origin_rules[idx] for idx in range(len(origin_rules)))\n",
    "    return AdditiveRuleEnsemble([Rule(q=member.q, y=member.y) for member in members])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "bb3fcc8c",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ActorRule():\n",
    "    \"\"\"\n",
    "    Rule-based actor: one rule-boosting estimator per action produces that action's score.\n",
    "\n",
    "    ``model`` holds the estimators that are trained, ``best_model`` a second set of\n",
    "    estimators (built with reg=0.01 and max_col_attr=20) that ``predict`` reads from.\n",
    "    :param action_space: number of actions, i.e. of estimators per set\n",
    "    :param num_rules: number of rules of each estimator\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, action_space=2, num_rules=5):\n",
    "        self.action_space = action_space\n",
    "        self.model = self._build_estimators(action_space, num_rules, reg=0.3, max_col_attr=10)\n",
    "        self.best_model = self._build_estimators(action_space, num_rules, reg=0.01, max_col_attr=20)\n",
    "\n",
    "    @staticmethod\n",
    "    def _build_estimators(count, num_rules, reg, max_col_attr):\n",
    "        # One independently configured estimator (with its own weight updater) per action.\n",
    "        return [GeneralRuleBoostingEstimator(num_rules=num_rules, objective_function=OrthogonalBoostingObjective,\n",
    "                                             weight_update_method=FullyCorrectiveA2C(), loss=PiLoss(),\n",
    "                                             reg=reg, search='greedy', max_col_attr=max_col_attr, verbose=False)\n",
    "                for _ in range(count)]\n",
    "\n",
    "    def __call__(self, state):\n",
    "        \"\"\"Scores of the trained estimators for ``state``, one row per action.\"\"\"\n",
    "        return np.array([estimator.rules_(state) for estimator in self.model])\n",
    "\n",
    "    def predict(self, state):\n",
    "        \"\"\"Scores of the best-model estimators for ``state``, one row per action.\"\"\"\n",
    "        return np.array([self.best_model[k].rules_(state) for k in range(len(self.model))])\n",
    "\n",
    "\n",
    "def update_rules(estimator: GeneralRuleBoostingEstimator, x, y, adv, other_values, current):\n",
    "    \"\"\"\n",
    "    Replace the weakest rule of an estimator and keep the result only if the risk does not rise.\n",
    "\n",
    "    Rules with the same query text are merged (weights summed), the query with the smallest\n",
    "    absolute merged weight is dropped, the remaining weights are re-optimised, and the\n",
    "    estimator is fitted further starting from these rules. If the final risk exceeds the\n",
    "    risk of the original rules, the original rules are restored.\n",
    "    :param estimator: estimator whose ``rules_`` are updated in place\n",
    "    :param x: DataFrame of states\n",
    "    :param y: actions taken\n",
    "    :param adv: advantages\n",
    "    :param other_values: outputs of the other models\n",
    "    :param current: action index of this estimator\n",
    "    :return: the estimator\n",
    "    \"\"\"\n",
    "    original_rules = copy_rules(estimator.rules_)\n",
    "    origin_risk = calc_risk(PiLoss(), y, original_rules, x, estimator.reg, adv, other_values, current)\n",
    "\n",
    "    # Merge rules that share a query (compared by their string form), summing the weights.\n",
    "    merged = {}\n",
    "    unique_queries = []\n",
    "    for idx in range(len(estimator.rules_)):\n",
    "        member = estimator.rules_[idx]\n",
    "        key = str(member.q)\n",
    "        if key in merged:\n",
    "            merged[key] += member.y\n",
    "        else:\n",
    "            merged[key] = member.y\n",
    "            unique_queries.append(member.q)\n",
    "    merged = {key: abs(weight) for key, weight in merged.items()}\n",
    "\n",
    "    # Drop the query with the smallest absolute weight, but never end up without a rule.\n",
    "    weakest = min(merged, key=merged.get)\n",
    "    kept = [Rule(q=query, y=merged[str(query)]) for query in unique_queries if str(query) != weakest]\n",
    "    if not kept:\n",
    "        kept = [Rule(q=unique_queries[0], y=merged[str(unique_queries[0])])]\n",
    "    new_rules = AdditiveRuleEnsemble(kept)\n",
    "\n",
    "    reduced_weights = FullyCorrectiveA2C(loss_function('pi_loss'), estimator.reg).calc_weight(\n",
    "        x, y, new_rules, adv, other_values, current)\n",
    "    for idx in range(len(new_rules)):\n",
    "        new_rules[idx].y = reduced_weights[idx]\n",
    "\n",
    "    # Continue boosting from the reduced ensemble, then re-optimise all weights once more.\n",
    "    estimator.rules_ = new_rules\n",
    "    estimator.fit(x, y, adv, other_values, current, has_origin_rules=True)\n",
    "    final_weights = FullyCorrectiveA2C(loss_function('pi_loss'), estimator.reg).calc_weight(\n",
    "        x, y, estimator.rules_, adv, other_values, current)\n",
    "    for idx in range(len(estimator.rules_)):\n",
    "        estimator.rules_[idx].y = final_weights[idx]\n",
    "\n",
    "    new_risk = calc_risk(PiLoss(), y, estimator.rules_, x, estimator.reg, adv, other_values, current)\n",
    "    if new_risk > origin_risk:\n",
    "        # The update made things worse: fall back to the rules we started with.\n",
    "        estimator.rules_ = copy_rules(original_rules)\n",
    "        print(\"origin\", origin_risk, 'new', new_risk, 'not updated')\n",
    "    return estimator"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "2824981f",
   "metadata": {},
   "outputs": [],
   "source": [
    "class Critic(nn.Module):\n",
    "    def __init__(self, node=16):\n",
    "        super(Critic, self).__init__()\n",
    "        self.fc1 = nn.Linear(4, node)\n",
    "        self.fc2 = nn.Linear(node, 1)\n",
    "\n",
    "    def forward(self, state):\n",
    "        x = F.relu(self.fc1(state))\n",
    "        x = self.fc2(x)\n",
    "        return x"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "6b6e2dd7",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Discount factor used when accumulating the rewards of an episode.\n",
    "gamma = 0.99\n",
    "# Rule-based actor with its default settings (2 actions, 5 rules per action).\n",
    "actor = ActorRule()\n",
    "# Neural critic on the selected device, optimised with AdamW.\n",
    "critic = Critic().to(device)\n",
    "critic_optimizer = optim.AdamW(critic.parameters(), lr=0.001)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "ae072cc5",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ActorNet(nn.Module):\n",
    "    def __init__(self, hidden_dim=16):\n",
    "        super().__init__()\n",
    "\n",
    "        self.hidden = nn.Linear(4, hidden_dim)\n",
    "        self.output = nn.Linear(hidden_dim, 2)\n",
    "\n",
    "    def forward(self, s):\n",
    "        outs = self.hidden(s)\n",
    "        outs = F.relu(outs)\n",
    "        logits = self.output(outs)\n",
    "        return logits\n",
    "\n",
    "\n",
    "# Neural-network actor on the selected device.\n",
    "actor_func = ActorNet().to(device)\n",
    "# value_func is a second name for the critic object, not a copy of it.\n",
    "value_func = critic"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "c565d5ef",
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "# AdamW optimisers for the value network (opt1) and the neural actor (opt2).\n",
    "# NOTE(review): value_func is the critic object itself, so opt1 optimises the same parameters\n",
    "# as critic_optimizer.\n",
    "opt1 = torch.optim.AdamW(value_func.parameters(), lr=0.001)\n",
    "opt2 = torch.optim.AdamW(actor_func.parameters(), lr=0.001)\n",
    "def pick_sample(s):\n",
    "    \"\"\"\n",
    "    Sample an action for a single state from the neural actor.\n",
    "    :param s: one state (4 components)\n",
    "    :return: index of the sampled action as a Python int\n",
    "    \"\"\"\n",
    "    with torch.no_grad():\n",
    "        # Add a batch dimension --> size : (1, 4)\n",
    "        batch = torch.tensor(np.expand_dims(s, axis=0), dtype=torch.float).to(device)\n",
    "        # Logits of the single state --> size : (2)\n",
    "        logits = actor_func(batch).squeeze(dim=0)\n",
    "        # Turn the logits into probabilities and draw one action from them\n",
    "        probs = F.softmax(logits, dim=-1)\n",
    "        drawn = torch.multinomial(probs, num_samples=1)\n",
    "        return drawn.tolist()[0]\n",
    "# Baseline actor-critic training with the neural actor.\n",
    "# NOTE: range(0) is empty, so the loop body below never executes as written.\n",
    "reward_records = []\n",
    "for i in range(0):\n",
    "    #\n",
    "    # Run episode till done\n",
    "    #\n",
    "    done = False\n",
    "    states = []\n",
    "    actions = []\n",
    "    rewards = []\n",
    "    s, _ = env.reset(seed=np.random.randint(0, 1e6))\n",
    "    while not done:\n",
    "        states.append(s.tolist())\n",
    "        a = pick_sample(s)\n",
    "        s, r, term, trunc, _ = env.step(a)\n",
    "        done = term or trunc\n",
    "        actions.append(a)\n",
    "        rewards.append(r)\n",
    "\n",
    "    #\n",
    "    # Get cumulative rewards\n",
    "    #\n",
    "    # Discounted return per step, accumulated from the last step backwards.\n",
    "    cum_rewards = np.zeros_like(rewards)\n",
    "    reward_len = len(rewards)\n",
    "    for j in reversed(range(reward_len)):\n",
    "        cum_rewards[j] = rewards[j] + (cum_rewards[j+1]*gamma if j+1 < reward_len else 0)\n",
    "\n",
    "    #\n",
    "    # Train (optimize parameters)\n",
    "    #\n",
    "\n",
    "    # Optimize value loss (Critic)\n",
    "    opt1.zero_grad()\n",
    "    # From here on states and cum_rewards are tensors on the device, no longer lists/arrays.\n",
    "    states = torch.tensor(states, dtype=torch.float).to(device)\n",
    "    cum_rewards = torch.tensor(cum_rewards, dtype=torch.float).to(device)\n",
    "    values = value_func(states)\n",
    "    values = values.squeeze(dim=1)\n",
    "    vf_loss = F.mse_loss(\n",
    "        values,\n",
    "        cum_rewards,\n",
    "        reduction=\"none\")\n",
    "    vf_loss.sum().backward()\n",
    "    opt1.step()\n",
    "\n",
    "    # Todo 2; RULE BASED UPDATES\n",
    "    # Re-evaluate the values without gradient tracking so the advantages are constants for the actor update.\n",
    "    with torch.no_grad():\n",
    "        values = value_func(states).squeeze(dim=1)\n",
    "    opt2.zero_grad()\n",
    "    actions = torch.tensor(actions, dtype=torch.int64).to(device)\n",
    "    advantages = cum_rewards - values\n",
    "#     print(advantages)\n",
    "    logits = actor_func(states)\n",
    "    # cross_entropy returns -log p(action), hence the sign flip.\n",
    "    log_probs = -F.cross_entropy(logits, actions, reduction=\"none\")\n",
    "    pi_loss = -log_probs * advantages\n",
    "    pi_loss.sum().backward()\n",
    "    opt2.step()\n",
    "\n",
    "    # Output total rewards in episode (max 500)\n",
    "    print(\"Run episode {} with rewards {}\".format(i, sum(rewards)))#, end=\"\\r\")\n",
    "    reward_records.append(sum(rewards))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "73589768",
   "metadata": {},
   "outputs": [],
   "source": [
    "def softmax(logits):\n",
    "    exp_logits = np.exp(logits)\n",
    "    sum_logits = np.sum(exp_logits)\n",
    "    return (exp_logits / sum_logits).reshape([-1])\n",
    "\n",
    "def pick_sample(s):\n",
    "    \"\"\"\n",
    "    Sample an action for a single state from the rule-based actor.\n",
    "    This definition replaces the earlier pick_sample that used the neural actor.\n",
    "    :param s: one state (4 components)\n",
    "    :return: index of the sampled action as a Python int\n",
    "    \"\"\"\n",
    "    with torch.no_grad():\n",
    "        # The rule ensembles expect a DataFrame with named columns, here with a single row.\n",
    "        state_frame = pd.DataFrame(np.expand_dims(s, axis=0), columns=column_names)\n",
    "        probs = softmax(actor(state_frame))\n",
    "        drawn = torch.multinomial(torch.tensor(probs), num_samples=1)\n",
    "        return drawn.tolist()[0]\n",
    "\n",
    "\n",
    "def train():\n",
    "    reward_records = []\n",
    "    best_rewards = 0\n",
    "    # best_model = None\n",
    "    for i in range(1000):\n",
    "\n",
    "        done = False\n",
    "        states = []\n",
    "        actions = []\n",
    "        rewards = []\n",
    "        s, _ = env.reset(seed=np.random.randint(0, 1e6))\n",
    "        if i == 2:\n",
    "            print('stop here')\n",
    "        while not done:\n",
    "            states.append(s.tolist())\n",
    "            a = pick_sample(s)\n",
    "            s, r, term, trunc, _ = env.step(a)\n",
    "            done = term or trunc\n",
    "            actions.append(a)\n",
    "            rewards.append(r)\n",
    "\n",
    "        # if sum(rewards) > 480:\n",
    "        #     break\n",
    "        #\n",
    "        # Get cumulative rewards\n",
    "        #\n",
    "        cum_rewards = np.zeros_like(rewards)\n",
    "        reward_len = len(rewards)\n",
    "        for j in reversed(range(reward_len)):\n",
    "            cum_rewards[j] = rewards[j] + (cum_rewards[j + 1] * gamma if j + 1 < reward_len else 0)\n",
    "        #\n",
    "        # Train (optimize parameters)\n",
    "        #\n",
    "        # Optimize value loss (Critic)\n",
    "        critic_optimizer.zero_grad()\n",
    "        states = torch.tensor(states, dtype=torch.float).to(device)\n",
    "        cum_rewards = torch.tensor(cum_rewards, dtype=torch.float).to(device)\n",
    "        values = critic(states)\n",
    "        values = values.squeeze(dim=1)\n",
    "        vf_loss = F.mse_loss(\n",
    "            values,\n",
    "            cum_rewards,\n",
    "            reduction=\"none\")\n",
    "        vf_loss.sum().backward()\n",
    "        critic_optimizer.step()\n",
    "        print('============', i, '===========')\n",
    "        print(len(actions), 'actions', actions)\n",
    "\n",
    "        print(\"{}\\n--------------\\n{}\\nRun episode {} with rewards {}\".format(actor.model[0].rules_,\n",
    "                                                                              actor.model[1].rules_,\n",
    "                                                                              i,\n",
    "                                                                              sum(rewards)))  # , end=\"\\r\")\n",
    "        if i > 0:\n",
    "            if sum(rewards) >= best_rewards:\n",
    "                best_rewards = sum(rewards)\n",
    "                for rr in range(actor.action_space):\n",
    "                    rules = []\n",
    "                    for n in range(len(actor.model[rr].rules_)):\n",
    "                        rule = actor.model[rr].rules_[n]\n",
    "                        rules.append(Rule(q=rule.q, y=rule.y))\n",
    "                    actor.best_model[rr].rules_ = AdditiveRuleEnsemble(rules)\n",
    "                print('best')\n",
    "        if np.average(reward_records[-5:]) > 475.0:\n",
    "            break\n",
    "        #     else:\n",
    "        #         for rr in range(actor.action_space):\n",
    "        #             rules = []\n",
    "        #             for n in range(len(actor.best_model[rr].rules_)):\n",
    "        #                 rule = actor.best_model[rr].rules_[n]\n",
    "        #                 rules.append(Rule(q=rule.q, y=rule.y))\n",
    "        #             actor.model[rr].rules_ = AdditiveRuleEnsemble(rules)\n",
    "        #         print('')\n",
    "\n",
    "        #\n",
    "        # Todo 2; RULE BASED UPDATES\n",
    "        with torch.no_grad():\n",
    "            values = critic(states).squeeze(dim=1)\n",
    "        actions = torch.tensor(actions, dtype=torch.int64).to(device)\n",
    "        advantages = cum_rewards - values\n",
    "        states_array = states.cpu().detach().numpy()\n",
    "        x = pd.DataFrame(states_array, columns=column_names)\n",
    "        y = pd.Series(actions.cpu().detach().numpy())\n",
    "#         advantages = (advantages-advantages.mean())/advantages.std()\n",
    "        adv = pd.Series(advantages.cpu().detach().numpy())\n",
    "        outputs = actor(x).T\n",
    "        # print('adv', advantages.cpu().detach().numpy())\n",
    "        # print('outputs', outputs.tolist())\n",
    "        for j in range(len(actor.model)):\n",
    "            m = actor.model[j]\n",
    "            masks = np.ones_like(outputs, dtype=bool)\n",
    "            masks[:, j] = False\n",
    "            other_values = outputs[masks].reshape(-1, outputs.shape[1] - 1)\n",
    "\n",
    "            if len(m.rules_) == 0:\n",
    "                m.fit(x, y, adv, other_values, j)\n",
    "            else:\n",
    "                for _ in range(1):\n",
    "                    update_rules(m, x, y, adv, other_values, j)\n",
    "        \n",
    "        # print(\n",
    "        #     \"{}\\n--------------\\n{}\\nRun episode {} with rewards {}\".format(actor.model[0].rules_,\n",
    "        #                                                                     actor.model[1].rules_,\n",
    "        #                                                                     i,\n",
    "        #                                                                     sum(rewards)))  # , end=\"\\r\")\n",
    "        reward_records.append(sum(rewards))\n",
    "    print(\"\\nDone\")\n",
    "    env.close()\n",
    "    return reward_records"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "id": "b411aa5d",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 0 ===========\n",
      "31 actions [1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1]\n",
      "\n",
      "--------------\n",
      "\n",
      "Run episode 0 with rewards 31.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/lib/function_base.py:518: RuntimeWarning: Mean of empty slice.\n",
      "  avg = a.mean(axis, **keepdims_kw)\n",
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/core/_methods.py:190: RuntimeWarning: invalid value encountered in double_scalars\n",
      "  ret = ret.dtype.type(ret / rcount)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 1 ===========\n",
      "25 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1]\n",
      "   +6.6232 if cp>=0.04436511918902397 & cv>=-0.21709540486335754\n",
      "   -3.5863 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +3.1406 if cv>=0.5568901300430298\n",
      "   -4.2572 if cp<=0.04436511918902397 & cp>=0.02268251031637192 & pav>=-0.7808784246444702\n",
      "   +2.0342 if cv>=-0.002278788713737727 & pa>=-0.05927136540412903 & pav>=-0.4059761166572571\n",
      "--------------\n",
      "   -6.6233 if cp>=0.04436511918902397 & cv>=-0.21709540486335754\n",
      "   +3.5862 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   -3.1406 if cv>=0.5568901300430298\n",
      "   +4.2572 if cp<=0.04436511918902397 & cp>=0.02268251031637192 & pav>=-0.7808784246444702\n",
      "   -2.0343 if cv>=-0.002278788713737727 & pa>=-0.05927136540412903 & pav>=-0.4059761166572571\n",
      "Run episode 1 with rewards 25.0\n",
      "best\n",
      "stop here\n",
      "============ 2 ===========\n",
      "41 actions [0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0]\n",
      "   +0.0000 if cp>=0.04436511918902397 & cv>=-0.21709540486335754\n",
      "   -1.9213 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +0.0000 if cv>=0.5568901300430298\n",
      "   +0.0000 if cp<=0.04436511918902397 & cp>=0.02268251031637192 & pav>=-0.7808784246444702\n",
      "   +2.9984 if cv>=0.005495118349790581 & pav<=0.35348663926124574\n",
      "--------------\n",
      "   +0.0000 if cp>=0.04436511918902397 & cv>=-0.21709540486335754\n",
      "   +1.9213 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +0.0000 if cv>=0.5568901300430298\n",
      "   +0.0000 if cp<=0.04436511918902397 & cp>=0.02268251031637192 & pav>=-0.7808784246444702\n",
      "   -2.9985 if cv>=0.005495118349790581 & pav<=0.35348663926124574\n",
      "Run episode 2 with rewards 41.0\n",
      "best\n",
      "============ 3 ===========\n",
      "24 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.0000 if cp>=0.04436511918902397 & cv>=-0.21709540486335754\n",
      "   -4.1606 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +0.0000 if cp<=0.04436511918902397 & cp>=0.02268251031637192 & pav>=-0.7808784246444702\n",
      "   +2.2978 if cv>=0.005495118349790581 & pav<=0.35348663926124574\n",
      "   +1.3003 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "--------------\n",
      "   +0.0000 if cp>=0.04436511918902397 & cv>=-0.21709540486335754\n",
      "   +4.1606 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +0.0000 if cp<=0.04436511918902397 & cp>=0.02268251031637192 & pav>=-0.7808784246444702\n",
      "   -2.2978 if cv>=0.005495118349790581 & pav<=0.35348663926124574\n",
      "   -1.3003 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "Run episode 3 with rewards 24.0\n",
      "============ 4 ===========\n",
      "67 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1]\n",
      "   +0.0000 if cp>=0.04436511918902397 & cv>=-0.21709540486335754\n",
      "   -3.0625 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +1.1008 if cv>=0.005495118349790581 & pav<=0.35348663926124574\n",
      "   +1.2823 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "   -0.4043 if cv<=0.008257742691785107 & cv>=-0.17936682105064392\n",
      "--------------\n",
      "   +0.0000 if cp>=0.04436511918902397 & cv>=-0.21709540486335754\n",
      "   +3.0625 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   -1.1008 if cv>=0.005495118349790581 & pav<=0.35348663926124574\n",
      "   -1.2823 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "   +0.4043 if cv<=0.008257742691785107 & cv>=-0.17936682105064392\n",
      "Run episode 4 with rewards 67.0\n",
      "best\n",
      "============ 5 ===========\n",
      "43 actions [1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1]\n",
      "   -5.6587 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +4.0768 if cv>=0.005495118349790581 & pav<=0.35348663926124574\n",
      "   +2.1020 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "   -0.4433 if cv<=0.008257742691785107 & cv>=-0.17936682105064392\n",
      "   -5.2149 if cp>=0.010548739694058895 & cv<=0.04253323003649713 & cv>=-0.13681784868240357 & pav<=-0.02825711220502851\n",
      "--------------\n",
      "   +5.6586 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   -4.0767 if cv>=0.005495118349790581 & pav<=0.35348663926124574\n",
      "   -2.1020 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "   +0.4433 if cv<=0.008257742691785107 & cv>=-0.17936682105064392\n",
      "   +5.2149 if cp>=0.010548739694058895 & cv<=0.04253323003649713 & cv>=-0.13681784868240357 & pav<=-0.02825711220502851\n",
      "Run episode 5 with rewards 43.0\n",
      "============ 6 ===========\n",
      "86 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1]\n",
      "   -3.2169 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +1.8550 if cv>=0.005495118349790581 & pav<=0.35348663926124574\n",
      "   +4.0945 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "   +0.0000 if cp>=0.010548739694058895 & cv<=0.04253323003649713 & cv>=-0.13681784868240357 & pav<=-0.02825711220502851\n",
      "   -2.5571 if cv<=-0.019157563149929044 & pa>=-0.061038896441459656\n",
      "--------------\n",
      "   +3.2168 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   -1.8549 if cv>=0.005495118349790581 & pav<=0.35348663926124574\n",
      "   -4.0945 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "   +0.0000 if cp>=0.010548739694058895 & cv<=0.04253323003649713 & cv>=-0.13681784868240357 & pav<=-0.02825711220502851\n",
      "   +2.5571 if cv<=-0.019157563149929044 & pa>=-0.061038896441459656\n",
      "Run episode 6 with rewards 86.0\n",
      "best\n",
      "============ 7 ===========\n",
      "33 actions [0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -5.6897 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +3.3461 if cv>=0.005495118349790581 & pav<=0.35348663926124574\n",
      "   +2.1603 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "   +0.1208 if cv<=-0.019157563149929044 & pa>=-0.061038896441459656\n",
      "   -1.4960 if pav>=-0.2632550895214081\n",
      "--------------\n",
      "   +5.6897 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   -3.3460 if cv>=0.005495118349790581 & pav<=0.35348663926124574\n",
      "   -2.1603 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "   -0.1208 if cv<=-0.019157563149929044 & pa>=-0.061038896441459656\n",
      "   +1.4960 if pav>=-0.2632550895214081\n",
      "Run episode 7 with rewards 33.0\n",
      "============ 8 ===========\n",
      "39 actions [0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1]\n",
      "   -3.5529 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +0.3746 if cv>=0.005495118349790581 & pav<=0.35348663926124574\n",
      "   +1.4908 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "   +1.4908 if pav>=-0.2632550895214081\n",
      "   +0.5546 if cp>=0.03598427399992943 & cv>=-0.03523126021027565\n",
      "--------------\n",
      "   +3.5528 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   -0.3746 if cv>=0.005495118349790581 & pav<=0.35348663926124574\n",
      "   -1.4909 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "   -1.4909 if pav>=-0.2632550895214081\n",
      "   -0.5546 if cp>=0.03598427399992943 & cv>=-0.03523126021027565\n",
      "Run episode 8 with rewards 39.0\n",
      "============ 9 ===========\n",
      "34 actions [0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1]\n",
      "   -4.3928 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +1.0070 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "   +1.0070 if pav>=-0.2632550895214081\n",
      "   -0.0000 if cp>=0.03598427399992943 & cv>=-0.03523126021027565\n",
      "   +5.1528 if cp>=-0.03323424980044365\n",
      "--------------\n",
      "   +4.3928 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   -1.0070 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "   -1.0070 if pav>=-0.2632550895214081\n",
      "   -0.0000 if cp>=0.03598427399992943 & cv>=-0.03523126021027565\n",
      "   -5.1528 if cp>=-0.03323424980044365\n",
      "Run episode 9 with rewards 34.0\n",
      "============ 10 ===========\n",
      "40 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1]\n",
      "   -4.8679 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +0.6692 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "   +2.0017 if pav>=-0.2632550895214081\n",
      "   +2.8742 if cp>=-0.03323424980044365\n",
      "   -4.5283 if cv>=0.025608240440487876 & pav>=0.306297105550766\n",
      "--------------\n",
      "   +4.8679 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   -0.6693 if cp>=-0.06380262970924377 & pav>=-0.26473599672317505\n",
      "   -2.0018 if pav>=-0.2632550895214081\n",
      "   -2.8742 if cp>=-0.03323424980044365\n",
      "   +4.5282 if cv>=0.025608240440487876 & pav>=0.306297105550766\n",
      "Run episode 10 with rewards 40.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 11 ===========\n",
      "22 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -5.3772 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +2.3613 if pav>=-0.2632550895214081\n",
      "   -0.0000 if cp>=-0.03323424980044365\n",
      "   -2.1884 if cv>=0.025608240440487876 & pav>=0.306297105550766\n",
      "   -0.4186 if cv<=-0.15498296916484833\n",
      "--------------\n",
      "   +5.3772 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   -2.3614 if pav>=-0.2632550895214081\n",
      "   -0.0000 if cp>=-0.03323424980044365\n",
      "   +2.1884 if cv>=0.025608240440487876 & pav>=0.306297105550766\n",
      "   +0.4186 if cv<=-0.15498296916484833\n",
      "Run episode 11 with rewards 22.0\n",
      "============ 12 ===========\n",
      "50 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1]\n",
      "   -1.7887 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +1.6826 if pav>=-0.2632550895214081\n",
      "   +0.0000 if cv>=0.025608240440487876 & pav>=0.306297105550766\n",
      "   -1.7887 if cv<=-0.15498296916484833\n",
      "   +1.3093 if cp<=-0.05473860576748848 & cv>=-0.1826152354478836\n",
      "--------------\n",
      "   +1.7887 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   -1.6826 if pav>=-0.2632550895214081\n",
      "   +0.0000 if cv>=0.025608240440487876 & pav>=0.306297105550766\n",
      "   +1.7887 if cv<=-0.15498296916484833\n",
      "   -1.3093 if cp<=-0.05473860576748848 & cv>=-0.1826152354478836\n",
      "Run episode 12 with rewards 50.0\n",
      "============ 13 ===========\n",
      "45 actions [0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +3.7618 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   -3.6526 if pav>=-0.2632550895214081\n",
      "   -6.6486 if cv<=-0.15498296916484833\n",
      "   +2.5942 if cp<=-0.05473860576748848 & cv>=-0.1826152354478836\n",
      "   +3.4027 if \n",
      "--------------\n",
      "   -3.7623 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +3.6524 if pav>=-0.2632550895214081\n",
      "   +6.6495 if cv<=-0.15498296916484833\n",
      "   -2.5946 if cp<=-0.05473860576748848 & cv>=-0.1826152354478836\n",
      "   -3.4025 if \n",
      "Run episode 13 with rewards 45.0\n",
      "============ 14 ===========\n",
      "48 actions [1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0]\n",
      "   -0.8590 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   -2.3938 if pav>=-0.2632550895214081\n",
      "   -1.9232 if cv<=-0.15498296916484833\n",
      "   +1.6469 if \n",
      "   +5.4802 if cp>=0.0015539415879175086 & cv<=-0.015290745720267288 & cv>=-0.20043312311172484 & pa<=-0.022069661691784856\n",
      "--------------\n",
      "   +0.8590 if cv<=-0.02955218032002449 & pa>=-0.05927136540412903\n",
      "   +2.3937 if pav>=-0.2632550895214081\n",
      "   +1.9236 if cv<=-0.15498296916484833\n",
      "   -1.6468 if \n",
      "   -5.4801 if cp>=0.0015539415879175086 & cv<=-0.015290745720267288 & cv>=-0.20043312311172484 & pa<=-0.022069661691784856\n",
      "Run episode 14 with rewards 48.0\n",
      "============ 15 ===========\n",
      "48 actions [1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0]\n",
      "   -3.8457 if pav>=-0.2632550895214081\n",
      "   -3.7875 if cv<=-0.15498296916484833\n",
      "   +3.2578 if \n",
      "   +0.0000 if cp>=0.0015539415879175086 & cv<=-0.015290745720267288 & cv>=-0.20043312311172484 & pa<=-0.022069661691784856\n",
      "   -3.7202 if pa>=-0.010346114076673978 & pav>=-0.009510042145848257\n",
      "--------------\n",
      "   +3.8454 if pav>=-0.2632550895214081\n",
      "   +3.7878 if cv<=-0.15498296916484833\n",
      "   -3.2576 if \n",
      "   +0.0000 if cp>=0.0015539415879175086 & cv<=-0.015290745720267288 & cv>=-0.20043312311172484 & pa<=-0.022069661691784856\n",
      "   +3.7207 if pa>=-0.010346114076673978 & pav>=-0.009510042145848257\n",
      "Run episode 15 with rewards 48.0\n",
      "============ 16 ===========\n",
      "38 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0]\n",
      "   -2.8411 if pav>=-0.2632550895214081\n",
      "   -1.3434 if cv<=-0.15498296916484833\n",
      "   +1.9428 if \n",
      "   -0.9754 if pa>=-0.010346114076673978 & pav>=-0.009510042145848257\n",
      "   +2.5806 if cp>=0.03478786125779152 & pa>=-0.03226655200123787 & pav<=-0.21050577759742736 & pav>=-0.2995856761932373\n",
      "--------------\n",
      "   +2.8409 if pav>=-0.2632550895214081\n",
      "   +1.3436 if cv<=-0.15498296916484833\n",
      "   -1.9425 if \n",
      "   +0.9755 if pa>=-0.010346114076673978 & pav>=-0.009510042145848257\n",
      "   -2.5807 if cp>=0.03478786125779152 & pa>=-0.03226655200123787 & pav<=-0.21050577759742736 & pav>=-0.2995856761932373\n",
      "Run episode 16 with rewards 38.0\n",
      "============ 17 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   -6.0661 if pav>=-0.2632550895214081\n",
      "   -1.9330 if cv<=-0.15498296916484833\n",
      "   +2.6316 if \n",
      "   +0.0000 if cp>=0.03478786125779152 & pa>=-0.03226655200123787 & pav<=-0.21050577759742736 & pav>=-0.2995856761932373\n",
      "   +6.3043 if cp>=0.01828569918870926\n",
      "--------------\n",
      "   +6.0659 if pav>=-0.2632550895214081\n",
      "   +1.9331 if cv<=-0.15498296916484833\n",
      "   -2.6314 if \n",
      "   +0.0000 if cp>=0.03478786125779152 & pa>=-0.03226655200123787 & pav<=-0.21050577759742736 & pav>=-0.2995856761932373\n",
      "   -6.3044 if cp>=0.01828569918870926\n",
      "Run episode 17 with rewards 10.0\n",
      "============ 18 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 0, 0]\n",
      "   +0.5502 if pav>=-0.2632550895214081\n",
      "   +0.4666 if cv<=-0.15498296916484833\n",
      "   +0.5502 if \n",
      "   +1.5374 if cp>=0.01828569918870926\n",
      "   +0.4086 if cp>=0.046193432062864304\n",
      "--------------\n",
      "   -0.5501 if pav>=-0.2632550895214081\n",
      "   -0.4665 if cv<=-0.15498296916484833\n",
      "   -0.5501 if \n",
      "   -1.5374 if cp>=0.01828569918870926\n",
      "   -0.4086 if cp>=0.046193432062864304\n",
      "Run episode 18 with rewards 9.0\n",
      "============ 19 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 1, 0, 1, 0]\n",
      "   -0.2887 if pav>=-0.2632550895214081\n",
      "   -0.8441 if cv<=-0.15498296916484833\n",
      "   -0.2887 if \n",
      "   -0.0000 if cp>=0.01828569918870926\n",
      "   +3.3794 if cv>=-1.0282196640968322\n",
      "--------------\n",
      "   +0.2887 if pav>=-0.2632550895214081\n",
      "   +0.8441 if cv<=-0.15498296916484833\n",
      "   +0.2887 if \n",
      "   -0.0000 if cp>=0.01828569918870926\n",
      "   -3.3794 if cv>=-1.0282196640968322\n",
      "Run episode 19 with rewards 10.0\n",
      "============ 20 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 0, 1]\n",
      "   -0.0893 if pav>=-0.2632550895214081\n",
      "   -0.2239 if cv<=-0.15498296916484833\n",
      "   -0.0893 if \n",
      "   +2.3301 if cv>=-1.0282196640968322\n",
      "   +0.4861 if cp>=-0.031829146295785905\n",
      "--------------\n",
      "   +0.0894 if pav>=-0.2632550895214081\n",
      "   +0.2239 if cv<=-0.15498296916484833\n",
      "   +0.0894 if \n",
      "   -2.3301 if cv>=-1.0282196640968322\n",
      "   -0.4861 if cp>=-0.031829146295785905\n",
      "Run episode 20 with rewards 9.0\n",
      "============ 21 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 1, 0, 1, 0]\n",
      "   -0.4674 if cv<=-0.15498296916484833\n",
      "   -0.3197 if \n",
      "   +2.0894 if cv>=-1.0282196640968322\n",
      "   +0.8340 if cp>=-0.031829146295785905\n",
      "   -0.3757 if pa>=0.19453386962413788\n",
      "--------------\n",
      "   +0.4675 if cv<=-0.15498296916484833\n",
      "   +0.3197 if \n",
      "   -2.0893 if cv>=-1.0282196640968322\n",
      "   -0.8340 if cp>=-0.031829146295785905\n",
      "   +0.3757 if pa>=0.19453386962413788\n",
      "Run episode 21 with rewards 10.0\n",
      "============ 22 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0]\n",
      "   -0.0566 if cv<=-0.15498296916484833\n",
      "   +2.5434 if cv>=-1.0282196640968322\n",
      "   -0.2595 if cp>=-0.031829146295785905\n",
      "   -0.0000 if pa>=0.19453386962413788\n",
      "   -1.4205 if cp<=0.001615658774971964\n",
      "--------------\n",
      "   +0.0566 if cv<=-0.15498296916484833\n",
      "   -2.5434 if cv>=-1.0282196640968322\n",
      "   +0.2595 if cp>=-0.031829146295785905\n",
      "   +0.0000 if pa>=0.19453386962413788\n",
      "   +1.4205 if cp<=0.001615658774971964\n",
      "Run episode 22 with rewards 12.0\n",
      "============ 23 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1]\n",
      "   -0.7135 if cv<=-0.15498296916484833\n",
      "   +0.4830 if cv>=-1.0282196640968322\n",
      "   +1.3896 if cp>=-0.031829146295785905\n",
      "   -0.7733 if cp<=0.001615658774971964\n",
      "   +2.9579 if cv>=-0.9685938596725464\n",
      "--------------\n",
      "   +0.7135 if cv<=-0.15498296916484833\n",
      "   -0.4830 if cv>=-1.0282196640968322\n",
      "   -1.3896 if cp>=-0.031829146295785905\n",
      "   +0.7734 if cp<=0.001615658774971964\n",
      "   -2.9579 if cv>=-0.9685938596725464\n",
      "Run episode 23 with rewards 12.0\n",
      "============ 24 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 1, 0, 0, 1]\n",
      "   -0.4645 if cv<=-0.15498296916484833\n",
      "   -0.0000 if cp>=-0.031829146295785905\n",
      "   -0.2564 if cp<=0.001615658774971964\n",
      "   +2.7659 if cv>=-0.9685938596725464\n",
      "   +3.0924 if cp<=-0.11080022305250167 & cv<=-0.897741675376892 & cv>=-0.9762959718704224\n",
      "--------------\n",
      "   +0.4645 if cv<=-0.15498296916484833\n",
      "   +0.0000 if cp>=-0.031829146295785905\n",
      "   +0.2564 if cp<=0.001615658774971964\n",
      "   -2.7659 if cv>=-0.9685938596725464\n",
      "   -3.0924 if cp<=-0.11080022305250167 & cv<=-0.897741675376892 & cv>=-0.9762959718704224\n",
      "Run episode 24 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 25 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0]\n",
      "   +0.5102 if cv<=-0.15498296916484833\n",
      "   +0.0902 if cp<=0.001615658774971964\n",
      "   +2.1867 if cv>=-0.9685938596725464\n",
      "   +0.0000 if cp<=-0.11080022305250167 & cv<=-0.897741675376892 & cv>=-0.9762959718704224\n",
      "   -0.9268 if cp>=-0.06092919930815697\n",
      "--------------\n",
      "   -0.5102 if cv<=-0.15498296916484833\n",
      "   -0.0902 if cp<=0.001615658774971964\n",
      "   -2.1867 if cv>=-0.9685938596725464\n",
      "   -0.0000 if cp<=-0.11080022305250167 & cv<=-0.897741675376892 & cv>=-0.9762959718704224\n",
      "   +0.9268 if cp>=-0.06092919930815697\n",
      "Run episode 25 with rewards 11.0\n",
      "============ 26 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0]\n",
      "   +0.5946 if cv<=-0.15498296916484833\n",
      "   +1.0713 if cp<=0.001615658774971964\n",
      "   +0.9650 if cv>=-0.9685938596725464\n",
      "   +0.8695 if cp>=-0.06092919930815697\n",
      "   -3.7584 if cp>=-0.1591801792383194 & cv<=-1.186832308769226\n",
      "--------------\n",
      "   -0.5946 if cv<=-0.15498296916484833\n",
      "   -1.0713 if cp<=0.001615658774971964\n",
      "   -0.9650 if cv>=-0.9685938596725464\n",
      "   -0.8694 if cp>=-0.06092919930815697\n",
      "   +3.7584 if cp>=-0.1591801792383194 & cv<=-1.186832308769226\n",
      "Run episode 26 with rewards 11.0\n",
      "============ 27 ===========\n",
      "12 actions [1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1]\n",
      "   +1.1888 if cp<=0.001615658774971964\n",
      "   +0.4756 if cv>=-0.9685938596725464\n",
      "   +0.6941 if cp>=-0.06092919930815697\n",
      "   -1.0371 if cp>=-0.1591801792383194 & cv<=-1.186832308769226\n",
      "   -0.7967 if cv<=-1.1849778890609741\n",
      "--------------\n",
      "   -1.1888 if cp<=0.001615658774971964\n",
      "   -0.4757 if cv>=-0.9685938596725464\n",
      "   -0.6941 if cp>=-0.06092919930815697\n",
      "   +1.0371 if cp>=-0.1591801792383194 & cv<=-1.186832308769226\n",
      "   +0.7967 if cv<=-1.1849778890609741\n",
      "Run episode 27 with rewards 12.0\n",
      "============ 28 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0754 if cp<=0.001615658774971964\n",
      "   +1.9430 if cp>=-0.06092919930815697\n",
      "   -1.6739 if cp>=-0.1591801792383194 & cv<=-1.186832308769226\n",
      "   -1.6739 if cv<=-1.1849778890609741\n",
      "   -3.1066 if cp>=0.044930972158908844 & cv>=-0.050052957981824735\n",
      "--------------\n",
      "   +0.0755 if cp<=0.001615658774971964\n",
      "   -1.9430 if cp>=-0.06092919930815697\n",
      "   +1.6739 if cp>=-0.1591801792383194 & cv<=-1.186832308769226\n",
      "   +1.6739 if cv<=-1.1849778890609741\n",
      "   +3.1066 if cp>=0.044930972158908844 & cv>=-0.050052957981824735\n",
      "Run episode 28 with rewards 8.0\n",
      "============ 29 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.4253 if cp>=-0.06092919930815697\n",
      "   +0.0000 if cp>=-0.1591801792383194 & cv<=-1.186832308769226\n",
      "   +0.0000 if cv<=-1.1849778890609741\n",
      "   -1.4253 if cp>=0.044930972158908844 & cv>=-0.050052957981824735\n",
      "   -0.6004 if cp>=0.05212235227227211\n",
      "--------------\n",
      "   +1.4253 if cp>=-0.06092919930815697\n",
      "   -0.0000 if cp>=-0.1591801792383194 & cv<=-1.186832308769226\n",
      "   -0.0000 if cv<=-1.1849778890609741\n",
      "   +1.4253 if cp>=0.044930972158908844 & cv>=-0.050052957981824735\n",
      "   +0.6004 if cp>=0.05212235227227211\n",
      "Run episode 29 with rewards 9.0\n",
      "============ 30 ===========\n",
      "12 actions [1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8595 if cp>=-0.06092919930815697\n",
      "   -0.0000 if cp>=-0.1591801792383194 & cv<=-1.186832308769226\n",
      "   -0.8595 if cp>=0.044930972158908844 & cv>=-0.050052957981824735\n",
      "   -0.2655 if cp>=0.05212235227227211\n",
      "   -0.3736 if cp<=0.04816343188285828\n",
      "--------------\n",
      "   +0.8595 if cp>=-0.06092919930815697\n",
      "   +0.0000 if cv<=-1.1849778890609741\n",
      "   +0.8595 if cp>=0.044930972158908844 & cv>=-0.050052957981824735\n",
      "   +0.2655 if cp>=0.05212235227227211\n",
      "   +0.3736 if cp<=0.04816343188285828\n",
      "Run episode 30 with rewards 12.0\n",
      "============ 31 ===========\n",
      "16 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0]\n",
      "   -1.2966 if cp>=-0.06092919930815697\n",
      "   -0.6369 if cp>=0.044930972158908844 & cv>=-0.050052957981824735\n",
      "   -0.6369 if cp>=0.05212235227227211\n",
      "   -0.6597 if cp<=0.04816343188285828\n",
      "   +4.9549 if cp<=0.030089328065514565 & cv>=0.18910401463508605\n",
      "--------------\n",
      "   +1.2966 if cp>=-0.06092919930815697\n",
      "   +0.6369 if cp>=0.044930972158908844 & cv>=-0.050052957981824735\n",
      "   +0.6369 if cp>=0.05212235227227211\n",
      "   +0.6597 if cp<=0.04816343188285828\n",
      "   -4.9550 if cp<=0.030089328065514565 & cv>=0.18910401463508605\n",
      "Run episode 31 with rewards 16.0\n",
      "============ 32 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -1.2238 if cp>=-0.06092919930815697\n",
      "   -0.0000 if cp>=0.044930972158908844 & cv>=-0.050052957981824735\n",
      "   -1.2238 if cp<=0.04816343188285828\n",
      "   +2.4394 if cp<=0.030089328065514565 & cv>=0.18910401463508605\n",
      "   +1.2889 if pav<=-0.4411633908748626\n",
      "--------------\n",
      "   +1.2238 if cp>=-0.06092919930815697\n",
      "   +0.0000 if cp>=0.05212235227227211\n",
      "   +1.2238 if cp<=0.04816343188285828\n",
      "   -2.4394 if cp<=0.030089328065514565 & cv>=0.18910401463508605\n",
      "   -1.2889 if pav<=-0.4411633908748626\n",
      "Run episode 32 with rewards 8.0\n",
      "============ 33 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -1.1937 if cp>=-0.06092919930815697\n",
      "   -0.9938 if cp<=0.04816343188285828\n",
      "   +0.0000 if cp<=0.030089328065514565 & cv>=0.18910401463508605\n",
      "   -0.7468 if pav<=-0.4411633908748626\n",
      "   +2.5115 if cp>=0.08136449456214906\n",
      "--------------\n",
      "   +1.1937 if cp>=-0.06092919930815697\n",
      "   +0.9938 if cp<=0.04816343188285828\n",
      "   -0.0000 if cp<=0.030089328065514565 & cv>=0.18910401463508605\n",
      "   +0.7468 if pav<=-0.4411633908748626\n",
      "   -2.5114 if cp>=0.08136449456214906\n",
      "Run episode 33 with rewards 9.0\n",
      "============ 34 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -0.6579 if cp>=-0.06092919930815697\n",
      "   -1.3378 if cp<=0.04816343188285828\n",
      "   +0.1341 if pav<=-0.4411633908748626\n",
      "   +1.3529 if cp>=0.08136449456214906\n",
      "   +0.3026 if cp>=0.11645765602588654\n",
      "--------------\n",
      "   +0.6579 if cp>=-0.06092919930815697\n",
      "   +1.3378 if cp<=0.04816343188285828\n",
      "   -0.1341 if pav<=-0.4411633908748626\n",
      "   -1.3529 if cp>=0.08136449456214906\n",
      "   -0.3026 if cp>=0.11645765602588654\n",
      "Run episode 34 with rewards 10.0\n",
      "============ 35 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2475 if cp>=-0.06092919930815697\n",
      "   -1.2876 if cp<=0.04816343188285828\n",
      "   +0.8137 if cp>=0.08136449456214906\n",
      "   -0.0000 if cp>=0.11645765602588654\n",
      "   -0.6336 if cp<=-0.01644002106040716\n",
      "--------------\n",
      "   +1.2475 if cp>=-0.06092919930815697\n",
      "   +1.2876 if cp<=0.04816343188285828\n",
      "   -0.8137 if cp>=0.08136449456214906\n",
      "   -0.0000 if cp>=0.11645765602588654\n",
      "   +0.6336 if cp<=-0.01644002106040716\n",
      "Run episode 35 with rewards 10.0\n",
      "============ 36 ===========\n",
      "12 actions [1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1]\n",
      "   -1.9252 if cp>=-0.06092919930815697\n",
      "   -0.7499 if cp<=0.04816343188285828\n",
      "   -0.7010 if cp>=0.08136449456214906\n",
      "   +0.0000 if cp<=-0.01644002106040716\n",
      "   -0.0818 if cp>=0.1387488842010498\n",
      "--------------\n",
      "   +1.9252 if cp>=-0.06092919930815697\n",
      "   +0.7499 if cp<=0.04816343188285828\n",
      "   +0.7010 if cp>=0.08136449456214906\n",
      "   -0.0000 if cp<=-0.01644002106040716\n",
      "   +0.0819 if cp>=0.1387488842010498\n",
      "Run episode 36 with rewards 12.0\n",
      "============ 37 ===========\n",
      "12 actions [1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0]\n",
      "   -0.9635 if cp>=-0.06092919930815697\n",
      "   +0.1305 if cp<=0.04816343188285828\n",
      "   -2.6563 if cp>=0.08136449456214906\n",
      "   -0.0000 if cp>=0.1387488842010498\n",
      "   +4.6582 if cv>=0.8908948779106143\n",
      "--------------\n",
      "   +0.9635 if cp>=-0.06092919930815697\n",
      "   -0.1305 if cp<=0.04816343188285828\n",
      "   +2.6563 if cp>=0.08136449456214906\n",
      "   -0.0000 if cp>=0.1387488842010498\n",
      "   -4.6582 if cv>=0.8908948779106143\n",
      "Run episode 37 with rewards 12.0\n",
      "============ 38 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1800 if cp>=-0.06092919930815697\n",
      "   -1.2015 if cp<=0.04816343188285828\n",
      "   +0.9511 if cp>=0.08136449456214906\n",
      "   +1.3632 if cv>=0.8908948779106143\n",
      "   +4.9750 if pa>=-0.018662821501493454\n",
      "--------------\n",
      "   +1.1800 if cp>=-0.06092919930815697\n",
      "   +1.2015 if cp<=0.04816343188285828\n",
      "   -0.9511 if cp>=0.08136449456214906\n",
      "   -1.3631 if cv>=0.8908948779106143\n",
      "   -4.9750 if pa>=-0.018662821501493454\n",
      "Run episode 38 with rewards 8.0\n",
      "============ 39 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.3008 if cp>=-0.06092919930815697\n",
      "   -1.0008 if cp<=0.04816343188285828\n",
      "   -0.5747 if cv>=0.8908948779106143\n",
      "   +0.0000 if pa>=-0.018662821501493454\n",
      "   -0.3126 if cp<=-0.017852361127734185\n",
      "--------------\n",
      "   +1.3008 if cp>=-0.06092919930815697\n",
      "   +1.0008 if cp<=0.04816343188285828\n",
      "   +0.5746 if cv>=0.8908948779106143\n",
      "   +0.0000 if pa>=-0.018662821501493454\n",
      "   +0.3126 if cp<=-0.017852361127734185\n",
      "Run episode 39 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 40 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.6923 if cp>=-0.06092919930815697\n",
      "   -0.8326 if cp<=0.04816343188285828\n",
      "   -0.4327 if cv>=0.8908948779106143\n",
      "   +0.0000 if cp<=-0.017852361127734185\n",
      "   -0.7333 if cp<=0.11994099020957948 & cp>=0.051053491234779355\n",
      "--------------\n",
      "   +1.6923 if cp>=-0.06092919930815697\n",
      "   +0.8327 if cp<=0.04816343188285828\n",
      "   +0.4327 if cv>=0.8908948779106143\n",
      "   +0.0000 if cp<=-0.017852361127734185\n",
      "   +0.7333 if cp<=0.11994099020957948 & cp>=0.051053491234779355\n",
      "Run episode 40 with rewards 9.0\n",
      "============ 41 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1445 if cp>=-0.06092919930815697\n",
      "   -0.9724 if cp<=0.04816343188285828\n",
      "   -0.2684 if cv>=0.8908948779106143\n",
      "   -0.0253 if cp<=0.11994099020957948 & cp>=0.051053491234779355\n",
      "   -0.3543 if cp<=-0.02527914009988308\n",
      "--------------\n",
      "   +1.1444 if cp>=-0.06092919930815697\n",
      "   +0.9724 if cp<=0.04816343188285828\n",
      "   +0.2684 if cv>=0.8908948779106143\n",
      "   +0.0253 if cp<=0.11994099020957948 & cp>=0.051053491234779355\n",
      "   +0.3543 if cp<=-0.02527914009988308\n",
      "Run episode 41 with rewards 9.0\n",
      "============ 42 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.5107 if cp>=-0.06092919930815697\n",
      "   -1.0444 if cp<=0.04816343188285828\n",
      "   -0.5162 if cv>=0.8908948779106143\n",
      "   +0.0000 if cp<=-0.02527914009988308\n",
      "   -0.0531 if cp>=0.10773805528879166\n",
      "--------------\n",
      "   +1.5107 if cp>=-0.06092919930815697\n",
      "   +1.0444 if cp<=0.04816343188285828\n",
      "   +0.5162 if cv>=0.8908948779106143\n",
      "   +0.0000 if cp<=-0.02527914009988308\n",
      "   +0.0531 if cp>=0.10773805528879166\n",
      "Run episode 42 with rewards 9.0\n",
      "============ 43 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1566 if cp>=-0.06092919930815697\n",
      "   -0.9473 if cp<=0.04816343188285828\n",
      "   -0.2940 if cv>=0.8908948779106143\n",
      "   +0.0000 if cp>=0.10773805528879166\n",
      "   -0.3499 if cp<=-0.00816472051665187\n",
      "--------------\n",
      "   +1.1566 if cp>=-0.06092919930815697\n",
      "   +0.9473 if cp<=0.04816343188285828\n",
      "   +0.2940 if cv>=0.8908948779106143\n",
      "   +0.0000 if cp>=0.10773805528879166\n",
      "   +0.3499 if cp<=-0.00816472051665187\n",
      "Run episode 43 with rewards 10.0\n",
      "============ 44 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1837 if cp>=-0.06092919930815697\n",
      "   -0.9034 if cp<=0.04816343188285828\n",
      "   -0.5151 if cv>=0.8908948779106143\n",
      "   -0.6685 if cp<=-0.00816472051665187\n",
      "   -0.0693 if cp>=0.10396123677492142\n",
      "--------------\n",
      "   +1.1837 if cp>=-0.06092919930815697\n",
      "   +0.9034 if cp<=0.04816343188285828\n",
      "   +0.5151 if cv>=0.8908948779106143\n",
      "   +0.6685 if cp<=-0.00816472051665187\n",
      "   +0.0693 if cp>=0.10396123677492142\n",
      "Run episode 44 with rewards 9.0\n",
      "============ 45 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.4288 if cp>=-0.06092919930815697\n",
      "   -1.0205 if cp<=0.04816343188285828\n",
      "   -0.4555 if cv>=0.8908948779106143\n",
      "   -0.1336 if cp<=-0.00816472051665187\n",
      "   -0.0429 if cp>=0.10776353627443314\n",
      "--------------\n",
      "   +1.4288 if cp>=-0.06092919930815697\n",
      "   +1.0206 if cp<=0.04816343188285828\n",
      "   +0.4555 if cv>=0.8908948779106143\n",
      "   +0.1335 if cp<=-0.00816472051665187\n",
      "   +0.0429 if cp>=0.10776353627443314\n",
      "Run episode 45 with rewards 8.0\n",
      "============ 46 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1428 if cp>=-0.06092919930815697\n",
      "   -0.9011 if cp<=0.04816343188285828\n",
      "   -0.2863 if cv>=0.8908948779106143\n",
      "   +0.0000 if cp<=-0.00816472051665187\n",
      "   -0.3598 if cp<=0.0002708058338612323\n",
      "--------------\n",
      "   +1.1428 if cp>=-0.06092919930815697\n",
      "   +0.9012 if cp<=0.04816343188285828\n",
      "   +0.2863 if cv>=0.8908948779106143\n",
      "   +0.0000 if cp<=-0.00816472051665187\n",
      "   +0.3598 if cp<=0.0002708058338612323\n",
      "Run episode 46 with rewards 9.0\n",
      "============ 47 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1454 if cp>=-0.06092919930815697\n",
      "   -0.8402 if cp<=0.04816343188285828\n",
      "   -0.4713 if cv>=0.8908948779106143\n",
      "   -0.6741 if cp<=0.0002708058338612323\n",
      "   -0.0740 if cp>=0.07781381905078888\n",
      "--------------\n",
      "   +1.1454 if cp>=-0.06092919930815697\n",
      "   +0.8402 if cp<=0.04816343188285828\n",
      "   +0.4713 if cv>=0.8908948779106143\n",
      "   +0.6741 if cp<=0.0002708058338612323\n",
      "   +0.0740 if cp>=0.07781381905078888\n",
      "Run episode 47 with rewards 9.0\n",
      "============ 48 ===========\n",
      "11 actions [0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   -1.0675 if cp>=-0.06092919930815697\n",
      "   -0.7924 if cp<=0.04816343188285828\n",
      "   -0.4449 if cv>=0.8908948779106143\n",
      "   -0.6225 if cp<=0.0002708058338612323\n",
      "   -0.0631 if cp>=0.0877842977643013\n",
      "--------------\n",
      "   +1.0675 if cp>=-0.06092919930815697\n",
      "   +0.7924 if cp<=0.04816343188285828\n",
      "   +0.4449 if cv>=0.8908948779106143\n",
      "   +0.6225 if cp<=0.0002708058338612323\n",
      "   +0.0631 if cp>=0.0877842977643013\n",
      "Run episode 48 with rewards 11.0\n",
      "============ 49 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1]\n",
      "   +2.2171 if cp>=-0.06092919930815697\n",
      "   -0.7915 if cp<=0.04816343188285828\n",
      "   +1.3888 if cv>=0.8908948779106143\n",
      "   +0.8283 if cp<=0.0002708058338612323\n",
      "   -2.9390 if cv>=0.023687930777668953\n",
      "--------------\n",
      "   -2.2171 if cp>=-0.06092919930815697\n",
      "   +0.7915 if cp<=0.04816343188285828\n",
      "   -1.3888 if cv>=0.8908948779106143\n",
      "   -0.8283 if cp<=0.0002708058338612323\n",
      "   +2.9390 if cv>=0.023687930777668953\n",
      "Run episode 49 with rewards 11.0\n",
      "============ 50 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +3.1725 if cp>=-0.06092919930815697\n",
      "   -0.0000 if cv>=0.8908948779106143\n",
      "   -1.6670 if cp<=0.0002708058338612323\n",
      "   -0.0000 if cv>=0.023687930777668953\n",
      "   +2.9939 if cp<=-0.1164289116859436 & cv>=-0.606419563293457\n",
      "--------------\n",
      "   -3.1725 if cp>=-0.06092919930815697\n",
      "   +0.0000 if cv>=0.8908948779106143\n",
      "   +1.6670 if cp<=0.0002708058338612323\n",
      "   +0.0000 if cv>=0.023687930777668953\n",
      "   -2.9939 if cp<=-0.1164289116859436 & cv>=-0.606419563293457\n",
      "Run episode 50 with rewards 10.0\n",
      "============ 51 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +1.8110 if cp>=-0.06092919930815697\n",
      "   +0.2467 if cp<=0.0002708058338612323\n",
      "   +0.0000 if cv>=0.023687930777668953\n",
      "   +0.0000 if cp<=-0.1164289116859436 & cv>=-0.606419563293457\n",
      "   -0.7224 if cp<=-0.060197605192661284\n",
      "--------------\n",
      "   -1.8110 if cp>=-0.06092919930815697\n",
      "   -0.2467 if cp<=0.0002708058338612323\n",
      "   +0.0000 if cv>=0.023687930777668953\n",
      "   +0.0000 if cp<=-0.1164289116859436 & cv>=-0.606419563293457\n",
      "   +0.7224 if cp<=-0.060197605192661284\n",
      "Run episode 51 with rewards 9.0\n",
      "============ 52 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +2.2285 if cp>=-0.06092919930815697\n",
      "   -0.2520 if cp<=0.0002708058338612323\n",
      "   +0.0000 if cp<=-0.1164289116859436 & cv>=-0.606419563293457\n",
      "   -0.8695 if cp<=-0.060197605192661284\n",
      "   -0.5400 if pav>=2.176384210586548\n",
      "--------------\n",
      "   -2.2285 if cp>=-0.06092919930815697\n",
      "   +0.2520 if cp<=0.0002708058338612323\n",
      "   +0.0000 if cp<=-0.1164289116859436 & cv>=-0.606419563293457\n",
      "   +0.8695 if cp<=-0.060197605192661284\n",
      "   +0.5400 if pav>=2.176384210586548\n",
      "Run episode 52 with rewards 9.0\n",
      "============ 53 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +1.7175 if cp>=-0.06092919930815697\n",
      "   +0.6094 if cp<=0.0002708058338612323\n",
      "   -1.1081 if cp<=-0.060197605192661284\n",
      "   +0.0000 if pav>=2.176384210586548\n",
      "   -0.2605 if pa>=0.18819184601306915\n",
      "--------------\n",
      "   -1.7175 if cp>=-0.06092919930815697\n",
      "   -0.6094 if cp<=0.0002708058338612323\n",
      "   +1.1081 if cp<=-0.060197605192661284\n",
      "   +0.0000 if pav>=2.176384210586548\n",
      "   +0.2605 if pa>=0.18819184601306915\n",
      "Run episode 53 with rewards 12.0\n",
      "============ 54 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   +2.6264 if cp>=-0.06092919930815697\n",
      "   -0.7711 if cp<=0.0002708058338612323\n",
      "   -1.7338 if cp<=-0.060197605192661284\n",
      "   -0.0526 if pa>=0.18819184601306915\n",
      "   -0.4774 if cp<=-0.1085894837975502\n",
      "--------------\n",
      "   -2.6264 if cp>=-0.06092919930815697\n",
      "   +0.7711 if cp<=0.0002708058338612323\n",
      "   +1.7338 if cp<=-0.060197605192661284\n",
      "   +0.0525 if pa>=0.18819184601306915\n",
      "   +0.4774 if cp<=-0.1085894837975502\n",
      "Run episode 54 with rewards 11.0\n",
      "============ 55 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +2.0669 if cp>=-0.06092919930815697\n",
      "   +0.3426 if cp<=0.0002708058338612323\n",
      "   -0.8808 if cp<=-0.060197605192661284\n",
      "   -0.1570 if cp<=-0.1085894837975502\n",
      "   -0.2446 if cv<=-1.0073978900909424\n",
      "--------------\n",
      "   -2.0669 if cp>=-0.06092919930815697\n",
      "   -0.3426 if cp<=0.0002708058338612323\n",
      "   +0.8808 if cp<=-0.060197605192661284\n",
      "   +0.1570 if cp<=-0.1085894837975502\n",
      "   +0.2446 if cv<=-1.0073978900909424\n",
      "Run episode 55 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 56 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.9360 if cp>=-0.06092919930815697\n",
      "   +0.0214 if cp<=0.0002708058338612323\n",
      "   -0.3714 if cp<=-0.060197605192661284\n",
      "   -0.1267 if cv<=-1.0073978900909424\n",
      "   +0.5507 if cp>=0.03463598936796188\n",
      "--------------\n",
      "   -1.9360 if cp>=-0.06092919930815697\n",
      "   -0.0214 if cp<=0.0002708058338612323\n",
      "   +0.3714 if cp<=-0.060197605192661284\n",
      "   +0.1267 if cv<=-1.0073978900909424\n",
      "   -0.5507 if cp>=0.03463598936796188\n",
      "Run episode 56 with rewards 9.0\n",
      "============ 57 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.7530 if cp>=-0.06092919930815697\n",
      "   +0.5330 if cp<=-0.060197605192661284\n",
      "   +0.7148 if cv<=-1.0073978900909424\n",
      "   +0.0000 if cp>=0.03463598936796188\n",
      "   +0.9189 if cp>=0.017563362605869777\n",
      "--------------\n",
      "   -1.7530 if cp>=-0.06092919930815697\n",
      "   -0.5330 if cp<=-0.060197605192661284\n",
      "   -0.7148 if cv<=-1.0073978900909424\n",
      "   -0.0000 if cp>=0.03463598936796188\n",
      "   -0.9189 if cp>=0.017563362605869777\n",
      "Run episode 57 with rewards 9.0\n",
      "============ 58 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.1268 if cp>=-0.06092919930815697\n",
      "   +0.5793 if cp<=-0.060197605192661284\n",
      "   +0.5793 if cv<=-1.0073978900909424\n",
      "   +0.0000 if cp>=0.017563362605869777\n",
      "   +0.8219 if cp<=-0.03141929954290389\n",
      "--------------\n",
      "   -2.1268 if cp>=-0.06092919930815697\n",
      "   -0.5793 if cp<=-0.060197605192661284\n",
      "   -0.5793 if cv<=-1.0073978900909424\n",
      "   +0.0000 if cp>=0.017563362605869777\n",
      "   -0.8220 if cp<=-0.03141929954290389\n",
      "Run episode 58 with rewards 9.0\n",
      "============ 59 ===========\n",
      "11 actions [0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.8320 if cp>=-0.06092919930815697\n",
      "   +0.3776 if cp<=-0.060197605192661284\n",
      "   +0.3776 if cv<=-1.0073978900909424\n",
      "   +0.4663 if cp<=-0.03141929954290389\n",
      "   +0.4663 if cp<=-0.028056500107049933\n",
      "--------------\n",
      "   -1.8320 if cp>=-0.06092919930815697\n",
      "   -0.3776 if cp<=-0.060197605192661284\n",
      "   -0.3776 if cv<=-1.0073978900909424\n",
      "   -0.4663 if cp<=-0.03141929954290389\n",
      "   -0.4663 if cp<=-0.028056500107049933\n",
      "Run episode 59 with rewards 11.0\n",
      "============ 60 ===========\n",
      "11 actions [0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -2.5776 if cp>=-0.06092919930815697\n",
      "   +0.1427 if cp<=-0.060197605192661284\n",
      "   +0.8969 if cp<=-0.03141929954290389\n",
      "   +2.6885 if cp<=-0.028056500107049933\n",
      "   +3.8538 if cv>=-0.22420302033424377\n",
      "--------------\n",
      "   +2.5790 if cp>=-0.06092919930815697\n",
      "   -0.0709 if cv<=-1.0073978900909424\n",
      "   -0.9045 if cp<=-0.03141929954290389\n",
      "   -2.6922 if cp<=-0.028056500107049933\n",
      "   -3.8549 if cv>=-0.22420302033424377\n",
      "Run episode 60 with rewards 11.0\n",
      "============ 61 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7812 if cp>=-0.06092919930815697\n",
      "   +1.3380 if cp<=-0.03141929954290389\n",
      "   +1.3605 if cp<=-0.028056500107049933\n",
      "   +1.6230 if cv>=-0.22420302033424377\n",
      "   -0.7213 if cp<=-0.021535539999604225\n",
      "--------------\n",
      "   -0.7846 if cp>=-0.06092919930815697\n",
      "   -1.3388 if cp<=-0.03141929954290389\n",
      "   -1.3614 if cp<=-0.028056500107049933\n",
      "   -1.6208 if cv>=-0.22420302033424377\n",
      "   +0.7241 if cp<=-0.021535539999604225\n",
      "Run episode 61 with rewards 9.0\n",
      "============ 62 ===========\n",
      "12 actions [0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.3003 if cp>=-0.06092919930815697\n",
      "   +1.0246 if cp<=-0.03141929954290389\n",
      "   +1.0246 if cp<=-0.028056500107049933\n",
      "   +0.0595 if cv>=-0.22420302033424377\n",
      "   +0.1049 if cp<=-0.10825576335191726\n",
      "--------------\n",
      "   -0.3008 if cp>=-0.06092919930815697\n",
      "   -1.0244 if cp<=-0.03141929954290389\n",
      "   -1.0244 if cp<=-0.028056500107049933\n",
      "   -0.0595 if cv>=-0.22420302033424377\n",
      "   -0.1048 if cp<=-0.10825576335191726\n",
      "Run episode 62 with rewards 12.0\n",
      "============ 63 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0]\n",
      "   +2.4605 if cp>=-0.06092919930815697\n",
      "   +0.6962 if cp<=-0.03141929954290389\n",
      "   +0.8945 if cp<=-0.028056500107049933\n",
      "   +0.1305 if cp<=-0.10825576335191726\n",
      "   -4.6626 if cp>=-0.01900034099817276 & cv<=-0.2032691389322281\n",
      "--------------\n",
      "   -2.4609 if cp>=-0.06092919930815697\n",
      "   -0.6961 if cp<=-0.03141929954290389\n",
      "   -0.8944 if cp<=-0.028056500107049933\n",
      "   -0.1304 if cp<=-0.10825576335191726\n",
      "   +4.6626 if cp>=-0.01900034099817276 & cv<=-0.2032691389322281\n",
      "Run episode 63 with rewards 11.0\n",
      "============ 64 ===========\n",
      "12 actions [1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1]\n",
      "   +0.4296 if cp>=-0.06092919930815697\n",
      "   +0.5638 if cp<=-0.03141929954290389\n",
      "   +0.5638 if cp<=-0.028056500107049933\n",
      "   -0.0000 if cp>=-0.01900034099817276 & cv<=-0.2032691389322281\n",
      "   -3.7889 if cp>=-0.09550245106220245 & pav>=1.4577392339706423\n",
      "--------------\n",
      "   -0.4298 if cp>=-0.06092919930815697\n",
      "   -0.5637 if cp<=-0.03141929954290389\n",
      "   -0.5637 if cp<=-0.028056500107049933\n",
      "   -0.0000 if cp>=-0.01900034099817276 & cv<=-0.2032691389322281\n",
      "   +3.7889 if cp>=-0.09550245106220245 & pav>=1.4577392339706423\n",
      "Run episode 64 with rewards 12.0\n",
      "============ 65 ===========\n",
      "38 actions [0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0]\n",
      "   +0.9208 if cp>=-0.06092919930815697\n",
      "   -0.1832 if cp<=-0.03141929954290389\n",
      "   -0.1832 if cp<=-0.028056500107049933\n",
      "   -0.5791 if cp>=-0.09550245106220245 & pav>=1.4577392339706423\n",
      "   -3.2438 if cp>=0.03882381096482278 & cv<=-0.29263252317905397\n",
      "--------------\n",
      "   -0.9209 if cp>=-0.06092919930815697\n",
      "   +0.1832 if cp<=-0.03141929954290389\n",
      "   +0.1832 if cp<=-0.028056500107049933\n",
      "   +0.5791 if cp>=-0.09550245106220245 & pav>=1.4577392339706423\n",
      "   +3.2439 if cp>=0.03882381096482278 & cv<=-0.29263252317905397\n",
      "Run episode 65 with rewards 38.0\n",
      "============ 66 ===========\n",
      "30 actions [1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]\n",
      "   +0.5065 if cp>=-0.06092919930815697\n",
      "   -1.5051 if cp<=-0.028056500107049933\n",
      "   -1.6610 if cp>=-0.09550245106220245 & pav>=1.4577392339706423\n",
      "   -0.0000 if cp>=0.03882381096482278 & cv<=-0.29263252317905397\n",
      "   +2.1229 if cp<=-0.03771157860755921 & pa<=0.14968046247959138 & pav<=0.03948571011424065\n",
      "--------------\n",
      "   -0.5066 if cp>=-0.06092919930815697\n",
      "   +1.5052 if cp<=-0.028056500107049933\n",
      "   +1.6609 if cp>=-0.09550245106220245 & pav>=1.4577392339706423\n",
      "   -0.0000 if cp>=0.03882381096482278 & cv<=-0.29263252317905397\n",
      "   -2.1229 if cp<=-0.03771157860755921 & pa<=0.14968046247959138 & pav<=0.03948571011424065\n",
      "Run episode 66 with rewards 30.0\n",
      "============ 67 ===========\n",
      "12 actions [0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   +1.1633 if cp>=-0.06092919930815697\n",
      "   -3.6093 if cp<=-0.028056500107049933\n",
      "   -1.2312 if cp>=-0.09550245106220245 & pav>=1.4577392339706423\n",
      "   -0.0000 if cp<=-0.03771157860755921 & pa<=0.14968046247959138 & pav<=0.03948571011424065\n",
      "   +7.1183 if cp<=-0.06243328601121902 & cv>=-0.09947531446814514 & pa<=0.15227958261966706\n",
      "--------------\n",
      "   -1.1634 if cp>=-0.06092919930815697\n",
      "   +3.6093 if cp<=-0.028056500107049933\n",
      "   +1.2312 if cp>=-0.09550245106220245 & pav>=1.4577392339706423\n",
      "   +0.0000 if cp<=-0.03771157860755921 & pa<=0.14968046247959138 & pav<=0.03948571011424065\n",
      "   -7.1183 if cp<=-0.06243328601121902 & cv>=-0.09947531446814514 & pa<=0.15227958261966706\n",
      "Run episode 67 with rewards 12.0\n",
      "============ 68 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0]\n",
      "   +2.0418 if cp>=-0.06092919930815697\n",
      "   -1.0289 if cp<=-0.028056500107049933\n",
      "   +0.1771 if cp>=-0.09550245106220245 & pav>=1.4577392339706423\n",
      "   +0.0000 if cp<=-0.06243328601121902 & cv>=-0.09947531446814514 & pa<=0.15227958261966706\n",
      "   -4.9709 if cp>=0.04676826670765877\n",
      "--------------\n",
      "   -2.0419 if cp>=-0.06092919930815697\n",
      "   +1.0288 if cp<=-0.028056500107049933\n",
      "   -0.1772 if cp>=-0.09550245106220245 & pav>=1.4577392339706423\n",
      "   +0.0000 if cp<=-0.06243328601121902 & cv>=-0.09947531446814514 & pa<=0.15227958261966706\n",
      "   +4.9708 if cp>=0.04676826670765877\n",
      "Run episode 68 with rewards 11.0\n",
      "============ 69 ===========\n",
      "42 actions [0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0]\n",
      "   +2.7510 if cp>=-0.06092919930815697\n",
      "   -0.6398 if cp<=-0.028056500107049933\n",
      "   -0.5086 if cp>=-0.09550245106220245 & pav>=1.4577392339706423\n",
      "   -0.0000 if cp>=0.04676826670765877\n",
      "   +1.2616 if pa>=0.19209958612918854\n",
      "--------------\n",
      "   -2.7511 if cp>=-0.06092919930815697\n",
      "   +0.6398 if cp<=-0.028056500107049933\n",
      "   +0.5086 if cp>=-0.09550245106220245 & pav>=1.4577392339706423\n",
      "   -0.0000 if cp>=0.04676826670765877\n",
      "   -1.2616 if pa>=0.19209958612918854\n",
      "Run episode 69 with rewards 42.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 70 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   +6.0068 if cp>=-0.06092919930815697\n",
      "   -0.3912 if cp<=-0.028056500107049933\n",
      "   +0.1081 if cp>=-0.09550245106220245 & pav>=1.4577392339706423\n",
      "   +0.5979 if pa>=0.19209958612918854\n",
      "   -2.8765 if cp>=-0.10255458205938339\n",
      "--------------\n",
      "   -6.0069 if cp>=-0.06092919930815697\n",
      "   +0.3911 if cp<=-0.028056500107049933\n",
      "   -0.1075 if cp>=-0.09550245106220245 & pav>=1.4577392339706423\n",
      "   -0.5956 if pa>=0.19209958612918854\n",
      "   +2.8764 if cp>=-0.10255458205938339\n",
      "Run episode 70 with rewards 9.0\n",
      "============ 71 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 1, 1, 1, 0, 1]\n",
      "   +1.1484 if cp>=-0.06092919930815697\n",
      "   -0.5864 if cp<=-0.028056500107049933\n",
      "   -0.5692 if pa>=0.19209958612918854\n",
      "   +0.6499 if cp>=-0.10255458205938339\n",
      "   -0.2747 if pav>=1.8594632148742676\n",
      "--------------\n",
      "   -1.1484 if cp>=-0.06092919930815697\n",
      "   +0.5868 if cp<=-0.028056500107049933\n",
      "   +0.5697 if pa>=0.19209958612918854\n",
      "   -0.6499 if cp>=-0.10255458205938339\n",
      "   +0.2747 if pav>=1.8594632148742676\n",
      "Run episode 71 with rewards 10.0\n",
      "============ 72 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1]\n",
      "   +1.6785 if cp>=-0.06092919930815697\n",
      "   -1.5966 if cp<=-0.028056500107049933\n",
      "   -0.2738 if pa>=0.19209958612918854\n",
      "   +0.4453 if cp>=-0.10255458205938339\n",
      "   -3.0786 if pav>=1.5738029479980469\n",
      "--------------\n",
      "   -1.6786 if cp>=-0.06092919930815697\n",
      "   +1.5969 if cp<=-0.028056500107049933\n",
      "   +0.2740 if pa>=0.19209958612918854\n",
      "   -0.4452 if cp>=-0.10255458205938339\n",
      "   +3.0786 if pav>=1.5738029479980469\n",
      "Run episode 72 with rewards 11.0\n",
      "============ 73 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 1, 0]\n",
      "   +0.8967 if cp>=-0.06092919930815697\n",
      "   +0.2702 if cp<=-0.028056500107049933\n",
      "   +0.8445 if cp>=-0.10255458205938339\n",
      "   -2.4294 if pav>=1.5738029479980469\n",
      "   +0.5570 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "--------------\n",
      "   -0.8967 if cp>=-0.06092919930815697\n",
      "   -0.2701 if cp<=-0.028056500107049933\n",
      "   -0.8445 if cp>=-0.10255458205938339\n",
      "   +2.4294 if pav>=1.5738029479980469\n",
      "   -0.5570 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "Run episode 73 with rewards 9.0\n",
      "============ 74 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 1, 1, 0, 1]\n",
      "   +0.5121 if cp>=-0.06092919930815697\n",
      "   +0.3100 if cp>=-0.10255458205938339\n",
      "   -1.0902 if pav>=1.5738029479980469\n",
      "   +0.6284 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   +1.3254 if cv>=-0.9956066370010376\n",
      "--------------\n",
      "   -0.5121 if cp>=-0.06092919930815697\n",
      "   -0.3100 if cp>=-0.10255458205938339\n",
      "   +1.0902 if pav>=1.5738029479980469\n",
      "   -0.6284 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   -1.3253 if cv>=-0.9956066370010376\n",
      "Run episode 74 with rewards 10.0\n",
      "============ 75 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 1, 1, 0, 1]\n",
      "   +0.4637 if cp>=-0.06092919930815697\n",
      "   -1.4102 if pav>=1.5738029479980469\n",
      "   +0.7578 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   +1.4220 if cv>=-0.9956066370010376\n",
      "   -0.6378 if pav>=1.84544038772583\n",
      "--------------\n",
      "   -0.4637 if cp>=-0.06092919930815697\n",
      "   +1.4102 if pav>=1.5738029479980469\n",
      "   -0.7577 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   -1.4219 if cv>=-0.9956066370010376\n",
      "   +0.6378 if pav>=1.84544038772583\n",
      "Run episode 75 with rewards 10.0\n",
      "============ 76 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1]\n",
      "   -2.1195 if pav>=1.5738029479980469\n",
      "   +1.2466 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   +0.2574 if cv>=-0.9956066370010376\n",
      "   -0.1502 if pav>=1.84544038772583\n",
      "   +0.5019 if cv>=-0.9391664624214172\n",
      "--------------\n",
      "   +2.1195 if pav>=1.5738029479980469\n",
      "   -1.2466 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   -0.2574 if cv>=-0.9956066370010376\n",
      "   +0.1501 if pav>=1.84544038772583\n",
      "   -0.5019 if cv>=-0.9391664624214172\n",
      "Run episode 76 with rewards 12.0\n",
      "============ 77 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 1, 0, 1, 0]\n",
      "   -1.8979 if pav>=1.5738029479980469\n",
      "   +1.7870 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   -1.0237 if cv>=-0.9956066370010376\n",
      "   +1.7870 if cv>=-0.9391664624214172\n",
      "   +1.9844 if cp<=-0.08726051449775696\n",
      "--------------\n",
      "   +1.8979 if pav>=1.5738029479980469\n",
      "   -1.7870 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   +1.0238 if cv>=-0.9956066370010376\n",
      "   -1.7870 if cv>=-0.9391664624214172\n",
      "   -1.9844 if cp<=-0.08726051449775696\n",
      "Run episode 77 with rewards 9.0\n",
      "============ 78 ===========\n",
      "13 actions [0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1]\n",
      "   -0.2110 if pav>=1.5738029479980469\n",
      "   +1.2824 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   +1.2824 if cv>=-0.9391664624214172\n",
      "   -0.0000 if cp<=-0.08726051449775696\n",
      "   -0.6117 if cp>=-0.0455000214278698\n",
      "--------------\n",
      "   +0.2110 if pav>=1.5738029479980469\n",
      "   -1.2824 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   -1.2824 if cv>=-0.9391664624214172\n",
      "   +0.0000 if cp<=-0.08726051449775696\n",
      "   +0.6117 if cp>=-0.0455000214278698\n",
      "Run episode 78 with rewards 13.0\n",
      "============ 79 ===========\n",
      "28 actions [0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0]\n",
      "   +1.2144 if pav>=1.5738029479980469\n",
      "   +1.2936 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   +1.2936 if cv>=-0.9391664624214172\n",
      "   -2.5015 if cp>=-0.0455000214278698\n",
      "   -2.0465 if cp<=-0.03797737807035445\n",
      "--------------\n",
      "   -1.2144 if pav>=1.5738029479980469\n",
      "   -1.2936 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   -1.2936 if cv>=-0.9391664624214172\n",
      "   +2.5015 if cp>=-0.0455000214278698\n",
      "   +2.0465 if cp<=-0.03797737807035445\n",
      "Run episode 79 with rewards 28.0\n",
      "============ 80 ===========\n",
      "32 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1]\n",
      "   -0.1106 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   -0.1106 if cv>=-0.9391664624214172\n",
      "   -0.5054 if cp>=-0.0455000214278698\n",
      "   +0.0160 if cp<=-0.03797737807035445\n",
      "   +1.5530 if cv>=-0.16748674511909484\n",
      "--------------\n",
      "   +0.1106 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   +0.1106 if cv>=-0.9391664624214172\n",
      "   +0.5054 if cp>=-0.0455000214278698\n",
      "   -0.0160 if cp<=-0.03797737807035445\n",
      "   -1.5530 if cv>=-0.16748674511909484\n",
      "Run episode 80 with rewards 32.0\n",
      "============ 81 ===========\n",
      "16 actions [0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   -1.1378 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   -1.1378 if cv>=-0.9391664624214172\n",
      "   -1.1378 if cp>=-0.0455000214278698\n",
      "   +3.8989 if cv>=-0.16748674511909484\n",
      "   +1.9897 if cv<=-0.18623730838298796\n",
      "--------------\n",
      "   +1.1378 if cp<=0.02591441199183464 & cv>=-0.930989682674408\n",
      "   +1.1378 if cv>=-0.9391664624214172\n",
      "   +1.1378 if cp>=-0.0455000214278698\n",
      "   -3.8989 if cv>=-0.16748674511909484\n",
      "   -1.9897 if cv<=-0.18623730838298796\n",
      "Run episode 81 with rewards 16.0\n",
      "============ 82 ===========\n",
      "50 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +2.2795 if cv>=-0.9391664624214172\n",
      "   -2.4778 if cp>=-0.0455000214278698\n",
      "   +3.6408 if cv>=-0.16748674511909484\n",
      "   -1.2832 if cv<=-0.18623730838298796\n",
      "   -3.3879 if cp<=-0.058242518454790115\n",
      "--------------\n",
      "   -2.2795 if cv>=-0.9391664624214172\n",
      "   +2.4778 if cp>=-0.0455000214278698\n",
      "   -3.6407 if cv>=-0.16748674511909484\n",
      "   +1.2832 if cv<=-0.18623730838298796\n",
      "   +3.3879 if cp<=-0.058242518454790115\n",
      "Run episode 82 with rewards 50.0\n",
      "============ 83 ===========\n",
      "16 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +1.5254 if cv>=-0.9391664624214172\n",
      "   -0.7407 if cp>=-0.0455000214278698\n",
      "   +2.5218 if cv>=-0.16748674511909484\n",
      "   -2.5498 if cp<=-0.058242518454790115\n",
      "   -4.9779 if cp>=-0.011460253037512297 & cv<=-0.026414439454674695\n",
      "--------------\n",
      "   -1.5254 if cv>=-0.9391664624214172\n",
      "   +0.7408 if cp>=-0.0455000214278698\n",
      "   -2.5218 if cv>=-0.16748674511909484\n",
      "   +2.5498 if cp<=-0.058242518454790115\n",
      "   +4.9779 if cp>=-0.011460253037512297 & cv<=-0.026414439454674695\n",
      "Run episode 83 with rewards 16.0\n",
      "============ 84 ===========\n",
      "17 actions [0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +2.2958 if cv>=-0.9391664624214172\n",
      "   +2.8454 if cv>=-0.16748674511909484\n",
      "   -4.1540 if cp<=-0.058242518454790115\n",
      "   -0.0000 if cp>=-0.011460253037512297 & cv<=-0.026414439454674695\n",
      "   +0.0103 if cp>=-0.02599506452679634\n",
      "--------------\n",
      "   -2.2958 if cv>=-0.9391664624214172\n",
      "   -2.8454 if cv>=-0.16748674511909484\n",
      "   +4.1539 if cp<=-0.058242518454790115\n",
      "   -0.0000 if cp>=-0.011460253037512297 & cv<=-0.026414439454674695\n",
      "   -0.0103 if cp>=-0.02599506452679634\n",
      "Run episode 84 with rewards 17.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 85 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +1.2098 if cv>=-0.9391664624214172\n",
      "   +3.5937 if cv>=-0.16748674511909484\n",
      "   -2.7756 if cp<=-0.058242518454790115\n",
      "   +0.0000 if cp>=-0.02599506452679634\n",
      "   +0.0025 if cp>=-0.04341575503349304\n",
      "--------------\n",
      "   -1.2098 if cv>=-0.9391664624214172\n",
      "   -3.5937 if cv>=-0.16748674511909484\n",
      "   +2.7755 if cp<=-0.058242518454790115\n",
      "   +0.0000 if cp>=-0.02599506452679634\n",
      "   -0.0025 if cp>=-0.04341575503349304\n",
      "Run episode 85 with rewards 10.0\n",
      "============ 86 ===========\n",
      "29 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   +1.0337 if cv>=-0.9391664624214172\n",
      "   +0.0238 if cv>=-0.16748674511909484\n",
      "   -1.5484 if cp<=-0.058242518454790115\n",
      "   +2.5821 if cp>=-0.04341575503349304\n",
      "   -1.2766 if cp>=-0.0906264215707779\n",
      "--------------\n",
      "   -1.0337 if cv>=-0.9391664624214172\n",
      "   -0.0238 if cv>=-0.16748674511909484\n",
      "   +1.5484 if cp<=-0.058242518454790115\n",
      "   -2.5821 if cp>=-0.04341575503349304\n",
      "   +1.2766 if cp>=-0.0906264215707779\n",
      "Run episode 86 with rewards 29.0\n",
      "============ 87 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +1.4986 if cv>=-0.9391664624214172\n",
      "   -5.8912 if cp<=-0.058242518454790115\n",
      "   +2.4404 if cp>=-0.04341575503349304\n",
      "   +1.6803 if cp>=-0.0906264215707779\n",
      "   -4.8568 if cp<=-0.018723207339644367 & cp>=-0.0510717861354351 & cv>=0.5481361508369446\n",
      "--------------\n",
      "   -1.4986 if cv>=-0.9391664624214172\n",
      "   +5.8912 if cp<=-0.058242518454790115\n",
      "   -2.4404 if cp>=-0.04341575503349304\n",
      "   -1.6803 if cp>=-0.0906264215707779\n",
      "   +4.8568 if cp<=-0.018723207339644367 & cp>=-0.0510717861354351 & cv>=0.5481361508369446\n",
      "Run episode 87 with rewards 10.0\n",
      "============ 88 ===========\n",
      "13 actions [1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0]\n",
      "   -0.0830 if cp<=-0.058242518454790115\n",
      "   +0.4099 if cp>=-0.04341575503349304\n",
      "   +0.3300 if cp>=-0.0906264215707779\n",
      "   -0.0000 if cp<=-0.018723207339644367 & cp>=-0.0510717861354351 & cv>=0.5481361508369446\n",
      "   +0.2293 if cp<=0.023197786882519725 & cp>=-0.04668726772069931\n",
      "--------------\n",
      "   +0.0830 if cp<=-0.058242518454790115\n",
      "   -0.4099 if cp>=-0.04341575503349304\n",
      "   -0.3300 if cp>=-0.0906264215707779\n",
      "   +0.0000 if cp<=-0.018723207339644367 & cp>=-0.0510717861354351 & cv>=0.5481361508369446\n",
      "   -0.2294 if cp<=0.023197786882519725 & cp>=-0.04668726772069931\n",
      "Run episode 88 with rewards 13.0\n",
      "============ 89 ===========\n",
      "12 actions [0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   +2.4013 if cp<=-0.058242518454790115\n",
      "   +0.2687 if cp>=-0.04341575503349304\n",
      "   -1.0837 if cp>=-0.0906264215707779\n",
      "   +0.2687 if cp<=0.023197786882519725 & cp>=-0.04668726772069931\n",
      "   +2.9793 if cp>=-0.0038203832693397967\n",
      "--------------\n",
      "   -2.4014 if cp<=-0.058242518454790115\n",
      "   -0.2687 if cp>=-0.04341575503349304\n",
      "   +1.0837 if cp>=-0.0906264215707779\n",
      "   -0.2687 if cp<=0.023197786882519725 & cp>=-0.04668726772069931\n",
      "   -2.9793 if cp>=-0.0038203832693397967\n",
      "Run episode 89 with rewards 12.0\n",
      "============ 90 ===========\n",
      "32 actions [0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cp<=-0.058242518454790115\n",
      "   -0.8402 if cp>=-0.0906264215707779\n",
      "   -1.5940 if cp<=0.023197786882519725 & cp>=-0.04668726772069931\n",
      "   +2.2032 if cp>=-0.0038203832693397967\n",
      "   +2.9817 if cp<=-0.03068971447646618 & cv<=0.0781933151185513\n",
      "--------------\n",
      "   +0.0000 if cp<=-0.058242518454790115\n",
      "   +1.1581 if cp>=-0.04341575503349304\n",
      "   +1.1581 if cp>=-0.0906264215707779\n",
      "   -2.7106 if cp>=-0.0038203832693397967\n",
      "   -2.8702 if cp<=-0.03068971447646618 & cv<=0.0781933151185513\n",
      "Run episode 90 with rewards 32.0\n",
      "============ 91 ===========\n",
      "9 actions [0, 0, 0, 0, 1, 0, 0, 0, 0]\n",
      "   -2.6161 if cp>=-0.0906264215707779\n",
      "   +0.4568 if cp<=0.023197786882519725 & cp>=-0.04668726772069931\n",
      "   +1.1905 if cp>=-0.0038203832693397967\n",
      "   +2.8309 if cp<=-0.03068971447646618 & cv<=0.0781933151185513\n",
      "   +5.5358 if cp>=-0.0027046778704971006 & cv>=-0.3636189520359039\n",
      "--------------\n",
      "   +1.7414 if cp>=-0.04341575503349304\n",
      "   +0.6797 if cp>=-0.0906264215707779\n",
      "   -1.2362 if cp>=-0.0038203832693397967\n",
      "   -2.6579 if cp<=-0.03068971447646618 & cv<=0.0781933151185513\n",
      "   -5.7855 if cp>=-0.0027046778704971006 & cv>=-0.3636189520359039\n",
      "Run episode 91 with rewards 9.0\n",
      "============ 92 ===========\n",
      "43 actions [1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.3469 if cp>=-0.0906264215707779\n",
      "   -0.0000 if cp>=-0.0038203832693397967\n",
      "   +0.7886 if cp<=-0.03068971447646618 & cv<=0.0781933151185513\n",
      "   -0.0000 if cp>=-0.0027046778704971006 & cv>=-0.3636189520359039\n",
      "   -4.0728 if cp>=-0.08244724720716476 & cv<=-0.7399085760116577\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.04341575503349304\n",
      "   +0.0000 if cp>=-0.0038203832693397967\n",
      "   -2.5314 if cp<=-0.03068971447646618 & cv<=0.0781933151185513\n",
      "   +0.0000 if cp>=-0.0027046778704971006 & cv>=-0.3636189520359039\n",
      "   +3.8000 if cp>=-0.08244724720716476 & cv<=-0.7399085760116577\n",
      "Run episode 92 with rewards 43.0\n",
      "============ 93 ===========\n",
      "13 actions [0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0]\n",
      "   -0.7493 if cp>=-0.0906264215707779\n",
      "   +1.4629 if cp<=-0.03068971447646618 & cv<=0.0781933151185513\n",
      "   +0.1831 if cp>=-0.0027046778704971006 & cv>=-0.3636189520359039\n",
      "   -2.6357 if cp>=-0.08244724720716476 & cv<=-0.7399085760116577\n",
      "   +5.5261 if pav<=-0.3392040193080902\n",
      "--------------\n",
      "   +1.0964 if cp>=-0.04341575503349304\n",
      "   -2.5400 if cp<=-0.03068971447646618 & cv<=0.0781933151185513\n",
      "   -0.1834 if cp>=-0.0027046778704971006 & cv>=-0.3636189520359039\n",
      "   +2.4211 if cp>=-0.08244724720716476 & cv<=-0.7399085760116577\n",
      "   -5.5261 if pav<=-0.3392040193080902\n",
      "Run episode 93 with rewards 13.0\n",
      "============ 94 ===========\n",
      "15 actions [0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0]\n",
      "   -0.8898 if cp>=-0.0906264215707779\n",
      "   +2.2333 if cp<=-0.03068971447646618 & cv<=0.0781933151185513\n",
      "   -2.8722 if cp>=-0.08244724720716476 & cv<=-0.7399085760116577\n",
      "   +0.0000 if pav<=-0.3392040193080902\n",
      "   +4.7119 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "--------------\n",
      "   +0.9503 if cp>=-0.04341575503349304\n",
      "   -2.9636 if cp<=-0.03068971447646618 & cv<=0.0781933151185513\n",
      "   +2.5821 if cp>=-0.08244724720716476 & cv<=-0.7399085760116577\n",
      "   -0.0000 if pav<=-0.3392040193080902\n",
      "   -4.4792 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "Run episode 94 with rewards 15.0\n",
      "============ 95 ===========\n",
      "34 actions [1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   -1.3998 if cp>=-0.0906264215707779\n",
      "   +2.2310 if cp<=-0.03068971447646618 & cv<=0.0781933151185513\n",
      "   -2.6979 if cp>=-0.08244724720716476 & cv<=-0.7399085760116577\n",
      "   +1.7423 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   +4.2825 if cp<=-0.024553969502449036 & cv>=-0.03751928657293319\n",
      "--------------\n",
      "   +1.2692 if cp>=-0.04341575503349304\n",
      "   -2.6493 if cp<=-0.03068971447646618 & cv<=0.0781933151185513\n",
      "   +2.6347 if cp>=-0.08244724720716476 & cv<=-0.7399085760116577\n",
      "   -1.4828 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   -4.1322 if cp<=-0.024553969502449036 & cv>=-0.03751928657293319\n",
      "Run episode 95 with rewards 34.0\n",
      "============ 96 ===========\n",
      "31 actions [1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 1, 0]\n",
      "   -0.0000 if cp<=-0.03068971447646618 & cv<=0.0781933151185513\n",
      "   -0.0000 if cp>=-0.08244724720716476 & cv<=-0.7399085760116577\n",
      "   +0.9575 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   -0.0000 if cp<=-0.024553969502449036 & cv>=-0.03751928657293319\n",
      "   -5.0930 if cp<=0.04491923749446869 & cv<=0.16893298625946046 & pa<=0.09081460982561111 & pav<=0.36510490179061916\n",
      "--------------\n",
      "   -0.0000 if cp<=-0.03068971447646618 & cv<=0.0781933151185513\n",
      "   -0.0000 if cp>=-0.08244724720716476 & cv<=-0.7399085760116577\n",
      "   -0.8294 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   -0.0000 if cp<=-0.024553969502449036 & cv>=-0.03751928657293319\n",
      "   +5.0935 if cp<=0.04491923749446869 & cv<=0.16893298625946046 & pa<=0.09081460982561111 & pav<=0.36510490179061916\n",
      "Run episode 96 with rewards 31.0\n",
      "============ 97 ===========\n",
      "30 actions [0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1]\n",
      "   +0.0000 if cp>=-0.08244724720716476 & cv<=-0.7399085760116577\n",
      "   +0.2450 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   -6.3723 if cp<=-0.024553969502449036 & cv>=-0.03751928657293319\n",
      "   -1.3225 if cp<=0.04491923749446869 & cv<=0.16893298625946046 & pa<=0.09081460982561111 & pav<=0.36510490179061916\n",
      "   +2.7342 if cv>=-0.0008797662449069321 & pa>=-0.06359162181615827\n",
      "--------------\n",
      "   +0.0004 if cp<=-0.03068971447646618 & cv<=0.0781933151185513\n",
      "   -0.1187 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   +6.3711 if cp<=-0.024553969502449036 & cv>=-0.03751928657293319\n",
      "   +1.3238 if cp<=0.04491923749446869 & cv<=0.16893298625946046 & pa<=0.09081460982561111 & pav<=0.36510490179061916\n",
      "   -2.7327 if cv>=-0.0008797662449069321 & pa>=-0.06359162181615827\n",
      "Run episode 97 with rewards 30.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 98 ===========\n",
      "15 actions [0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 1]\n",
      "   +0.9828 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   -0.0000 if cp<=-0.024553969502449036 & cv>=-0.03751928657293319\n",
      "   -2.4978 if cp<=0.04491923749446869 & cv<=0.16893298625946046 & pa<=0.09081460982561111 & pav<=0.36510490179061916\n",
      "   +1.4353 if cv>=-0.0008797662449069321 & pa>=-0.06359162181615827\n",
      "   +5.4158 if cv>=-0.19242751896381377 & pav>=-0.029707568138837806\n",
      "--------------\n",
      "   -0.8586 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   +0.0000 if cp<=-0.024553969502449036 & cv>=-0.03751928657293319\n",
      "   +2.5010 if cp<=0.04491923749446869 & cv<=0.16893298625946046 & pa<=0.09081460982561111 & pav<=0.36510490179061916\n",
      "   -1.4331 if cv>=-0.0008797662449069321 & pa>=-0.06359162181615827\n",
      "   -5.4155 if cv>=-0.19242751896381377 & pav>=-0.029707568138837806\n",
      "Run episode 98 with rewards 15.0\n",
      "============ 99 ===========\n",
      "13 actions [0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0]\n",
      "   +0.6458 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   +0.6458 if cp<=0.04491923749446869 & cv<=0.16893298625946046 & pa<=0.09081460982561111 & pav<=0.36510490179061916\n",
      "   +0.0582 if cv>=-0.0008797662449069321 & pa>=-0.06359162181615827\n",
      "   +0.6458 if cv>=-0.19242751896381377 & pav>=-0.029707568138837806\n",
      "   -0.5386 if cp>=-0.00976196555420756\n",
      "--------------\n",
      "   -0.6182 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   -0.6182 if cp<=0.04491923749446869 & cv<=0.16893298625946046 & pa<=0.09081460982561111 & pav<=0.36510490179061916\n",
      "   -0.0557 if cv>=-0.0008797662449069321 & pa>=-0.06359162181615827\n",
      "   -0.6182 if cv>=-0.19242751896381377 & pav>=-0.029707568138837806\n",
      "   +0.5393 if cp>=-0.00976196555420756\n",
      "Run episode 99 with rewards 13.0\n",
      "============ 100 ===========\n",
      "42 actions [1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1]\n",
      "   +0.9471 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   -3.6584 if cp<=0.04491923749446869 & cv<=0.16893298625946046 & pa<=0.09081460982561111 & pav<=0.36510490179061916\n",
      "   +0.9471 if cv>=-0.19242751896381377 & pav>=-0.029707568138837806\n",
      "   -0.5803 if cp>=-0.00976196555420756\n",
      "   +4.2533 if cp>=0.023481510952115068\n",
      "--------------\n",
      "   -0.9199 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   +3.6821 if cp<=0.04491923749446869 & cv<=0.16893298625946046 & pa<=0.09081460982561111 & pav<=0.36510490179061916\n",
      "   -0.9199 if cv>=-0.19242751896381377 & pav>=-0.029707568138837806\n",
      "   +0.5825 if cp>=-0.00976196555420756\n",
      "   -4.2511 if cp>=0.023481510952115068\n",
      "Run episode 100 with rewards 42.0\n",
      "============ 101 ===========\n",
      "23 actions [1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0]\n",
      "   +2.2189 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   -1.4912 if cp<=0.04491923749446869 & cv<=0.16893298625946046 & pa<=0.09081460982561111 & pav<=0.36510490179061916\n",
      "   -0.1045 if cv>=-0.19242751896381377 & pav>=-0.029707568138837806\n",
      "   +3.4959 if cp>=0.023481510952115068\n",
      "   -2.6336 if pav>=-0.778511106967926\n",
      "--------------\n",
      "   -2.1910 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   +1.5057 if cp<=0.04491923749446869 & cv<=0.16893298625946046 & pa<=0.09081460982561111 & pav<=0.36510490179061916\n",
      "   +0.1079 if cv>=-0.19242751896381377 & pav>=-0.029707568138837806\n",
      "   -3.4930 if cp>=0.023481510952115068\n",
      "   +2.6344 if pav>=-0.778511106967926\n",
      "Run episode 101 with rewards 23.0\n",
      "============ 102 ===========\n",
      "17 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1]\n",
      "   +2.2485 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   -0.0262 if cp<=0.04491923749446869 & cv<=0.16893298625946046 & pa<=0.09081460982561111 & pav<=0.36510490179061916\n",
      "   +1.3089 if cp>=0.023481510952115068\n",
      "   -1.7383 if pav>=-0.778511106967926\n",
      "   -3.8251 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "--------------\n",
      "   -2.2260 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   +0.0346 if cp<=0.04491923749446869 & cv<=0.16893298625946046 & pa<=0.09081460982561111 & pav<=0.36510490179061916\n",
      "   -1.3048 if cp>=0.023481510952115068\n",
      "   +1.7444 if pav>=-0.778511106967926\n",
      "   +3.8260 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "Run episode 102 with rewards 17.0\n",
      "============ 103 ===========\n",
      "52 actions [1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0]\n",
      "   +4.3244 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   +0.1990 if cp>=0.023481510952115068\n",
      "   -0.4353 if pav>=-0.778511106967926\n",
      "   -0.2046 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   -2.4660 if cv>=-0.18218555748462673\n",
      "--------------\n",
      "   -4.3086 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   -0.1896 if cp>=0.023481510952115068\n",
      "   +0.4442 if pav>=-0.778511106967926\n",
      "   +0.2062 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   +2.4680 if cv>=-0.18218555748462673\n",
      "Run episode 103 with rewards 52.0\n",
      "============ 104 ===========\n",
      "22 actions [1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1]\n",
      "   +2.5955 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   +0.4287 if pav>=-0.778511106967926\n",
      "   -1.0353 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   -2.3021 if cv>=-0.18218555748462673\n",
      "   +5.1636 if cp>=-0.07342007756233215 & cv<=-0.2898537695407864 & pav<=0.6640133261680604\n",
      "--------------\n",
      "   -2.5763 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   -0.4127 if pav>=-0.778511106967926\n",
      "   +1.0305 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   +2.3052 if cv>=-0.18218555748462673\n",
      "   -5.1638 if cp>=-0.07342007756233215 & cv<=-0.2898537695407864 & pav<=0.6640133261680604\n",
      "Run episode 104 with rewards 22.0\n",
      "============ 105 ===========\n",
      "14 actions [1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0]\n",
      "   -1.2863 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   -4.9032 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   -1.2863 if cv>=-0.18218555748462673\n",
      "   +0.5096 if cp>=-0.07342007756233215 & cv<=-0.2898537695407864 & pav<=0.6640133261680604\n",
      "   +5.0970 if \n",
      "--------------\n",
      "   +1.2977 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   +4.9005 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   +1.2977 if cv>=-0.18218555748462673\n",
      "   -0.5097 if cp>=-0.07342007756233215 & cv<=-0.2898537695407864 & pav<=0.6640133261680604\n",
      "   -5.0832 if \n",
      "Run episode 105 with rewards 14.0\n",
      "============ 106 ===========\n",
      "64 actions [0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1036 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   -2.1318 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   -1.1036 if cv>=-0.18218555748462673\n",
      "   +0.3271 if \n",
      "   +3.3299 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "--------------\n",
      "   +1.1139 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   +2.1323 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   +1.1139 if cv>=-0.18218555748462673\n",
      "   -0.3180 if \n",
      "   -3.3266 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "Run episode 106 with rewards 64.0\n",
      "============ 107 ===========\n",
      "11 actions [1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1]\n",
      "   +1.2331 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   -3.6277 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   -3.9781 if cv>=-0.18218555748462673\n",
      "   +3.2124 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -5.0430 if cp>=0.010805560834705831 & pa>=-0.024321251735091195\n",
      "--------------\n",
      "   -1.2243 if cp>=-0.02508831098675727 & cv>=-0.18150896430015565\n",
      "   +3.6343 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   +3.9959 if cv>=-0.18218555748462673\n",
      "   -3.2059 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +5.0431 if cp>=0.010805560834705831 & pa>=-0.024321251735091195\n",
      "Run episode 107 with rewards 11.0\n",
      "============ 108 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7671 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   -0.2239 if cv>=-0.18218555748462673\n",
      "   -0.2239 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.0000 if cp>=0.010805560834705831 & pa>=-0.024321251735091195\n",
      "   -1.0579 if cp>=0.031854745000600815\n",
      "--------------\n",
      "   +0.7703 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   +0.2399 if cv>=-0.18218555748462673\n",
      "   +0.2399 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.0000 if cp>=0.010805560834705831 & pa>=-0.024321251735091195\n",
      "   +1.0587 if cp>=0.031854745000600815\n",
      "Run episode 108 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 109 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7783 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   -2.3981 if cv>=-0.18218555748462673\n",
      "   -0.6913 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.0449 if cp>=0.031854745000600815\n",
      "   -1.0662 if cp<=-0.007952731102704991 & cp>=-0.0396684467792511\n",
      "--------------\n",
      "   +0.7814 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   +2.4102 if cv>=-0.18218555748462673\n",
      "   +0.6991 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.0455 if cp>=0.031854745000600815\n",
      "   +1.0687 if cp<=-0.007952731102704991 & cp>=-0.0396684467792511\n",
      "Run episode 109 with rewards 9.0\n",
      "============ 110 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.1815 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   -0.7908 if cv>=-0.18218555748462673\n",
      "   -0.7908 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.0000 if cp<=-0.007952731102704991 & cp>=-0.0396684467792511\n",
      "   -0.2579 if cp>=0.01844007670879364\n",
      "--------------\n",
      "   +0.1832 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   +0.7968 if cv>=-0.18218555748462673\n",
      "   +0.7968 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.0000 if cp<=-0.007952731102704991 & cp>=-0.0396684467792511\n",
      "   +0.2596 if cp>=0.01844007670879364\n",
      "Run episode 110 with rewards 10.0\n",
      "============ 111 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   -1.0448 if cv>=-0.18218555748462673\n",
      "   -1.0448 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -1.0448 if cp>=0.01844007670879364\n",
      "   -0.1338 if cp>=0.07674511969089509\n",
      "--------------\n",
      "   -0.0000 if cp<=0.02439744509756565 & cv<=0.2973863840103152\n",
      "   +1.0483 if cv>=-0.18218555748462673\n",
      "   +1.0483 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +1.0483 if cp>=0.01844007670879364\n",
      "   +0.1342 if cp>=0.07674511969089509\n",
      "Run episode 111 with rewards 10.0\n",
      "============ 112 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1940 if cv>=-0.18218555748462673\n",
      "   -1.1940 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.1089 if cp>=0.01844007670879364\n",
      "   -0.0134 if cp>=0.07674511969089509\n",
      "   -0.4685 if cp<=0.02623074650764466 & cp>=-0.015032512694597244\n",
      "--------------\n",
      "   +1.1965 if cv>=-0.18218555748462673\n",
      "   +1.1965 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.1094 if cp>=0.01844007670879364\n",
      "   +0.0135 if cp>=0.07674511969089509\n",
      "   +0.4692 if cp<=0.02623074650764466 & cp>=-0.015032512694597244\n",
      "Run episode 112 with rewards 10.0\n",
      "============ 113 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7741 if cv>=-0.18218555748462673\n",
      "   -0.7741 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.7741 if cp>=0.01844007670879364\n",
      "   -0.2307 if cp<=0.02623074650764466 & cp>=-0.015032512694597244\n",
      "   -0.3475 if cp<=0.03983869701623917\n",
      "--------------\n",
      "   +0.7754 if cv>=-0.18218555748462673\n",
      "   +0.7754 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.7754 if cp>=0.01844007670879364\n",
      "   +0.2310 if cp<=0.02623074650764466 & cp>=-0.015032512694597244\n",
      "   +0.3480 if cp<=0.03983869701623917\n",
      "Run episode 113 with rewards 10.0\n",
      "============ 114 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.0236 if cv>=-0.18218555748462673\n",
      "   -1.0236 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.2291 if cp>=0.01844007670879364\n",
      "   -0.8377 if cp<=0.03983869701623917\n",
      "   -0.1859 if cp>=0.03698556609451771\n",
      "--------------\n",
      "   +1.0245 if cv>=-0.18218555748462673\n",
      "   +1.0245 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.2294 if cp>=0.01844007670879364\n",
      "   +0.8384 if cp<=0.03983869701623917\n",
      "   +0.1861 if cp>=0.03698556609451771\n",
      "Run episode 114 with rewards 10.0\n",
      "============ 115 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8932 if cv>=-0.18218555748462673\n",
      "   -0.8932 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.8932 if cp>=0.01844007670879364\n",
      "   -0.0000 if cp<=0.03983869701623917\n",
      "   -0.1147 if cp>=0.0884269416332245\n",
      "--------------\n",
      "   +0.8938 if cv>=-0.18218555748462673\n",
      "   +0.8938 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.8938 if cp>=0.01844007670879364\n",
      "   +0.0000 if cp<=0.03983869701623917\n",
      "   +0.1148 if cp>=0.0884269416332245\n",
      "Run episode 115 with rewards 11.0\n",
      "============ 116 ===========\n",
      "14 actions [1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8797 if cv>=-0.18218555748462673\n",
      "   -0.8797 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.8797 if cp>=0.01844007670879364\n",
      "   -0.0759 if cp>=0.0884269416332245\n",
      "   -0.1351 if pa<=-0.033388491719961166\n",
      "--------------\n",
      "   +0.8801 if cv>=-0.18218555748462673\n",
      "   +0.8801 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.8801 if cp>=0.01844007670879364\n",
      "   +0.0759 if cp>=0.0884269416332245\n",
      "   +0.1352 if pa<=-0.033388491719961166\n",
      "Run episode 116 with rewards 14.0\n",
      "============ 117 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.6058 if cv>=-0.18218555748462673\n",
      "   -1.2976 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.1266 if cp>=0.01844007670879364\n",
      "   -0.3457 if pa<=-0.033388491719961166\n",
      "   +3.6683 if cp<=-0.03628011122345924 & cv>=0.3984464168548584\n",
      "--------------\n",
      "   +0.6062 if cv>=-0.18218555748462673\n",
      "   +1.2978 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.1266 if cp>=0.01844007670879364\n",
      "   +0.3458 if pa<=-0.033388491719961166\n",
      "   -3.6683 if cp<=-0.03628011122345924 & cv>=0.3984464168548584\n",
      "Run episode 117 with rewards 10.0\n",
      "============ 118 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2564 if cv>=-0.18218555748462673\n",
      "   -1.2564 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.1460 if pa<=-0.033388491719961166\n",
      "   +0.0000 if cp<=-0.03628011122345924 & cv>=0.3984464168548584\n",
      "   -0.5394 if cp<=0.09490340650081636 & cp>=0.005333039071410895\n",
      "--------------\n",
      "   +1.2566 if cv>=-0.18218555748462673\n",
      "   +1.2566 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.1461 if pa<=-0.033388491719961166\n",
      "   +0.0000 if cp<=-0.03628011122345924 & cv>=0.3984464168548584\n",
      "   +0.5395 if cp<=0.09490340650081636 & cp>=0.005333039071410895\n",
      "Run episode 118 with rewards 10.0\n",
      "============ 119 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.0506 if cv>=-0.18218555748462673\n",
      "   -1.0506 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.0985 if pa<=-0.033388491719961166\n",
      "   -0.0969 if cp<=0.09490340650081636 & cp>=0.005333039071410895\n",
      "   -0.4651 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "--------------\n",
      "   +1.0508 if cv>=-0.18218555748462673\n",
      "   +1.0508 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.0986 if pa<=-0.033388491719961166\n",
      "   +0.0969 if cp<=0.09490340650081636 & cp>=0.005333039071410895\n",
      "   +0.4652 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "Run episode 119 with rewards 10.0\n",
      "============ 120 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.9220 if cv>=-0.18218555748462673\n",
      "   -0.9220 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.2715 if pa<=-0.033388491719961166\n",
      "   -0.7030 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   -0.2190 if cp>=0.06933503821492196\n",
      "--------------\n",
      "   +0.9221 if cv>=-0.18218555748462673\n",
      "   +0.9221 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.2715 if pa<=-0.033388491719961166\n",
      "   +0.7031 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   +0.2190 if cp>=0.06933503821492196\n",
      "Run episode 120 with rewards 10.0\n",
      "============ 121 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.9491 if cv>=-0.18218555748462673\n",
      "   -0.9491 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.2060 if pa<=-0.033388491719961166\n",
      "   -0.7431 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   -0.2060 if cp>=0.05786761566996575\n",
      "--------------\n",
      "   +0.9492 if cv>=-0.18218555748462673\n",
      "   +0.9492 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.2060 if pa<=-0.033388491719961166\n",
      "   +0.7432 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   +0.2060 if cp>=0.05786761566996575\n",
      "Run episode 121 with rewards 9.0\n",
      "============ 122 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7058 if cv>=-0.18218555748462673\n",
      "   -0.7058 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.7058 if pa<=-0.033388491719961166\n",
      "   -0.4494 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   -0.0453 if cp>=0.10643080770969392\n",
      "--------------\n",
      "   +0.7058 if cv>=-0.18218555748462673\n",
      "   +0.7058 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.7058 if pa<=-0.033388491719961166\n",
      "   +0.4494 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   +0.0453 if cp>=0.10643080770969392\n",
      "Run episode 122 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 123 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.0409 if cv>=-0.18218555748462673\n",
      "   -1.0409 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.1653 if pa<=-0.033388491719961166\n",
      "   -0.9354 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   -0.2657 if cp>=0.007136023230850698\n",
      "--------------\n",
      "   +1.0410 if cv>=-0.18218555748462673\n",
      "   +1.0410 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.1653 if pa<=-0.033388491719961166\n",
      "   +0.9354 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   +0.2657 if cp>=0.007136023230850698\n",
      "Run episode 123 with rewards 9.0\n",
      "============ 124 ===========\n",
      "12 actions [0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.5875 if cv>=-0.18218555748462673\n",
      "   -0.5875 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.4354 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   -0.5875 if cp>=0.007136023230850698\n",
      "   -0.0028 if cp>=0.13167087733745575\n",
      "--------------\n",
      "   +0.5876 if cv>=-0.18218555748462673\n",
      "   +0.5876 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.4354 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   +0.5876 if cp>=0.007136023230850698\n",
      "   +0.0027 if cp>=0.13167087733745575\n",
      "Run episode 124 with rewards 12.0\n",
      "============ 125 ===========\n",
      "10 actions [0, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.5161 if cv>=-0.18218555748462673\n",
      "   -0.5446 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.5323 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   -0.4360 if cp>=0.007136023230850698\n",
      "   -3.2433 if cp<=0.02390245608985426 & cv>=0.03412083117291335\n",
      "--------------\n",
      "   -0.5160 if cv>=-0.18218555748462673\n",
      "   +0.5447 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +0.5323 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   +0.4360 if cp>=0.007136023230850698\n",
      "   +3.2433 if cp<=0.02390245608985426 & cv>=0.03412083117291335\n",
      "Run episode 125 with rewards 10.0\n",
      "============ 126 ===========\n",
      "34 actions [0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1]\n",
      "   +0.6102 if cv>=-0.18218555748462673\n",
      "   +1.2000 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -1.6896 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   -0.5409 if cp<=0.02390245608985426 & cv>=0.03412083117291335\n",
      "   -3.5477 if cp<=-0.021554994955658914\n",
      "--------------\n",
      "   -0.6102 if cv>=-0.18218555748462673\n",
      "   -1.1999 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +1.6896 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   +0.5409 if cp<=0.02390245608985426 & cv>=0.03412083117291335\n",
      "   +3.5477 if cp<=-0.021554994955658914\n",
      "Run episode 126 with rewards 34.0\n",
      "============ 127 ===========\n",
      "19 actions [0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0]\n",
      "   +2.2503 if cv>=-0.18218555748462673\n",
      "   +1.9589 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -5.0317 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   -0.0000 if cp<=-0.021554994955658914\n",
      "   +4.7298 if cv>=0.412167239189148 & pav>=-0.8529941916465759\n",
      "--------------\n",
      "   -2.2502 if cv>=-0.18218555748462673\n",
      "   -1.9589 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   +5.0318 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   -0.0000 if cp<=-0.021554994955658914\n",
      "   -4.7300 if cv>=0.412167239189148 & pav>=-0.8529941916465759\n",
      "Run episode 127 with rewards 19.0\n",
      "============ 128 ===========\n",
      "13 actions [0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0]\n",
      "   +1.1819 if cv>=-0.18218555748462673\n",
      "   -0.0000 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.0000 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   -0.0000 if cv>=0.412167239189148 & pav>=-0.8529941916465759\n",
      "   +3.4094 if cp>=-0.04647282361984253 & pav<=0.5802946805953979\n",
      "--------------\n",
      "   -1.1819 if cv>=-0.18218555748462673\n",
      "   -0.0000 if cp>=-0.023341166973114013 & cv>=-0.7640999913215637\n",
      "   -0.0000 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   -0.0000 if cv>=0.412167239189148 & pav>=-0.8529941916465759\n",
      "   -3.4094 if cp>=-0.04647282361984253 & pav<=0.5802946805953979\n",
      "Run episode 128 with rewards 13.0\n",
      "============ 129 ===========\n",
      "21 actions [0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0]\n",
      "   +0.0269 if cv>=-0.18218555748462673\n",
      "   +2.4887 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   +0.0000 if cv>=0.412167239189148 & pav>=-0.8529941916465759\n",
      "   +0.1859 if cp>=-0.04647282361984253 & pav<=0.5802946805953979\n",
      "   -3.0598 if cp>=-0.0630530148744583 & cv<=-0.6311264395713806\n",
      "--------------\n",
      "   -0.0269 if cv>=-0.18218555748462673\n",
      "   -2.4887 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   -0.0000 if cv>=0.412167239189148 & pav>=-0.8529941916465759\n",
      "   -0.1859 if cp>=-0.04647282361984253 & pav<=0.5802946805953979\n",
      "   +3.0598 if cp>=-0.0630530148744583 & cv<=-0.6311264395713806\n",
      "Run episode 129 with rewards 21.0\n",
      "============ 130 ===========\n",
      "10 actions [0, 0, 0, 0, 1, 0, 1, 0, 1, 1]\n",
      "   -0.0383 if cv>=-0.18218555748462673\n",
      "   +4.3577 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   +1.8106 if cp>=-0.04647282361984253 & pav<=0.5802946805953979\n",
      "   -3.0995 if cp>=-0.0630530148744583 & cv<=-0.6311264395713806\n",
      "   -4.0746 if cp>=-0.04672830179333687 & pa<=0.1297180950641632\n",
      "--------------\n",
      "   +0.0383 if cv>=-0.18218555748462673\n",
      "   -4.3577 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   -1.8106 if cp>=-0.04647282361984253 & pav<=0.5802946805953979\n",
      "   +3.0995 if cp>=-0.0630530148744583 & cv<=-0.6311264395713806\n",
      "   +4.0746 if cp>=-0.04672830179333687 & pa<=0.1297180950641632\n",
      "Run episode 130 with rewards 10.0\n",
      "============ 131 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 1, 0, 0, 0]\n",
      "   +0.5688 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   +0.1918 if cp>=-0.04647282361984253 & pav<=0.5802946805953979\n",
      "   -1.0910 if cp>=-0.0630530148744583 & cv<=-0.6311264395713806\n",
      "   +0.5639 if cp>=-0.04672830179333687 & pa<=0.1297180950641632\n",
      "   +2.3117 if cv>=-0.620622980594635\n",
      "--------------\n",
      "   -0.5688 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   -0.1918 if cp>=-0.04647282361984253 & pav<=0.5802946805953979\n",
      "   +1.0911 if cp>=-0.0630530148744583 & cv<=-0.6311264395713806\n",
      "   -0.5639 if cp>=-0.04672830179333687 & pa<=0.1297180950641632\n",
      "   -2.3117 if cv>=-0.620622980594635\n",
      "Run episode 131 with rewards 10.0\n",
      "============ 132 ===========\n",
      "11 actions [0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1]\n",
      "   -0.0000 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   -0.0000 if cp>=-0.0630530148744583 & cv<=-0.6311264395713806\n",
      "   +0.4171 if cp>=-0.04672830179333687 & pa<=0.1297180950641632\n",
      "   +1.4440 if cv>=-0.620622980594635\n",
      "   +2.4611 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "--------------\n",
      "   +0.0000 if cp<=0.06361113041639328 & cp>=-0.016911190748214722\n",
      "   +0.0000 if cp>=-0.0630530148744583 & cv<=-0.6311264395713806\n",
      "   -0.4171 if cp>=-0.04672830179333687 & pa<=0.1297180950641632\n",
      "   -1.4440 if cv>=-0.620622980594635\n",
      "   -2.4611 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "Run episode 132 with rewards 11.0\n",
      "============ 133 ===========\n",
      "17 actions [0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0]\n",
      "   -2.2660 if cp>=-0.0630530148744583 & cv<=-0.6311264395713806\n",
      "   -0.2377 if cp>=-0.04672830179333687 & pa<=0.1297180950641632\n",
      "   +2.3991 if cv>=-0.620622980594635\n",
      "   +0.8655 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   -1.4142 if cp<=-0.10491194576025009 & cp>=-0.10491194576025009\n",
      "--------------\n",
      "   +2.2660 if cp>=-0.0630530148744583 & cv<=-0.6311264395713806\n",
      "   +0.2377 if cp>=-0.04672830179333687 & pa<=0.1297180950641632\n",
      "   -2.3991 if cv>=-0.620622980594635\n",
      "   -0.8655 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   +1.4142 if cp<=-0.10491194576025009 & cp>=-0.10491194576025009\n",
      "Run episode 133 with rewards 17.0\n",
      "============ 134 ===========\n",
      "17 actions [0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0]\n",
      "   -1.2072 if cp>=-0.0630530148744583 & cv<=-0.6311264395713806\n",
      "   +2.1429 if cv>=-0.620622980594635\n",
      "   -0.1478 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   -0.0000 if cp<=-0.10491194576025009 & cp>=-0.10491194576025009\n",
      "   -2.9615 if cv<=-0.43466285467147825 & pav<=0.853936243057251\n",
      "--------------\n",
      "   +1.2072 if cp>=-0.0630530148744583 & cv<=-0.6311264395713806\n",
      "   -2.1429 if cv>=-0.620622980594635\n",
      "   +0.1478 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   -0.0000 if cp<=-0.10491194576025009 & cp>=-0.10491194576025009\n",
      "   +2.9615 if cv<=-0.43466285467147825 & pav<=0.853936243057251\n",
      "Run episode 134 with rewards 17.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 135 ===========\n",
      "25 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.0630530148744583 & cv<=-0.6311264395713806\n",
      "   +1.6954 if cv>=-0.620622980594635\n",
      "   +1.3483 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   -4.0111 if cv<=-0.43466285467147825 & pav<=0.853936243057251\n",
      "   -3.1618 if cp>=-0.010009538009762751 & cv<=-0.5924060344696045\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.0630530148744583 & cv<=-0.6311264395713806\n",
      "   -1.6955 if cv>=-0.620622980594635\n",
      "   -1.3483 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   +4.0111 if cv<=-0.43466285467147825 & pav<=0.853936243057251\n",
      "   +3.1618 if cp>=-0.010009538009762751 & cv<=-0.5924060344696045\n",
      "Run episode 135 with rewards 25.0\n",
      "============ 136 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.9683 if cv>=-0.620622980594635\n",
      "   -0.7930 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   -4.9641 if cv<=-0.43466285467147825 & pav<=0.853936243057251\n",
      "   +0.0000 if cp>=-0.010009538009762751 & cv<=-0.5924060344696045\n",
      "   +1.7733 if \n",
      "--------------\n",
      "   -0.9683 if cv>=-0.620622980594635\n",
      "   +0.7930 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   +4.9641 if cv<=-0.43466285467147825 & pav<=0.853936243057251\n",
      "   -0.0000 if cp>=-0.010009538009762751 & cv<=-0.5924060344696045\n",
      "   -1.7733 if \n",
      "Run episode 136 with rewards 9.0\n",
      "============ 137 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.5779 if cv>=-0.620622980594635\n",
      "   +0.3275 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   -0.0000 if cv<=-0.43466285467147825 & pav<=0.853936243057251\n",
      "   +1.7281 if \n",
      "   +0.0967 if cp<=-0.08466165810823441\n",
      "--------------\n",
      "   -0.5779 if cv>=-0.620622980594635\n",
      "   -0.3275 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   -0.0000 if cv<=-0.43466285467147825 & pav<=0.853936243057251\n",
      "   -1.7281 if \n",
      "   -0.0967 if cp<=-0.08466165810823441\n",
      "Run episode 137 with rewards 10.0\n",
      "============ 138 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7371 if cv>=-0.620622980594635\n",
      "   +0.0865 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   +1.8867 if \n",
      "   +0.0506 if cp<=-0.08466165810823441\n",
      "   +0.3333 if cp<=-0.044500275701284404\n",
      "--------------\n",
      "   -0.7371 if cv>=-0.620622980594635\n",
      "   -0.0865 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   -1.8867 if \n",
      "   -0.0506 if cp<=-0.08466165810823441\n",
      "   -0.3333 if cp<=-0.044500275701284404\n",
      "Run episode 138 with rewards 9.0\n",
      "============ 139 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7098 if cv>=-0.620622980594635\n",
      "   +0.1007 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   +1.5073 if \n",
      "   +0.3370 if cp<=-0.044500275701284404\n",
      "   +0.0558 if cp<=-0.07673204690217972\n",
      "--------------\n",
      "   -0.7098 if cv>=-0.620622980594635\n",
      "   -0.1007 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   -1.5073 if \n",
      "   -0.3370 if cp<=-0.044500275701284404\n",
      "   -0.0558 if cp<=-0.07673204690217972\n",
      "Run episode 139 with rewards 10.0\n",
      "============ 140 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8119 if cv>=-0.620622980594635\n",
      "   +0.3264 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   +1.4503 if \n",
      "   +0.8008 if cp<=-0.044500275701284404\n",
      "   +0.0452 if cp<=-0.13022855818271636\n",
      "--------------\n",
      "   -0.8119 if cv>=-0.620622980594635\n",
      "   -0.3264 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   -1.4503 if \n",
      "   -0.8008 if cp<=-0.044500275701284404\n",
      "   -0.0452 if cp<=-0.13022855818271636\n",
      "Run episode 140 with rewards 10.0\n",
      "============ 141 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7969 if cv>=-0.620622980594635\n",
      "   +0.0721 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   +1.7928 if \n",
      "   +0.3450 if cp<=-0.044500275701284404\n",
      "   +0.1750 if cp<=-0.0567673809826374\n",
      "--------------\n",
      "   -0.7969 if cv>=-0.620622980594635\n",
      "   -0.0722 if cp<=-0.06055886894464493 & cp>=-0.08711969256401061\n",
      "   -1.7928 if \n",
      "   -0.3450 if cp<=-0.044500275701284404\n",
      "   -0.1750 if cp<=-0.0567673809826374\n",
      "Run episode 141 with rewards 9.0\n",
      "============ 142 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8129 if cv>=-0.620622980594635\n",
      "   +1.2997 if \n",
      "   +0.4868 if cp<=-0.044500275701284404\n",
      "   +0.2136 if cp<=-0.0567673809826374\n",
      "   +0.2136 if cp<=-0.06354073360562325\n",
      "--------------\n",
      "   -0.8129 if cv>=-0.620622980594635\n",
      "   -1.2997 if \n",
      "   -0.4868 if cp<=-0.044500275701284404\n",
      "   -0.2136 if cp<=-0.0567673809826374\n",
      "   -0.2136 if cp<=-0.06354073360562325\n",
      "Run episode 142 with rewards 8.0\n",
      "============ 143 ===========\n",
      "13 actions [1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7578 if cv>=-0.620622980594635\n",
      "   +1.7517 if \n",
      "   +0.0038 if cp<=-0.044500275701284404\n",
      "   +0.0038 if cp<=-0.0567673809826374\n",
      "   +0.0038 if pa>=0.1773243546485901\n",
      "--------------\n",
      "   -0.7578 if cv>=-0.620622980594635\n",
      "   -1.7517 if \n",
      "   -0.0038 if cp<=-0.044500275701284404\n",
      "   -0.0038 if cp<=-0.0567673809826374\n",
      "   -0.0038 if pa>=0.1773243546485901\n",
      "Run episode 143 with rewards 13.0\n",
      "============ 144 ===========\n",
      "13 actions [1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1]\n",
      "   -2.6913 if cv>=-0.620622980594635\n",
      "   +0.8399 if \n",
      "   +0.9273 if cp<=-0.044500275701284404\n",
      "   -0.0176 if pa>=0.1773243546485901\n",
      "   +2.7945 if cp>=-0.00470041763037443\n",
      "--------------\n",
      "   +2.6913 if cv>=-0.620622980594635\n",
      "   -0.8399 if \n",
      "   -0.9273 if cp<=-0.044500275701284404\n",
      "   +0.0176 if pa>=0.1773243546485901\n",
      "   -2.7945 if cp>=-0.00470041763037443\n",
      "Run episode 144 with rewards 13.0\n",
      "============ 145 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 0, 1, 1, 1, 1]\n",
      "   -1.4165 if cv>=-0.620622980594635\n",
      "   -1.4165 if \n",
      "   -0.0000 if cp<=-0.044500275701284404\n",
      "   +0.0947 if cp>=-0.00470041763037443\n",
      "   +4.0658 if cp<=0.046702855080366146 & cp>=0.005593272112309944 & cv>=0.7525028109550478\n",
      "--------------\n",
      "   +1.4165 if cv>=-0.620622980594635\n",
      "   +1.4165 if \n",
      "   -0.0000 if cp<=-0.044500275701284404\n",
      "   -0.0947 if cp>=-0.00470041763037443\n",
      "   -4.0658 if cp<=0.046702855080366146 & cp>=0.005593272112309944 & cv>=0.7525028109550478\n",
      "Run episode 145 with rewards 10.0\n",
      "============ 146 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1022 if cv>=-0.620622980594635\n",
      "   -1.1022 if \n",
      "   -0.5770 if cp>=-0.00470041763037443\n",
      "   -0.4524 if cp<=0.046702855080366146 & cp>=0.005593272112309944 & cv>=0.7525028109550478\n",
      "   +3.1221 if cp<=0.033539891242980964 & cv>=0.8678554773330689\n",
      "--------------\n",
      "   +1.1022 if cv>=-0.620622980594635\n",
      "   +1.1022 if \n",
      "   +0.5770 if cp>=-0.00470041763037443\n",
      "   +0.4524 if cp<=0.046702855080366146 & cp>=0.005593272112309944 & cv>=0.7525028109550478\n",
      "   -3.1221 if cp<=0.033539891242980964 & cv>=0.8678554773330689\n",
      "Run episode 146 with rewards 9.0\n",
      "============ 147 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7621 if cv>=-0.620622980594635\n",
      "   -0.7621 if \n",
      "   -0.7621 if cp>=-0.00470041763037443\n",
      "   +0.0000 if cp<=0.033539891242980964 & cv>=0.8678554773330689\n",
      "   -0.1159 if cp>=0.07147436067461968\n",
      "--------------\n",
      "   +0.7621 if cv>=-0.620622980594635\n",
      "   +0.7621 if \n",
      "   +0.7621 if cp>=-0.00470041763037443\n",
      "   -0.0000 if cp<=0.033539891242980964 & cv>=0.8678554773330689\n",
      "   +0.1159 if cp>=0.07147436067461968\n",
      "Run episode 147 with rewards 9.0\n",
      "============ 148 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.3111 if cv>=-0.620622980594635\n",
      "   -1.3111 if \n",
      "   -0.1438 if cp>=-0.00470041763037443\n",
      "   +0.0005 if cp>=0.07147436067461968\n",
      "   -0.4875 if cp<=0.05135817453265191 & cp>=-0.01658541727811098\n",
      "--------------\n",
      "   +1.3111 if cv>=-0.620622980594635\n",
      "   +1.3111 if \n",
      "   +0.1438 if cp>=-0.00470041763037443\n",
      "   -0.0005 if cp>=0.07147436067461968\n",
      "   +0.4874 if cp<=0.05135817453265191 & cp>=-0.01658541727811098\n",
      "Run episode 148 with rewards 8.0\n",
      "============ 149 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -0.8896 if cv>=-0.620622980594635\n",
      "   -0.8896 if \n",
      "   -0.0591 if cp>=-0.00470041763037443\n",
      "   -0.1291 if cp<=0.05135817453265191 & cp>=-0.01658541727811098\n",
      "   -0.3777 if cp<=-0.034330998361110684\n",
      "--------------\n",
      "   +0.8896 if cv>=-0.620622980594635\n",
      "   +0.8896 if \n",
      "   +0.0591 if cp>=-0.00470041763037443\n",
      "   +0.1291 if cp<=0.05135817453265191 & cp>=-0.01658541727811098\n",
      "   +0.3777 if cp<=-0.034330998361110684\n",
      "Run episode 149 with rewards 10.0\n",
      "============ 150 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.4159 if cv>=-0.620622980594635\n",
      "   -1.4159 if \n",
      "   -0.2891 if cp<=0.05135817453265191 & cp>=-0.01658541727811098\n",
      "   +0.0000 if cp<=-0.034330998361110684\n",
      "   -0.4800 if cp>=-0.007336246361955999\n",
      "--------------\n",
      "   +1.4159 if cv>=-0.620622980594635\n",
      "   +1.4159 if \n",
      "   +0.2891 if cp<=0.05135817453265191 & cp>=-0.01658541727811098\n",
      "   +0.0000 if cp<=-0.034330998361110684\n",
      "   +0.4800 if cp>=-0.007336246361955999\n",
      "Run episode 150 with rewards 8.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 151 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 0, 1, 1]\n",
      "   -0.4784 if cv>=-0.620622980594635\n",
      "   -0.4784 if \n",
      "   -0.3849 if cp<=0.05135817453265191 & cp>=-0.01658541727811098\n",
      "   -0.4784 if cp>=-0.007336246361955999\n",
      "   -0.0008 if cp>=0.10462094098329544\n",
      "--------------\n",
      "   +0.4784 if cv>=-0.620622980594635\n",
      "   +0.4784 if \n",
      "   +0.3848 if cp<=0.05135817453265191 & cp>=-0.01658541727811098\n",
      "   +0.4784 if cp>=-0.007336246361955999\n",
      "   +0.0008 if cp>=0.10462094098329544\n",
      "Run episode 151 with rewards 10.0\n",
      "============ 152 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   -1.2280 if cv>=-0.620622980594635\n",
      "   -1.2280 if \n",
      "   -1.0531 if cp<=0.05135817453265191 & cp>=-0.01658541727811098\n",
      "   +1.5289 if cp>=-0.007336246361955999\n",
      "   +2.7390 if cp<=0.060874041914939885 & cv>=1.1974634170532228\n",
      "--------------\n",
      "   +1.2280 if cv>=-0.620622980594635\n",
      "   +1.2280 if \n",
      "   +1.0531 if cp<=0.05135817453265191 & cp>=-0.01658541727811098\n",
      "   -1.5289 if cp>=-0.007336246361955999\n",
      "   -2.7390 if cp<=0.060874041914939885 & cv>=1.1974634170532228\n",
      "Run episode 152 with rewards 9.0\n",
      "============ 153 ===========\n",
      "12 actions [1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1]\n",
      "   -0.7535 if cv>=-0.620622980594635\n",
      "   -0.7535 if \n",
      "   +0.7183 if cp>=-0.007336246361955999\n",
      "   +0.9685 if cp<=0.060874041914939885 & cv>=1.1974634170532228\n",
      "   -0.7172 if cp<=0.015288146398961552 & cp>=-0.04654557630419731\n",
      "--------------\n",
      "   +0.7535 if cv>=-0.620622980594635\n",
      "   +0.7535 if \n",
      "   -0.7183 if cp>=-0.007336246361955999\n",
      "   -0.9686 if cp<=0.060874041914939885 & cv>=1.1974634170532228\n",
      "   +0.7172 if cp<=0.015288146398961552 & cp>=-0.04654557630419731\n",
      "Run episode 153 with rewards 12.0\n",
      "============ 154 ===========\n",
      "12 actions [1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1]\n",
      "   -1.0917 if cv>=-0.620622980594635\n",
      "   -1.0917 if \n",
      "   +0.4317 if cp>=-0.007336246361955999\n",
      "   -0.0000 if cp<=0.060874041914939885 & cv>=1.1974634170532228\n",
      "   +4.3321 if cp<=0.09044438600540163 & cv>=0.9404092073440552\n",
      "--------------\n",
      "   +1.0917 if cv>=-0.620622980594635\n",
      "   +1.0917 if \n",
      "   -0.4317 if cp>=-0.007336246361955999\n",
      "   -0.0000 if cp<=0.060874041914939885 & cv>=1.1974634170532228\n",
      "   -4.3321 if cp<=0.09044438600540163 & cv>=0.9404092073440552\n",
      "Run episode 154 with rewards 12.0\n",
      "============ 155 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.9357 if cv>=-0.620622980594635\n",
      "   -0.9357 if \n",
      "   +0.0653 if cp>=-0.007336246361955999\n",
      "   +2.3490 if cp<=0.09044438600540163 & cv>=0.9404092073440552\n",
      "   -0.0961 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "--------------\n",
      "   +0.9357 if cv>=-0.620622980594635\n",
      "   +0.9357 if \n",
      "   -0.0653 if cp>=-0.007336246361955999\n",
      "   -2.3490 if cp<=0.09044438600540163 & cv>=0.9404092073440552\n",
      "   +0.0961 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "Run episode 155 with rewards 9.0\n",
      "============ 156 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1424 if cv>=-0.620622980594635\n",
      "   -1.1424 if \n",
      "   -0.3980 if cp<=0.09044438600540163 & cv>=0.9404092073440552\n",
      "   -0.9811 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.0486 if cp>=0.11194151490926743\n",
      "--------------\n",
      "   +1.1424 if cv>=-0.620622980594635\n",
      "   +1.1424 if \n",
      "   +0.3981 if cp<=0.09044438600540163 & cv>=0.9404092073440552\n",
      "   +0.9811 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.0486 if cp>=0.11194151490926743\n",
      "Run episode 156 with rewards 9.0\n",
      "============ 157 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.9917 if cv>=-0.620622980594635\n",
      "   -0.9917 if \n",
      "   -0.0742 if cp<=0.09044438600540163 & cv>=0.9404092073440552\n",
      "   -0.2057 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.2523 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "--------------\n",
      "   +0.9917 if cv>=-0.620622980594635\n",
      "   +0.9917 if \n",
      "   +0.0742 if cp<=0.09044438600540163 & cv>=0.9404092073440552\n",
      "   +0.2058 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.2523 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "Run episode 157 with rewards 9.0\n",
      "============ 158 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8269 if cv>=-0.620622980594635\n",
      "   -0.8269 if \n",
      "   -0.5834 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.5834 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   +0.0035 if cp>=0.06990355998277664\n",
      "--------------\n",
      "   +0.8269 if cv>=-0.620622980594635\n",
      "   +0.8269 if \n",
      "   +0.5834 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.5834 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   -0.0035 if cp>=0.06990355998277664\n",
      "Run episode 158 with rewards 10.0\n",
      "============ 159 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1349 if cv>=-0.620622980594635\n",
      "   -1.1349 if \n",
      "   -0.4913 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.2405 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   -0.0517 if cp>=0.097404183447361\n",
      "--------------\n",
      "   +1.1350 if cv>=-0.620622980594635\n",
      "   +1.1350 if \n",
      "   +0.4913 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.2405 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   +0.0517 if cp>=0.097404183447361\n",
      "Run episode 159 with rewards 10.0\n",
      "============ 160 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8704 if cv>=-0.620622980594635\n",
      "   -0.8704 if \n",
      "   -0.4077 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.5220 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   -0.0478 if cp>=0.0594980537891388\n",
      "--------------\n",
      "   +0.8704 if cv>=-0.620622980594635\n",
      "   +0.8704 if \n",
      "   +0.4077 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.5220 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   +0.0478 if cp>=0.0594980537891388\n",
      "Run episode 160 with rewards 9.0\n",
      "============ 161 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8630 if cv>=-0.620622980594635\n",
      "   -0.8630 if \n",
      "   -0.4562 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.5642 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   +0.0063 if cp>=0.0885891392827034\n",
      "--------------\n",
      "   +0.8630 if cv>=-0.620622980594635\n",
      "   +0.8630 if \n",
      "   +0.4562 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.5642 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   -0.0063 if cp>=0.0885891392827034\n",
      "Run episode 161 with rewards 10.0\n",
      "============ 162 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.9885 if cv>=-0.620622980594635\n",
      "   -0.9885 if \n",
      "   -0.4124 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.5243 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   -0.0603 if cp>=0.058328224718570715\n",
      "--------------\n",
      "   +0.9885 if cv>=-0.620622980594635\n",
      "   +0.9885 if \n",
      "   +0.4124 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.5243 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   +0.0603 if cp>=0.058328224718570715\n",
      "Run episode 162 with rewards 8.0\n",
      "============ 163 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1]\n",
      "   -0.6396 if cv>=-0.620622980594635\n",
      "   -0.6396 if \n",
      "   -0.5104 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.5104 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   +0.0016 if cp>=0.05082032456994057\n",
      "--------------\n",
      "   +0.6396 if cv>=-0.620622980594635\n",
      "   +0.6396 if \n",
      "   +0.5104 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.5104 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   -0.0016 if cp>=0.05082032456994057\n",
      "Run episode 163 with rewards 11.0\n",
      "============ 164 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 0, 1, 1, 1, 1]\n",
      "   -0.1888 if cv>=-0.620622980594635\n",
      "   -0.1888 if \n",
      "   -1.5188 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.8547 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   +2.9284 if cp<=0.04228303208947184 & cv>=0.946413576602936\n",
      "--------------\n",
      "   +0.1888 if cv>=-0.620622980594635\n",
      "   +0.1888 if \n",
      "   +1.5188 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.8547 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   -2.9284 if cp<=0.04228303208947184 & cv>=0.946413576602936\n",
      "Run episode 164 with rewards 10.0\n",
      "============ 165 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8761 if \n",
      "   -1.2492 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.4096 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   +0.0000 if cp<=0.04228303208947184 & cv>=0.946413576602936\n",
      "   +2.6590 if cp<=0.056911637634038933 & cv>=0.8428707599639893\n",
      "--------------\n",
      "   +0.8761 if \n",
      "   +1.2492 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.4096 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   -0.0000 if cp<=0.04228303208947184 & cv>=0.946413576602936\n",
      "   -2.6590 if cp<=0.056911637634038933 & cv>=0.8428707599639893\n",
      "Run episode 165 with rewards 10.0\n",
      "============ 166 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.5001 if \n",
      "   -0.5200 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.0000 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   +0.0000 if cp<=0.056911637634038933 & cv>=0.8428707599639893\n",
      "   -1.2813 if cp<=0.11156202852725983\n",
      "--------------\n",
      "   +1.5001 if \n",
      "   +0.5200 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.0000 if cp<=0.01749318018555642 & cp>=-0.04327699691057205\n",
      "   -0.0000 if cp<=0.056911637634038933 & cv>=0.8428707599639893\n",
      "   +1.2812 if cp<=0.11156202852725983\n",
      "Run episode 166 with rewards 8.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 167 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1]\n",
      "   -0.6328 if \n",
      "   -0.5087 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.1254 if cp<=0.056911637634038933 & cv>=0.8428707599639893\n",
      "   -0.6328 if cp<=0.11156202852725983\n",
      "   -0.2434 if cp>=-0.016420724242925643\n",
      "--------------\n",
      "   +0.6328 if \n",
      "   +0.5086 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.1254 if cp<=0.056911637634038933 & cv>=0.8428707599639893\n",
      "   +0.6328 if cp<=0.11156202852725983\n",
      "   +0.2434 if cp>=-0.016420724242925643\n",
      "Run episode 167 with rewards 11.0\n",
      "============ 168 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -0.6419 if \n",
      "   -1.4254 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.7129 if cp<=0.11156202852725983\n",
      "   +0.3019 if cp>=-0.016420724242925643\n",
      "   +3.3523 if cp<=0.08318053930997849 & cv>=1.3547604084014893\n",
      "--------------\n",
      "   +0.6419 if \n",
      "   +1.4254 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.7129 if cp<=0.11156202852725983\n",
      "   -0.3019 if cp>=-0.016420724242925643\n",
      "   -3.3522 if cp<=0.08318053930997849 & cv>=1.3547604084014893\n",
      "Run episode 168 with rewards 9.0\n",
      "============ 169 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2995 if \n",
      "   -0.5115 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -1.0102 if cp<=0.11156202852725983\n",
      "   -0.0000 if cp<=0.08318053930997849 & cv>=1.3547604084014893\n",
      "   -0.3904 if cp<=0.08748282045125962 & cp>=0.05492035821080209\n",
      "--------------\n",
      "   +1.2995 if \n",
      "   +0.5115 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +1.0102 if cp<=0.11156202852725983\n",
      "   +0.0000 if cp<=0.08318053930997849 & cv>=1.3547604084014893\n",
      "   +0.3904 if cp<=0.08748282045125962 & cp>=0.05492035821080209\n",
      "Run episode 169 with rewards 11.0\n",
      "============ 170 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.3620 if \n",
      "   -0.5277 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.8233 if cp<=0.11156202852725983\n",
      "   -0.1869 if cp<=0.08748282045125962 & cp>=0.05492035821080209\n",
      "   +0.0560 if cp>=0.20324723422527313\n",
      "--------------\n",
      "   +1.3620 if \n",
      "   +0.5277 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.8232 if cp<=0.11156202852725983\n",
      "   +0.1869 if cp<=0.08748282045125962 & cp>=0.05492035821080209\n",
      "   -0.0560 if cp>=0.20324723422527313\n",
      "Run episode 170 with rewards 8.0\n",
      "============ 171 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8119 if \n",
      "   -0.6115 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.8119 if cp<=0.11156202852725983\n",
      "   -0.0549 if cp<=0.08748282045125962 & cp>=0.05492035821080209\n",
      "   -0.0506 if cp>=0.06045079529285432\n",
      "--------------\n",
      "   +0.8119 if \n",
      "   +0.6115 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.8119 if cp<=0.11156202852725983\n",
      "   +0.0549 if cp<=0.08748282045125962 & cp>=0.05492035821080209\n",
      "   +0.0506 if cp>=0.06045079529285432\n",
      "Run episode 171 with rewards 9.0\n",
      "============ 172 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.0803 if \n",
      "   -0.6548 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -1.0803 if cp<=0.11156202852725983\n",
      "   -0.0573 if cp<=0.08748282045125962 & cp>=0.05492035821080209\n",
      "   -0.0489 if cp>=0.05895039215683938\n",
      "--------------\n",
      "   +1.0803 if \n",
      "   +0.6547 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +1.0803 if cp<=0.11156202852725983\n",
      "   +0.0573 if cp<=0.08748282045125962 & cp>=0.05492035821080209\n",
      "   +0.0489 if cp>=0.05895039215683938\n",
      "Run episode 172 with rewards 8.0\n",
      "============ 173 ===========\n",
      "13 actions [0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -0.7883 if \n",
      "   -0.5910 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.7883 if cp<=0.11156202852725983\n",
      "   -0.1277 if cp<=0.08748282045125962 & cp>=0.05492035821080209\n",
      "   +0.0050 if cp>=0.11146552860736847\n",
      "--------------\n",
      "   +0.7883 if \n",
      "   +0.5910 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.7883 if cp<=0.11156202852725983\n",
      "   +0.1277 if cp<=0.08748282045125962 & cp>=0.05492035821080209\n",
      "   -0.0050 if cp>=0.11146552860736847\n",
      "Run episode 173 with rewards 13.0\n",
      "============ 174 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1]\n",
      "   -1.6264 if \n",
      "   +1.2662 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.8413 if cp<=0.11156202852725983\n",
      "   -0.0400 if cp<=0.08748282045125962 & cp>=0.05492035821080209\n",
      "   +3.2742 if cp>=-0.04446401074528694 & cv<=0.03769075199961669\n",
      "--------------\n",
      "   +1.6265 if \n",
      "   -1.2663 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.8412 if cp<=0.11156202852725983\n",
      "   +0.0399 if cp<=0.08748282045125962 & cp>=0.05492035821080209\n",
      "   -3.2742 if cp>=-0.04446401074528694 & cv<=0.03769075199961669\n",
      "Run episode 174 with rewards 12.0\n",
      "============ 175 ===========\n",
      "37 actions [0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0]\n",
      "   -0.3637 if \n",
      "   +1.6425 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -0.3637 if cp<=0.11156202852725983\n",
      "   +1.6425 if cp>=-0.04446401074528694 & cv<=0.03769075199961669\n",
      "   -0.3917 if cp<=-0.12097439020872115\n",
      "--------------\n",
      "   +0.3637 if \n",
      "   -1.6425 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +0.3637 if cp<=0.11156202852725983\n",
      "   -1.6425 if cp>=-0.04446401074528694 & cv<=0.03769075199961669\n",
      "   +0.3917 if cp<=-0.12097439020872115\n",
      "Run episode 175 with rewards 37.0\n",
      "============ 176 ===========\n",
      "12 actions [0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1]\n",
      "   +0.7284 if \n",
      "   +0.0884 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   +5.0245 if cp>=-0.04446401074528694 & cv<=0.03769075199961669\n",
      "   -0.5205 if cp<=-0.12097439020872115\n",
      "   -3.8007 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "--------------\n",
      "   -0.7284 if \n",
      "   -0.0885 if cp>=-0.04355480149388313 & cv<=0.9589924693107605\n",
      "   -5.0246 if cp>=-0.04446401074528694 & cv<=0.03769075199961669\n",
      "   +0.5205 if cp<=-0.12097439020872115\n",
      "   +3.8007 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "Run episode 176 with rewards 12.0\n",
      "============ 177 ===========\n",
      "10 actions [0, 0, 0, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +1.7592 if \n",
      "   +0.0597 if cp>=-0.04446401074528694 & cv<=0.03769075199961669\n",
      "   -0.5802 if cp<=-0.12097439020872115\n",
      "   -1.0269 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   -1.5793 if cv<=-0.5777048826217651\n",
      "--------------\n",
      "   -1.7592 if \n",
      "   -0.0597 if cp>=-0.04446401074528694 & cv<=0.03769075199961669\n",
      "   +0.5802 if cp<=-0.12097439020872115\n",
      "   +1.0269 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   +1.5793 if cv<=-0.5777048826217651\n",
      "Run episode 177 with rewards 10.0\n",
      "============ 178 ===========\n",
      "18 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +1.7350 if \n",
      "   -0.0000 if cp<=-0.12097439020872115\n",
      "   -1.7721 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   -1.7721 if cv<=-0.5777048826217651\n",
      "   -0.5855 if cv<=-0.7597455620765686\n",
      "--------------\n",
      "   -1.7350 if \n",
      "   -0.0000 if cp<=-0.12097439020872115\n",
      "   +1.7721 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   +1.7721 if cv<=-0.5777048826217651\n",
      "   +0.5855 if cv<=-0.7597455620765686\n",
      "Run episode 178 with rewards 18.0\n",
      "============ 179 ===========\n",
      "11 actions [0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +1.0329 if \n",
      "   -2.2152 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   -2.2152 if cv<=-0.5777048826217651\n",
      "   -0.0000 if cv<=-0.7597455620765686\n",
      "   +1.8073 if cv>=-0.6302691459655761\n",
      "--------------\n",
      "   -1.0329 if \n",
      "   +2.2152 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   +2.2152 if cv<=-0.5777048826217651\n",
      "   +0.0000 if cv<=-0.7597455620765686\n",
      "   -1.8073 if cv>=-0.6302691459655761\n",
      "Run episode 179 with rewards 11.0\n",
      "============ 180 ===========\n",
      "10 actions [0, 0, 0, 0, 1, 0, 1, 0, 0, 1]\n",
      "   +0.3789 if \n",
      "   -0.7367 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   +0.1709 if cv<=-0.5777048826217651\n",
      "   +2.2544 if cv>=-0.6302691459655761\n",
      "   +0.6037 if cv>=-0.7769304513931274\n",
      "--------------\n",
      "   -0.3789 if \n",
      "   +0.7367 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   -0.1709 if cv<=-0.5777048826217651\n",
      "   -2.2544 if cv>=-0.6302691459655761\n",
      "   -0.6037 if cv>=-0.7769304513931274\n",
      "Run episode 180 with rewards 10.0\n",
      "============ 181 ===========\n",
      "19 actions [0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1]\n",
      "   +0.4666 if \n",
      "   -0.6192 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   +1.3291 if cv>=-0.6302691459655761\n",
      "   +1.3291 if cv>=-0.7769304513931274\n",
      "   -1.7445 if cp>=-0.04337635561823845\n",
      "--------------\n",
      "   -0.4666 if \n",
      "   +0.6192 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   -1.3291 if cv>=-0.6302691459655761\n",
      "   -1.3291 if cv>=-0.7769304513931274\n",
      "   +1.7445 if cp>=-0.04337635561823845\n",
      "Run episode 181 with rewards 19.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 182 ===========\n",
      "10 actions [0, 0, 1, 0, 0, 0, 1, 0, 1, 0]\n",
      "   +2.0579 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   +0.4620 if cv>=-0.6302691459655761\n",
      "   +0.4620 if cv>=-0.7769304513931274\n",
      "   -1.3149 if cp>=-0.04337635561823845\n",
      "   -2.3614 if cv<=-0.7444795727729797\n",
      "--------------\n",
      "   -2.0579 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   -0.4620 if cv>=-0.6302691459655761\n",
      "   -0.4620 if cv>=-0.7769304513931274\n",
      "   +1.3149 if cp>=-0.04337635561823845\n",
      "   +2.3614 if cv<=-0.7444795727729797\n",
      "Run episode 182 with rewards 10.0\n",
      "============ 183 ===========\n",
      "10 actions [0, 0, 0, 0, 1, 0, 1, 0, 1, 1]\n",
      "   -1.2905 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   +0.0756 if cv>=-0.7769304513931274\n",
      "   +0.0000 if cp>=-0.04337635561823845\n",
      "   -1.2905 if cv<=-0.7444795727729797\n",
      "   +2.2202 if cp>=-0.048891137540340426\n",
      "--------------\n",
      "   +1.2641 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   -2.0337 if cv>=-0.6302691459655761\n",
      "   -0.0000 if cp>=-0.04337635561823845\n",
      "   +1.2641 if cv<=-0.7444795727729797\n",
      "   +2.8297 if cp<=-0.048891137540340426 & cp>=-0.058871033042669295\n",
      "Run episode 183 with rewards 10.0\n",
      "============ 184 ===========\n",
      "15 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -1.4593 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   -0.1569 if cv>=-0.7769304513931274\n",
      "   +0.0000 if cv<=-0.7444795727729797\n",
      "   -0.1569 if cp>=-0.048891137540340426\n",
      "   +2.2655 if cv>=-0.5487538337707519\n",
      "--------------\n",
      "   +2.7598 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   -1.5557 if cv>=-0.6302691459655761\n",
      "   -0.0000 if cv<=-0.7444795727729797\n",
      "   -0.0000 if cp<=-0.048891137540340426 & cp>=-0.058871033042669295\n",
      "   +1.6021 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "Run episode 184 with rewards 15.0\n",
      "============ 185 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -2.0253 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   +0.1850 if cv>=-0.7769304513931274\n",
      "   +0.2189 if cp>=-0.048891137540340426\n",
      "   +2.2104 if cv>=-0.5487538337707519\n",
      "   +0.4961 if cv>=-0.6172951698303223\n",
      "--------------\n",
      "   +1.9330 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   -2.0720 if cv>=-0.6302691459655761\n",
      "   +0.1825 if cp<=-0.048891137540340426 & cp>=-0.058871033042669295\n",
      "   +1.9330 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "   +0.9517 if cv<=-0.5059112608432769 & pav>=0.8615671157836914\n",
      "Run episode 185 with rewards 12.0\n",
      "============ 186 ===========\n",
      "17 actions [0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -1.3491 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   +0.0780 if cp>=-0.048891137540340426\n",
      "   +1.2403 if cv>=-0.5487538337707519\n",
      "   +1.2403 if cv>=-0.6172951698303223\n",
      "   +0.2128 if cv>=-0.6258533596992493\n",
      "--------------\n",
      "   +1.1403 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   -1.1832 if cv>=-0.6302691459655761\n",
      "   +1.1403 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "   +1.1403 if cv<=-0.5059112608432769 & pav>=0.8615671157836914\n",
      "   +0.1662 if cp<=-0.002830615919083351\n",
      "Run episode 186 with rewards 17.0\n",
      "============ 187 ===========\n",
      "14 actions [0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1]\n",
      "   -1.0590 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   +0.9940 if cv>=-0.5487538337707519\n",
      "   +0.9940 if cv>=-0.6172951698303223\n",
      "   +0.9940 if cv>=-0.6258533596992493\n",
      "   -2.9269 if cp<=-0.09966623932123184 & pav<=0.9118899703025818\n",
      "--------------\n",
      "   +1.0041 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   -1.2432 if cv>=-0.6302691459655761\n",
      "   +1.0041 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "   +1.0041 if cv<=-0.5059112608432769 & pav>=0.8615671157836914\n",
      "   +3.2396 if cp<=-0.09966623932123184 & cv<=-0.4358456790447235\n",
      "Run episode 187 with rewards 14.0\n",
      "============ 188 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0]\n",
      "   +1.6759 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   +2.5150 if cv>=-0.6172951698303223\n",
      "   +0.4768 if cv>=-0.6258533596992493\n",
      "   +0.0000 if cp<=-0.09966623932123184 & pav<=0.9118899703025818\n",
      "   -3.0945 if cv<=-0.47721685171127304 & cv>=-0.6272403955459595\n",
      "--------------\n",
      "   -4.3768 if cv>=-0.6302691459655761\n",
      "   +0.3189 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "   +1.8063 if cv<=-0.5059112608432769 & pav>=0.8615671157836914\n",
      "   +0.0000 if cp<=-0.09966623932123184 & cv<=-0.4358456790447235\n",
      "   +3.6821 if cv>=-0.6272403955459595\n",
      "Run episode 188 with rewards 12.0\n",
      "============ 189 ===========\n",
      "18 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.0000 if cv<=-0.5853130280971527 & pa>=-0.027786554023623462\n",
      "   +1.1471 if cv>=-0.6172951698303223\n",
      "   +1.1471 if cv>=-0.6258533596992493\n",
      "   -3.8184 if cv<=-0.47721685171127304 & cv>=-0.6272403955459595\n",
      "   +0.4953 if cp>=0.00034209038130939267\n",
      "--------------\n",
      "   -0.5868 if cv>=-0.6302691459655761\n",
      "   +2.0376 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "   +2.0376 if cv<=-0.5059112608432769 & pav>=0.8615671157836914\n",
      "   -0.5868 if cv>=-0.6272403955459595\n",
      "   +0.0927 if cp>=-0.01975622735917568\n",
      "Run episode 189 with rewards 18.0\n",
      "============ 190 ===========\n",
      "14 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1]\n",
      "   +3.1128 if cv>=-0.6172951698303223\n",
      "   +0.9946 if cv>=-0.6258533596992493\n",
      "   -2.4837 if cv<=-0.47721685171127304 & cv>=-0.6272403955459595\n",
      "   -0.1201 if cp>=0.00034209038130939267\n",
      "   -1.1362 if cv<=-0.43050196170806887\n",
      "--------------\n",
      "   -0.5523 if cv>=-0.6302691459655761\n",
      "   +3.2380 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "   +1.2065 if cv<=-0.5059112608432769 & pav>=0.8615671157836914\n",
      "   -1.4946 if cv>=-0.6272403955459595\n",
      "   +0.3869 if cv<=-0.4357734501361847 & cv>=-0.6253568410873414\n",
      "Run episode 190 with rewards 14.0\n",
      "============ 191 ===========\n",
      "16 actions [0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +1.4494 if cv>=-0.6172951698303223\n",
      "   +1.4332 if cv>=-0.6258533596992493\n",
      "   +0.0430 if cv<=-0.47721685171127304 & cv>=-0.6272403955459595\n",
      "   -2.7895 if cv<=-0.43050196170806887\n",
      "   +2.9964 if cp<=-0.10556585788726806 & cp>=-0.13504776060581208 & cv<=-0.6082265019416809\n",
      "--------------\n",
      "   -1.3026 if cv>=-0.6302691459655761\n",
      "   +1.3528 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "   +1.8559 if cv<=-0.5059112608432769 & pav>=0.8615671157836914\n",
      "   -1.3026 if cv>=-0.6272403955459595\n",
      "   +2.5503 if cp>=-0.10556585788726806\n",
      "Run episode 191 with rewards 16.0\n",
      "============ 192 ===========\n",
      "18 actions [0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.3662 if cv>=-0.6172951698303223\n",
      "   +0.3457 if cv>=-0.6258533596992493\n",
      "   -3.4230 if cv<=-0.43050196170806887\n",
      "   -0.0000 if cp<=-0.10556585788726806 & cp>=-0.13504776060581208 & cv<=-0.6082265019416809\n",
      "   +2.5062 if cp<=0.014270531944930553\n",
      "--------------\n",
      "   +2.2536 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "   +2.2536 if cv<=-0.5059112608432769 & pav>=0.8615671157836914\n",
      "   +1.0317 if cv>=-0.6272403955459595\n",
      "   +1.0317 if cp>=-0.10556585788726806\n",
      "   -2.6502 if cp<=0.014270531944930553\n",
      "Run episode 192 with rewards 18.0\n",
      "============ 193 ===========\n",
      "12 actions [0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.8150 if cv>=-0.6172951698303223\n",
      "   +0.8147 if cv>=-0.6258533596992493\n",
      "   -2.8535 if cv<=-0.43050196170806887\n",
      "   +1.5920 if cp<=0.014270531944930553\n",
      "   +3.1491 if cp>=0.024660246446728706\n",
      "--------------\n",
      "   +2.1683 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "   +2.1683 if cv<=-0.5059112608432769 & pav>=0.8615671157836914\n",
      "   +1.0870 if cv>=-0.6272403955459595\n",
      "   -1.7947 if cp<=0.014270531944930553\n",
      "   -3.1054 if cp>=0.024660246446728706\n",
      "Run episode 193 with rewards 12.0\n",
      "============ 194 ===========\n",
      "20 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1]\n",
      "   +2.2693 if cv>=-0.6172951698303223\n",
      "   -1.2021 if cv<=-0.43050196170806887\n",
      "   -0.5269 if cp<=0.014270531944930553\n",
      "   +2.7962 if cp>=0.024660246446728706\n",
      "   +0.6139 if cp>=-0.009475043602287767\n",
      "--------------\n",
      "   +0.4216 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "   +0.5163 if cv<=-0.5059112608432769 & pav>=0.8615671157836914\n",
      "   +0.3088 if cp<=0.014270531944930553\n",
      "   -1.7544 if cp>=0.024660246446728706\n",
      "   +2.1260 if cv<=-0.6054225564002991\n",
      "Run episode 194 with rewards 20.0\n",
      "============ 195 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +3.2782 if cv>=-0.6172951698303223\n",
      "   -4.4019 if cv<=-0.43050196170806887\n",
      "   +0.3027 if cp>=0.024660246446728706\n",
      "   +0.9859 if cp>=-0.009475043602287767\n",
      "   +1.6459 if cp<=-0.06878231167793274 & cv<=-0.4303651094436646\n",
      "--------------\n",
      "   +1.2184 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "   +0.2648 if cv<=-0.5059112608432769 & pav>=0.8615671157836914\n",
      "   -0.3894 if cp>=0.024660246446728706\n",
      "   +1.2184 if cv<=-0.6054225564002991\n",
      "   +1.6116 if cp>=-0.09630699604749679 & cv<=-0.4303651094436646 & pav<=0.8401442050933838\n",
      "Run episode 195 with rewards 12.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 196 ===========\n",
      "14 actions [0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   +2.4482 if cv>=-0.6172951698303223\n",
      "   -3.7321 if cv<=-0.43050196170806887\n",
      "   +0.0000 if cp>=-0.009475043602287767\n",
      "   -0.1344 if cp<=-0.06878231167793274 & cv<=-0.4303651094436646\n",
      "   +1.6408 if cp>=-0.02181137911975383\n",
      "--------------\n",
      "   +2.3920 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "   -0.0000 if cp>=0.024660246446728706\n",
      "   +0.6356 if cv<=-0.6054225564002991\n",
      "   -0.0000 if cp>=-0.09630699604749679 & cv<=-0.4303651094436646 & pav<=0.8401442050933838\n",
      "   -1.3557 if cv>=-0.40778805017471315\n",
      "Run episode 196 with rewards 14.0\n",
      "============ 197 ===========\n",
      "13 actions [0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0]\n",
      "   +1.2632 if cv>=-0.6172951698303223\n",
      "   -1.6409 if cv<=-0.43050196170806887\n",
      "   -0.6697 if cp<=-0.06878231167793274 & cv<=-0.4303651094436646\n",
      "   +4.5970 if cp>=-0.02181137911975383\n",
      "   +0.0796 if cp>=-0.011399445123970505\n",
      "--------------\n",
      "   -0.4154 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "   +0.4428 if cv<=-0.6054225564002991\n",
      "   +0.0000 if cp>=-0.09630699604749679 & cv<=-0.4303651094436646 & pav<=0.8401442050933838\n",
      "   -1.4844 if cv>=-0.40778805017471315\n",
      "   +2.0378 if cp<=-0.044606526941061014 & cv<=-0.5566751539707183\n",
      "Run episode 197 with rewards 13.0\n",
      "============ 198 ===========\n",
      "14 actions [0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1]\n",
      "   +2.1634 if cv>=-0.6172951698303223\n",
      "   -3.8141 if cv<=-0.43050196170806887\n",
      "   -0.0116 if cp<=-0.06878231167793274 & cv<=-0.4303651094436646\n",
      "   +3.0303 if cp>=-0.02181137911975383\n",
      "   -2.3833 if cv>=-0.41838520765304565\n",
      "--------------\n",
      "   -1.8639 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "   +4.2282 if cv<=-0.6054225564002991\n",
      "   -1.3162 if cv>=-0.40778805017471315\n",
      "   +0.4497 if cp<=-0.044606526941061014 & cv<=-0.5566751539707183\n",
      "   +3.0274 if cp<=-0.02211420945823191 & cv<=-0.2987691164016721 & cv>=-0.41838520765304565\n",
      "Run episode 198 with rewards 14.0\n",
      "============ 199 ===========\n",
      "11 actions [0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0]\n",
      "   +1.1514 if cv>=-0.6172951698303223\n",
      "   -1.0340 if cv<=-0.43050196170806887\n",
      "   -0.0000 if cp>=-0.02181137911975383\n",
      "   -1.4095 if cv>=-0.41838520765304565\n",
      "   +2.9393 if cv>=-0.2699694454669951 & pav<=0.621361255645752\n",
      "--------------\n",
      "   +0.1909 if cv<=-0.5487538337707519 & cv>=-0.7383198142051697\n",
      "   +0.1909 if cv<=-0.6054225564002991\n",
      "   -3.6507 if cv>=-0.40778805017471315\n",
      "   +3.1064 if cp<=-0.02211420945823191 & cv<=-0.2987691164016721 & cv>=-0.41838520765304565\n",
      "   +2.2916 if cv<=-0.4239108204841614\n",
      "Run episode 199 with rewards 11.0\n",
      "============ 200 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1]\n",
      "   +0.8305 if cv>=-0.6172951698303223\n",
      "   -0.7507 if cv<=-0.43050196170806887\n",
      "   +1.3094 if cv>=-0.41838520765304565\n",
      "   +0.1645 if cv>=-0.2699694454669951 & pav<=0.621361255645752\n",
      "   +3.2455 if cv<=-0.5965708494186401 & cv>=-0.5965708494186401\n",
      "--------------\n",
      "   +0.2206 if cv<=-0.6054225564002991\n",
      "   -3.1619 if cv>=-0.40778805017471315\n",
      "   -0.5022 if cp<=-0.02211420945823191 & cv<=-0.2987691164016721 & cv>=-0.41838520765304565\n",
      "   +2.1950 if cv<=-0.4239108204841614\n",
      "   -3.0213 if cv<=-0.5965708494186401 & cv>=-0.5965708494186401\n",
      "Run episode 200 with rewards 12.0\n",
      "============ 201 ===========\n",
      "10 actions [0, 0, 0, 1, 0, 0, 0, 0, 0, 1]\n",
      "   +1.8621 if cv>=-0.6172951698303223\n",
      "   -0.0667 if cv<=-0.43050196170806887\n",
      "   +1.6319 if cv>=-0.41838520765304565\n",
      "   -0.0000 if cv<=-0.5965708494186401 & cv>=-0.5965708494186401\n",
      "   -2.2790 if cp>=-0.07216166555881501\n",
      "--------------\n",
      "   -1.9631 if cv>=-0.40778805017471315\n",
      "   -0.5140 if cp<=-0.02211420945823191 & cv<=-0.2987691164016721 & cv>=-0.41838520765304565\n",
      "   +2.5192 if cv<=-0.4239108204841614\n",
      "   -0.0000 if cv<=-0.5965708494186401 & cv>=-0.5965708494186401\n",
      "   -2.3639 if cp<=-0.07216166555881501\n",
      "Run episode 201 with rewards 10.0\n",
      "============ 202 ===========\n",
      "13 actions [0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0]\n",
      "   +0.5510 if cv>=-0.6172951698303223\n",
      "   +1.6307 if cv<=-0.43050196170806887\n",
      "   +2.9009 if cv>=-0.41838520765304565\n",
      "   -1.0723 if cp>=-0.07216166555881501\n",
      "   +0.7944 if cp<=-0.10996792316436768\n",
      "--------------\n",
      "   -2.0716 if cv>=-0.40778805017471315\n",
      "   -1.7029 if cp<=-0.02211420945823191 & cv<=-0.2987691164016721 & cv>=-0.41838520765304565\n",
      "   +0.9335 if cv<=-0.4239108204841614\n",
      "   -3.0169 if cp<=-0.07216166555881501\n",
      "   -0.6369 if cp<=-0.06455549299716949 & cp>=-0.08255888521671295\n",
      "Run episode 202 with rewards 13.0\n",
      "============ 203 ===========\n",
      "18 actions [0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1]\n",
      "   -0.5051 if cv<=-0.43050196170806887\n",
      "   +2.5429 if cv>=-0.41838520765304565\n",
      "   -0.8058 if cp>=-0.07216166555881501\n",
      "   -0.0347 if cp<=-0.10996792316436768\n",
      "   +1.7537 if cp<=-0.035466827079653734 & cp>=-0.05758484452962875 & cv<=-0.5185663998126981\n",
      "--------------\n",
      "   -1.9025 if cv>=-0.40778805017471315\n",
      "   -0.4256 if cp<=-0.02211420945823191 & cv<=-0.2987691164016721 & cv>=-0.41838520765304565\n",
      "   +2.6795 if cv<=-0.4239108204841614\n",
      "   -2.7202 if cp<=-0.07216166555881501\n",
      "   -1.1429 if cp<=-0.035466827079653734 & cp>=-0.05758484452962875 & cv<=-0.5185663998126981\n",
      "Run episode 203 with rewards 18.0\n",
      "============ 204 ===========\n",
      "12 actions [0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0]\n",
      "   +0.0887 if cv<=-0.43050196170806887\n",
      "   +3.0841 if cv>=-0.41838520765304565\n",
      "   +1.4555 if cp>=-0.07216166555881501\n",
      "   -0.0000 if cp<=-0.035466827079653734 & cp>=-0.05758484452962875 & cv<=-0.5185663998126981\n",
      "   -2.0217 if cv>=-0.44013012051582334\n",
      "--------------\n",
      "   -2.7807 if cv>=-0.40778805017471315\n",
      "   +1.8687 if cv<=-0.4239108204841614\n",
      "   -2.1462 if cp<=-0.07216166555881501\n",
      "   -0.0000 if cp<=-0.035466827079653734 & cp>=-0.05758484452962875 & cv<=-0.5185663998126981\n",
      "   -3.1723 if cp>=-0.03788341060280799 & cv<=-0.44013012051582334 & cv>=-0.4482870399951935\n",
      "Run episode 204 with rewards 12.0\n",
      "============ 205 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -1.5623 if cv<=-0.43050196170806887\n",
      "   +0.1072 if cv>=-0.41838520765304565\n",
      "   +3.8342 if cp>=-0.07216166555881501\n",
      "   +0.1072 if cv>=-0.44013012051582334\n",
      "   +1.6311 if cp<=-0.005845760798547394\n",
      "--------------\n",
      "   -1.5958 if cv>=-0.40778805017471315\n",
      "   +1.1339 if cv<=-0.4239108204841614\n",
      "   +2.1818 if cp<=-0.07216166555881501\n",
      "   +0.0000 if cp>=-0.03788341060280799 & cv<=-0.44013012051582334 & cv>=-0.4482870399951935\n",
      "   -2.1423 if cp<=-0.005845760798547394\n",
      "Run episode 205 with rewards 10.0\n",
      "============ 206 ===========\n",
      "14 actions [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0]\n",
      "   +1.4932 if cv<=-0.43050196170806887\n",
      "   +2.5608 if cp>=-0.07216166555881501\n",
      "   +0.3757 if cv>=-0.44013012051582334\n",
      "   -0.5039 if cp<=-0.005845760798547394\n",
      "   +0.8380 if cp>=0.026156372204422955\n",
      "--------------\n",
      "   -0.4254 if cv>=-0.40778805017471315\n",
      "   -1.0099 if cv<=-0.4239108204841614\n",
      "   +0.6231 if cp<=-0.07216166555881501\n",
      "   +0.4221 if cp<=-0.005845760798547394\n",
      "   -0.7715 if cp>=0.026156372204422955\n",
      "Run episode 206 with rewards 14.0\n",
      "============ 207 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   -0.2866 if cv<=-0.43050196170806887\n",
      "   -0.4183 if cp>=-0.07216166555881501\n",
      "   -0.6898 if cp<=-0.005845760798547394\n",
      "   +0.0000 if cp>=0.026156372204422955\n",
      "   +4.0716 if cv>=-0.5359808921813964\n",
      "--------------\n",
      "   -1.4453 if cv>=-0.40778805017471315\n",
      "   +0.7978 if cv<=-0.4239108204841614\n",
      "   +0.8132 if cp<=-0.07216166555881501\n",
      "   -0.0000 if cp>=0.026156372204422955\n",
      "   +4.9960 if cp>=-0.06117412894964218 & cv<=-0.5359808921813964\n",
      "Run episode 207 with rewards 12.0\n",
      "============ 208 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.2561 if cv<=-0.43050196170806887\n",
      "   +0.4851 if cp>=-0.07216166555881501\n",
      "   -0.7982 if cp<=-0.005845760798547394\n",
      "   +0.8097 if cv>=-0.5359808921813964\n",
      "   +2.9719 if cv>=-0.4475941717624664\n",
      "--------------\n",
      "   -0.8117 if cv>=-0.40778805017471315\n",
      "   -0.1722 if cv<=-0.4239108204841614\n",
      "   -0.0213 if cp<=-0.07216166555881501\n",
      "   +0.7298 if cp>=-0.06117412894964218 & cv<=-0.5359808921813964\n",
      "   +2.8932 if cv<=-0.4475941717624664\n",
      "Run episode 208 with rewards 12.0\n",
      "============ 209 ===========\n",
      "13 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -0.2198 if cp>=-0.07216166555881501\n",
      "   -0.0916 if cp<=-0.005845760798547394\n",
      "   +1.7997 if cv>=-0.5359808921813964\n",
      "   +1.7997 if cv>=-0.4475941717624664\n",
      "   +0.2798 if cv>=-0.5593703985214233\n",
      "--------------\n",
      "   -1.0082 if cv>=-0.40778805017471315\n",
      "   +1.4556 if cv<=-0.4239108204841614\n",
      "   +1.4556 if cp>=-0.06117412894964218 & cv<=-0.5359808921813964\n",
      "   +1.4556 if cv<=-0.4475941717624664\n",
      "   +0.0604 if cp<=-0.016071575134992598\n",
      "Run episode 209 with rewards 13.0\n",
      "============ 210 ===========\n",
      "11 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -0.0229 if cp>=-0.07216166555881501\n",
      "   +1.2208 if cv>=-0.5359808921813964\n",
      "   +1.2208 if cv>=-0.4475941717624664\n",
      "   +1.2208 if cv>=-0.5593703985214233\n",
      "   +0.5644 if pav<=0.9073766469955444\n",
      "--------------\n",
      "   -1.2143 if cv>=-0.40778805017471315\n",
      "   +1.3561 if cv<=-0.4239108204841614\n",
      "   +1.1818 if cp>=-0.06117412894964218 & cv<=-0.5359808921813964\n",
      "   +1.3561 if cv<=-0.4475941717624664\n",
      "   +0.2910 if cp<=-0.040034329891204826 & cv<=-0.6025578260421753\n",
      "Run episode 210 with rewards 11.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 211 ===========\n",
      "15 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.9257 if cv>=-0.5359808921813964\n",
      "   +0.9257 if cv>=-0.4475941717624664\n",
      "   +0.9257 if cv>=-0.5593703985214233\n",
      "   +0.9257 if pav<=0.9073766469955444\n",
      "   +0.2059 if cp<=-0.05011123791337012 & cv>=-0.39514073729515076\n",
      "--------------\n",
      "   -0.8485 if cv>=-0.40778805017471315\n",
      "   +1.4996 if cv<=-0.4239108204841614\n",
      "   +0.8340 if cp>=-0.06117412894964218 & cv<=-0.5359808921813964\n",
      "   +1.4996 if cv<=-0.4475941717624664\n",
      "   +0.1633 if pav>=1.1423214673995972\n",
      "Run episode 211 with rewards 15.0\n",
      "============ 212 ===========\n",
      "14 actions [0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +1.4198 if cv>=-0.5359808921813964\n",
      "   +1.4198 if cv>=-0.4475941717624664\n",
      "   +1.4198 if cv>=-0.5593703985214233\n",
      "   +0.5118 if pav<=0.9073766469955444\n",
      "   -0.9510 if cp<=-0.03020063713192939\n",
      "--------------\n",
      "   -1.4149 if cv>=-0.40778805017471315\n",
      "   +1.8936 if cv<=-0.4239108204841614\n",
      "   +1.1513 if cp>=-0.06117412894964218 & cv<=-0.5359808921813964\n",
      "   +1.8936 if cv<=-0.4475941717624664\n",
      "   +0.5019 if cp<=-0.05824594944715497 & cv<=-0.39432398676872255\n",
      "Run episode 212 with rewards 14.0\n",
      "============ 213 ===========\n",
      "18 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.4363 if cv>=-0.5359808921813964\n",
      "   +0.4363 if cv>=-0.4475941717624664\n",
      "   +3.3289 if cv>=-0.5593703985214233\n",
      "   +2.8592 if cp<=-0.03020063713192939\n",
      "   -4.3855 if cv<=-0.5405802607536316\n",
      "--------------\n",
      "   -0.0379 if cv>=-0.40778805017471315\n",
      "   +1.7927 if cv<=-0.4239108204841614\n",
      "   -0.5305 if cp>=-0.06117412894964218 & cv<=-0.5359808921813964\n",
      "   +1.7927 if cv<=-0.4475941717624664\n",
      "   -4.0371 if cv>=-0.5405802607536316\n",
      "Run episode 213 with rewards 18.0\n",
      "============ 214 ===========\n",
      "15 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0]\n",
      "   +1.4699 if cv>=-0.4475941717624664\n",
      "   +1.4699 if cv>=-0.5593703985214233\n",
      "   -0.2383 if cp<=-0.03020063713192939\n",
      "   -1.3679 if cv<=-0.5405802607536316\n",
      "   +0.0497 if cp>=-0.07534757554531096\n",
      "--------------\n",
      "   +0.9656 if cv<=-0.4239108204841614\n",
      "   +0.5664 if cp>=-0.06117412894964218 & cv<=-0.5359808921813964\n",
      "   +1.7048 if cv<=-0.4475941717624664\n",
      "   -1.2045 if cv>=-0.5405802607536316\n",
      "   +0.5245 if cp<=-0.039611346274614316 & cv>=-0.6314427137374878\n",
      "Run episode 214 with rewards 15.0\n",
      "============ 215 ===========\n",
      "31 actions [0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1]\n",
      "   +1.5584 if cv>=-0.4475941717624664\n",
      "   -1.2144 if cv>=-0.5593703985214233\n",
      "   -0.9159 if cp<=-0.03020063713192939\n",
      "   -0.3486 if cv<=-0.5405802607536316\n",
      "   +2.8686 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "--------------\n",
      "   +2.1362 if cv<=-0.4239108204841614\n",
      "   +2.1362 if cp>=-0.06117412894964218 & cv<=-0.5359808921813964\n",
      "   +2.1362 if cv<=-0.4475941717624664\n",
      "   +1.4576 if cv>=-0.5405802607536316\n",
      "   -2.3556 if cp>=-0.04842094630002975\n",
      "Run episode 215 with rewards 31.0\n",
      "============ 216 ===========\n",
      "23 actions [0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.4436 if cv>=-0.4475941717624664\n",
      "   +0.1531 if cv>=-0.5593703985214233\n",
      "   -1.0782 if cp<=-0.03020063713192939\n",
      "   +3.7254 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "   +6.4105 if cp>=0.011996845714747906 & cv<=-0.4327103793621063\n",
      "--------------\n",
      "   +3.1696 if cv<=-0.4239108204841614\n",
      "   -2.6285 if cp>=-0.06117412894964218 & cv<=-0.5359808921813964\n",
      "   -1.1046 if cv<=-0.4475941717624664\n",
      "   -1.9014 if cp>=-0.04842094630002975\n",
      "   +5.3435 if cp<=0.011996845714747906 & cv<=-0.2655753493309021 & cv<=-0.4327103793621063 & pa<=0.0977092832326889\n",
      "Run episode 216 with rewards 23.0\n",
      "============ 217 ===========\n",
      "36 actions [0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +0.9037 if cv>=-0.4475941717624664\n",
      "   -3.3532 if cp<=-0.03020063713192939\n",
      "   +4.1134 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "   +3.8218 if cp>=0.011996845714747906 & cv<=-0.4327103793621063\n",
      "   -0.7464 if \n",
      "--------------\n",
      "   +3.4210 if cv<=-0.4239108204841614\n",
      "   +0.3338 if cp>=-0.06117412894964218 & cv<=-0.5359808921813964\n",
      "   -0.4636 if cp>=-0.04842094630002975\n",
      "   +1.8632 if cp<=0.011996845714747906 & cv<=-0.2655753493309021 & cv<=-0.4327103793621063 & pa<=0.0977092832326889\n",
      "   +3.3130 if cp<=-0.04900763109326362\n",
      "Run episode 217 with rewards 36.0\n",
      "============ 218 ===========\n",
      "27 actions [0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   +2.2448 if cv>=-0.4475941717624664\n",
      "   -5.8882 if cp<=-0.03020063713192939\n",
      "   +6.8973 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "   -0.0000 if cp>=0.011996845714747906 & cv<=-0.4327103793621063\n",
      "   -4.5197 if pa>=0.19850285351276398\n",
      "--------------\n",
      "   +1.1103 if cv<=-0.4239108204841614\n",
      "   -0.9537 if cp>=-0.04842094630002975\n",
      "   +0.6635 if cp<=0.011996845714747906 & cv<=-0.2655753493309021 & cv<=-0.4327103793621063 & pa<=0.0977092832326889\n",
      "   +2.2005 if cp<=-0.04900763109326362\n",
      "   -3.1679 if cp<=-0.0235468540340662 & cp>=-0.04435991868376732 & cv>=-0.358180969953537 & pa<=0.0681978389620781 & pa<=0.17756260931491852\n",
      "Run episode 218 with rewards 27.0\n",
      "============ 219 ===========\n",
      "31 actions [0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +2.4675 if cv>=-0.4475941717624664\n",
      "   -5.2174 if cp<=-0.03020063713192939\n",
      "   +4.6705 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "   -0.0014 if pa>=0.19850285351276398\n",
      "   -3.2556 if cv<=-0.5685905337333679 & pav<=0.9192032098770142\n",
      "--------------\n",
      "   +4.1180 if cv<=-0.4239108204841614\n",
      "   -0.9911 if cp>=-0.04842094630002975\n",
      "   +1.5029 if cp<=-0.04900763109326362\n",
      "   +0.0001 if cp<=-0.0235468540340662 & cp>=-0.04435991868376732 & cv>=-0.358180969953537 & pa<=0.0681978389620781 & pa<=0.17756260931491852\n",
      "   -3.8801 if pa<=0.11504924893379212 & pa>=0.09308255612850189 & pav>=0.9192032098770142\n",
      "Run episode 219 with rewards 31.0\n",
      "============ 220 ===========\n",
      "72 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   +1.8886 if cv>=-0.4475941717624664\n",
      "   -5.2116 if cp<=-0.03020063713192939\n",
      "   +5.3419 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "   -0.0001 if cv<=-0.5685905337333679 & pav<=0.9192032098770142\n",
      "   -5.3926 if cp<=-0.01848515123128891 & cp>=-0.01848515123128891\n",
      "--------------\n",
      "   +2.0246 if cv<=-0.4239108204841614\n",
      "   +2.3023 if cp>=-0.04842094630002975\n",
      "   +2.9707 if cp<=-0.04900763109326362\n",
      "   -2.3662 if pa<=0.11504924893379212 & pa>=0.09308255612850189 & pav>=0.9192032098770142\n",
      "   -3.9005 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "Run episode 220 with rewards 72.0\n",
      "origin 135.4608498991925 new 138.32813491461832 not updated\n",
      "============ 221 ===========\n",
      "23 actions [0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1]\n",
      "   -1.7730 if cv>=-0.4475941717624664\n",
      "   -2.3146 if cp<=-0.03020063713192939\n",
      "   +8.9103 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "   -0.0001 if cp<=-0.01848515123128891 & cp>=-0.01848515123128891\n",
      "   +5.1767 if cp>=-0.012103290297091007 & cv<=-0.41887985467910765 & pa<=-0.0063225512392818895\n",
      "--------------\n",
      "   +2.0246 if cv<=-0.4239108204841614\n",
      "   +2.3023 if cp>=-0.04842094630002975\n",
      "   +2.9707 if cp<=-0.04900763109326362\n",
      "   -2.3662 if pa<=0.11504924893379212 & pa>=0.09308255612850189 & pav>=0.9192032098770142\n",
      "   -3.9005 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "Run episode 221 with rewards 23.0\n",
      "============ 222 ===========\n",
      "26 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.5556 if cv>=-0.4475941717624664\n",
      "   -1.5409 if cp<=-0.03020063713192939\n",
      "   +5.8858 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "   +0.0000 if cp>=-0.012103290297091007 & cv<=-0.41887985467910765 & pa<=-0.0063225512392818895\n",
      "   +0.0147 if cp>=-0.062081161141395565 & cv>=-0.22087514996528615\n",
      "--------------\n",
      "   +1.2503 if cp>=-0.04842094630002975\n",
      "   +1.4600 if cp<=-0.04900763109326362\n",
      "   +0.5885 if pa<=0.11504924893379212 & pa>=0.09308255612850189 & pav>=0.9192032098770142\n",
      "   -0.8205 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   +2.0546 if cv<=-0.3715309202671051 & pa<=0.07132412493228912\n",
      "Run episode 222 with rewards 26.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 223 ===========\n",
      "40 actions [0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   +0.3328 if cv>=-0.4475941717624664\n",
      "   -2.2015 if cp<=-0.03020063713192939\n",
      "   +5.2443 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "   +0.2449 if cp>=-0.062081161141395565 & cv>=-0.22087514996528615\n",
      "   -2.5819 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "--------------\n",
      "   +2.2161 if cp>=-0.04842094630002975\n",
      "   +2.7365 if cp<=-0.04900763109326362\n",
      "   -1.8344 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   +2.7978 if cv<=-0.3715309202671051 & pa<=0.07132412493228912\n",
      "   +1.6544 if pav<=0.6781032085418701 & pav>=0.6781032085418701\n",
      "Run episode 223 with rewards 40.0\n",
      "============ 224 ===========\n",
      "37 actions [0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1]\n",
      "   +0.4651 if cv>=-0.4475941717624664\n",
      "   -2.3062 if cp<=-0.03020063713192939\n",
      "   +5.3060 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "   -6.1281 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +4.8596 if cp>=-0.009577208291739218 & cv<=-0.34262049198150635\n",
      "--------------\n",
      "   +3.4905 if cp>=-0.04842094630002975\n",
      "   +3.2263 if cp<=-0.04900763109326362\n",
      "   -3.8379 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   +0.2897 if cv<=-0.3715309202671051 & pa<=0.07132412493228912\n",
      "   -3.3585 if cp<=-0.04272569566965103 & cv<=-0.1590231955051422 & pav<=0.5695533752441406\n",
      "Run episode 224 with rewards 37.0\n",
      "============ 225 ===========\n",
      "23 actions [0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0]\n",
      "   -2.4447 if cp<=-0.03020063713192939\n",
      "   +5.8010 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "   -3.0111 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +0.8425 if cp>=-0.009577208291739218 & cv<=-0.34262049198150635\n",
      "   +5.7050 if cp>=-0.021108832955360413 & cv<=-0.37257466912269593 & pav<=0.6128907084465027\n",
      "--------------\n",
      "   +6.2100 if cp>=-0.04842094630002975\n",
      "   +2.8875 if cp<=-0.04900763109326362\n",
      "   -6.8719 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   -0.2118 if cp<=-0.04272569566965103 & cv<=-0.1590231955051422 & pav<=0.5695533752441406\n",
      "   -4.0208 if cp>=-0.021108832955360413 & cv<=-0.37257466912269593 & pav<=0.6128907084465027\n",
      "Run episode 225 with rewards 23.0\n",
      "============ 226 ===========\n",
      "17 actions [0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   -0.3384 if cp<=-0.03020063713192939\n",
      "   +3.5930 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "   +0.7620 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +4.9970 if cp>=-0.021108832955360413 & cv<=-0.37257466912269593 & pav<=0.6128907084465027\n",
      "   +5.0451 if cp<=-0.05435553416609764 & pav<=0.028094302117824592\n",
      "--------------\n",
      "   +5.0636 if cp>=-0.04842094630002975\n",
      "   +0.8716 if cp<=-0.04900763109326362\n",
      "   -4.7722 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   -4.7640 if cp>=-0.021108832955360413 & cv<=-0.37257466912269593 & pav<=0.6128907084465027\n",
      "   -5.1187 if cp<=-0.05435553416609764 & pav<=0.028094302117824592\n",
      "Run episode 226 with rewards 17.0\n",
      "============ 227 ===========\n",
      "16 actions [0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1]\n",
      "   +5.0740 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "   +1.3325 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +0.0000 if cp>=-0.021108832955360413 & cv<=-0.37257466912269593 & pav<=0.6128907084465027\n",
      "   +0.0000 if cp<=-0.05435553416609764 & pav<=0.028094302117824592\n",
      "   +5.3525 if cp>=0.013979233801364909 & cv>=-0.38151112794876096 & pav>=0.6509832143783569\n",
      "--------------\n",
      "   +1.7859 if cp>=-0.04842094630002975\n",
      "   -2.6099 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   +0.0000 if cp>=-0.021108832955360413 & cv<=-0.37257466912269593 & pav<=0.6128907084465027\n",
      "   +0.0000 if cp<=-0.05435553416609764 & pav<=0.028094302117824592\n",
      "   +2.4602 if cp>=-0.030897304043173788 & cv<=-0.19025937914848326 & pav<=0.6509832143783569\n",
      "Run episode 227 with rewards 16.0\n",
      "============ 228 ===========\n",
      "16 actions [0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0]\n",
      "   +1.0537 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "   -0.5900 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   -0.0000 if cp<=-0.05435553416609764 & pav<=0.028094302117824592\n",
      "   -0.0000 if cp>=0.013979233801364909 & cv>=-0.38151112794876096 & pav>=0.6509832143783569\n",
      "   +3.1772 if cp<=-0.010842427611351013 & cv>=-0.41891029477119446\n",
      "--------------\n",
      "   -0.2520 if cp>=-0.04842094630002975\n",
      "   +0.3267 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   +0.0000 if cp<=-0.05435553416609764 & pav<=0.028094302117824592\n",
      "   +4.4848 if cp>=-0.030897304043173788 & cv<=-0.19025937914848326 & pav<=0.6509832143783569\n",
      "   +3.0334 if cp>=-0.04910212382674217 & pav>=0.6741473078727723\n",
      "Run episode 228 with rewards 16.0\n",
      "============ 229 ===========\n",
      "18 actions [0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0]\n",
      "   +1.5324 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "   -2.3249 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +0.0000 if cp>=0.013979233801364909 & cv>=-0.38151112794876096 & pav>=0.6509832143783569\n",
      "   +2.6235 if cp<=-0.010842427611351013 & cv>=-0.41891029477119446\n",
      "   +2.6788 if cv<=-0.3712434768676758 & pa<=0.025261955335736275\n",
      "--------------\n",
      "   -1.3221 if cp>=-0.04842094630002975\n",
      "   -1.3221 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   -0.0000 if cp>=-0.030897304043173788 & cv<=-0.19025937914848326 & pav<=0.6509832143783569\n",
      "   -0.0000 if cp>=-0.04910212382674217 & pav>=0.6741473078727723\n",
      "   +1.8159 if cp>=-0.055687446147203445\n",
      "Run episode 229 with rewards 18.0\n",
      "============ 230 ===========\n",
      "22 actions [0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1]\n",
      "   +0.8956 if cp>=-0.04842094630002975 & cv>=-0.35534352660179136\n",
      "   -3.7582 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +3.0185 if cp<=-0.010842427611351013 & cv>=-0.41891029477119446\n",
      "   +0.9641 if cv<=-0.3712434768676758 & pa<=0.025261955335736275\n",
      "   -2.9005 if cp<=-0.0866495594382286 & cv>=-0.1987998306751251\n",
      "--------------\n",
      "   -1.7162 if cp>=-0.04842094630002975\n",
      "   -1.1711 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   +0.0000 if cp>=-0.030897304043173788 & cv<=-0.19025937914848326 & pav<=0.6509832143783569\n",
      "   +2.5719 if cp>=-0.055687446147203445\n",
      "   +2.5344 if cp<=-0.0866495594382286 & cv>=-0.1987998306751251\n",
      "Run episode 230 with rewards 22.0\n",
      "============ 231 ===========\n",
      "21 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0]\n",
      "   -3.7289 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +4.2277 if cp<=-0.010842427611351013 & cv>=-0.41891029477119446\n",
      "   -1.1026 if cv<=-0.3712434768676758 & pa<=0.025261955335736275\n",
      "   -0.0000 if cp<=-0.0866495594382286 & cv>=-0.1987998306751251\n",
      "   +3.6888 if cv<=-0.3211576789617536 & pav<=0.5353778839111328\n",
      "--------------\n",
      "   -3.7066 if cp>=-0.04842094630002975\n",
      "   +2.0639 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   +2.0639 if cp>=-0.055687446147203445\n",
      "   +0.0000 if cp<=-0.0866495594382286 & cv>=-0.1987998306751251\n",
      "   -0.9572 if cp>=-0.06504419595003127 & cv<=-0.3211576789617536\n",
      "Run episode 231 with rewards 21.0\n",
      "============ 232 ===========\n",
      "14 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1]\n",
      "   -3.7211 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +3.9274 if cp<=-0.010842427611351013 & cv>=-0.41891029477119446\n",
      "   -1.3978 if cv<=-0.3712434768676758 & pa<=0.025261955335736275\n",
      "   +3.7619 if cv<=-0.3211576789617536 & pav<=0.5353778839111328\n",
      "   +3.7307 if cp<=-0.14206790924072266 & cv<=-0.41799449920654297 & cv>=-0.43221142888069153 & pav<=0.7852320075035095\n",
      "--------------\n",
      "   -0.3020 if cp>=-0.04842094630002975\n",
      "   -1.0737 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   -0.3020 if cp>=-0.055687446147203445\n",
      "   -0.0289 if cp>=-0.06504419595003127 & cv<=-0.3211576789617536\n",
      "   -3.7372 if cp<=-0.14206790924072266 & cv<=-0.41970932483673096 & pav<=0.7852320075035095\n",
      "Run episode 232 with rewards 14.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 233 ===========\n",
      "20 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1]\n",
      "   -3.1677 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +1.8654 if cp<=-0.010842427611351013 & cv>=-0.41891029477119446\n",
      "   +0.0000 if cv<=-0.3211576789617536 & pav<=0.5353778839111328\n",
      "   +0.0000 if cp<=-0.14206790924072266 & cv<=-0.41799449920654297 & cv>=-0.43221142888069153 & pav<=0.7852320075035095\n",
      "   -3.0088 if cp>=0.014986315183341505 & cv<=-0.21335616111755357\n",
      "--------------\n",
      "   +0.7749 if cp>=-0.04842094630002975\n",
      "   -4.9768 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   +0.7565 if cp>=-0.055687446147203445\n",
      "   +0.0000 if cp<=-0.14206790924072266 & cv<=-0.41970932483673096 & pav<=0.7852320075035095\n",
      "   -0.7101 if cv<=-0.3663216710090637\n",
      "Run episode 233 with rewards 20.0\n",
      "============ 234 ===========\n",
      "20 actions [0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -5.0916 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +2.6869 if cp<=-0.010842427611351013 & cv>=-0.41891029477119446\n",
      "   +0.8244 if cv<=-0.3211576789617536 & pav<=0.5353778839111328\n",
      "   +0.4842 if cp>=0.014986315183341505 & cv<=-0.21335616111755357\n",
      "   +1.3406 if cp>=-0.09392058849334717 & cv<=-0.42816460132598877 & pav>=0.5469551801681518\n",
      "--------------\n",
      "   +1.7742 if cp>=-0.04842094630002975\n",
      "   -3.5535 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   -2.0031 if cp>=-0.055687446147203445\n",
      "   +0.0924 if cv<=-0.3663216710090637\n",
      "   -3.0112 if cv>=-0.42816460132598877\n",
      "Run episode 234 with rewards 20.0\n",
      "============ 235 ===========\n",
      "17 actions [0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -3.6252 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +0.8856 if cp<=-0.010842427611351013 & cv>=-0.41891029477119446\n",
      "   -0.0000 if cv<=-0.3211576789617536 & pav<=0.5353778839111328\n",
      "   -1.1523 if cp>=-0.09392058849334717 & cv<=-0.42816460132598877 & pav>=0.5469551801681518\n",
      "   -3.1749 if cp<=-0.0006213464308529961 & cv<=-0.3518273293972012 & cv>=-0.4242498278617859\n",
      "--------------\n",
      "   +5.5548 if cp>=-0.04842094630002975\n",
      "   -3.0910 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   -3.4573 if cp>=-0.055687446147203445\n",
      "   -2.4407 if cv>=-0.42816460132598877\n",
      "   -2.2699 if cp>=-0.0006213464308529961 & cv<=-0.3518273293972012 & cv>=-0.4242498278617859\n",
      "Run episode 235 with rewards 17.0\n",
      "============ 236 ===========\n",
      "22 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -3.0856 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   -1.5363 if cp<=-0.010842427611351013 & cv>=-0.41891029477119446\n",
      "   +0.0000 if cp>=-0.09392058849334717 & cv<=-0.42816460132598877 & pav>=0.5469551801681518\n",
      "   -3.5693 if cp<=-0.0006213464308529961 & cv<=-0.3518273293972012 & cv>=-0.4242498278617859\n",
      "   +2.5170 if cv>=-0.2074990063905716\n",
      "--------------\n",
      "   -0.9430 if cp>=-0.04842094630002975\n",
      "   -2.0002 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   -0.7804 if cp>=-0.055687446147203445\n",
      "   +0.1486 if cv>=-0.42816460132598877\n",
      "   -1.8621 if cp<=-0.0542319819331169 & cv>=-0.2074990063905716\n",
      "Run episode 236 with rewards 22.0\n",
      "============ 237 ===========\n",
      "23 actions [0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -2.7511 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   -0.1477 if cp<=-0.010842427611351013 & cv>=-0.41891029477119446\n",
      "   -2.8457 if cp<=-0.0006213464308529961 & cv<=-0.3518273293972012 & cv>=-0.4242498278617859\n",
      "   +2.6980 if cv>=-0.2074990063905716\n",
      "   -0.4512 if cv<=-0.3815720796585083 & pav>=0.6173649668693543\n",
      "--------------\n",
      "   -0.6298 if cp>=-0.04842094630002975\n",
      "   -1.1300 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   -0.9008 if cp>=-0.055687446147203445\n",
      "   -1.9591 if cp<=-0.0542319819331169 & cv>=-0.2074990063905716\n",
      "   -1.9836 if cv>=-0.1956001877784729\n",
      "Run episode 237 with rewards 23.0\n",
      "============ 238 ===========\n",
      "17 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   -2.5740 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   -5.7697 if cp<=-0.0006213464308529961 & cv<=-0.3518273293972012 & cv>=-0.4242498278617859\n",
      "   +1.3380 if cv>=-0.2074990063905716\n",
      "   -2.4992 if cv<=-0.3815720796585083 & pav>=0.6173649668693543\n",
      "   +0.4490 if \n",
      "--------------\n",
      "   +1.4434 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   +0.1807 if cp>=-0.055687446147203445\n",
      "   -0.6631 if cp<=-0.0542319819331169 & cv>=-0.2074990063905716\n",
      "   -3.4293 if cv>=-0.1956001877784729\n",
      "   -2.2345 if cp>=-0.015325212851166715 & cv<=-0.19491941332817075 & cv>=-0.3773327529430389\n",
      "Run episode 238 with rewards 17.0\n",
      "============ 239 ===========\n",
      "17 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -1.7312 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   -2.0081 if cp<=-0.0006213464308529961 & cv<=-0.3518273293972012 & cv>=-0.4242498278617859\n",
      "   +2.0570 if cv>=-0.2074990063905716\n",
      "   -1.1535 if cv<=-0.3815720796585083 & pav>=0.6173649668693543\n",
      "   -2.3653 if cv>=-0.30973643064498896 & pav>=0.6234838962554932\n",
      "--------------\n",
      "   -1.1861 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   +1.0419 if cp<=-0.0542319819331169 & cv>=-0.2074990063905716\n",
      "   -2.0134 if cv>=-0.1956001877784729\n",
      "   -0.0000 if cp>=-0.015325212851166715 & cv<=-0.19491941332817075 & cv>=-0.3773327529430389\n",
      "   -1.6869 if cp<=-0.05020944550633429 & pav<=0.6234838962554932\n",
      "Run episode 239 with rewards 17.0\n",
      "============ 240 ===========\n",
      "24 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1]\n",
      "   -2.7649 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   -1.3350 if cp<=-0.0006213464308529961 & cv<=-0.3518273293972012 & cv>=-0.4242498278617859\n",
      "   +2.6039 if cv>=-0.2074990063905716\n",
      "   +0.2070 if cv>=-0.30973643064498896 & pav>=0.6234838962554932\n",
      "   -0.8604 if \n",
      "--------------\n",
      "   -1.3956 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   -1.1861 if cp<=-0.0542319819331169 & cv>=-0.2074990063905716\n",
      "   -2.5818 if cv>=-0.1956001877784729\n",
      "   -0.7105 if cp<=-0.05020944550633429 & pav<=0.6234838962554932\n",
      "   +1.4417 if \n",
      "Run episode 240 with rewards 24.0\n",
      "============ 241 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1]\n",
      "   -0.6032 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   -0.1852 if cp<=-0.0006213464308529961 & cv<=-0.3518273293972012 & cv>=-0.4242498278617859\n",
      "   +4.7749 if cv>=-0.2074990063905716\n",
      "   -2.8117 if \n",
      "   +2.5427 if cp>=-0.03902865871787071 & cv<=-0.21990827918052674 & pav>=0.4386511385440827\n",
      "--------------\n",
      "   +2.4751 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   -0.0313 if cp<=-0.0542319819331169 & cv>=-0.2074990063905716\n",
      "   -5.0296 if cv>=-0.1956001877784729\n",
      "   +0.0004 if \n",
      "   -2.9946 if cp>=-0.03902865871787071 & pav>=0.4386511385440827\n",
      "Run episode 241 with rewards 11.0\n",
      "============ 242 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 1, 1, 0, 1]\n",
      "   -0.6088 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +2.2316 if cv>=-0.2074990063905716\n",
      "   -1.4837 if \n",
      "   +2.3954 if cp>=-0.03902865871787071 & cv<=-0.21990827918052674 & pav>=0.4386511385440827\n",
      "   -0.0395 if pa>=0.20533423125743866\n",
      "--------------\n",
      "   -0.7337 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   -0.0915 if cp<=-0.0542319819331169 & cv>=-0.2074990063905716\n",
      "   -0.8252 if cv>=-0.1956001877784729\n",
      "   -3.5341 if cp>=-0.03902865871787071 & pav>=0.4386511385440827\n",
      "   -0.9110 if cv>=-0.3799735903739929\n",
      "Run episode 242 with rewards 10.0\n",
      "============ 243 ===========\n",
      "16 actions [0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0]\n",
      "   -1.6482 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +0.8491 if cv>=-0.2074990063905716\n",
      "   +0.8620 if \n",
      "   +1.1349 if cp>=-0.03902865871787071 & cv<=-0.21990827918052674 & pav>=0.4386511385440827\n",
      "   -1.0845 if pav>=1.792494773864746\n",
      "--------------\n",
      "   -0.7169 if cp>=-0.050379715859889984 & pav<=0.5525406002998352\n",
      "   -0.7169 if cv>=-0.1956001877784729\n",
      "   -2.3562 if cp>=-0.03902865871787071 & pav>=0.4386511385440827\n",
      "   -0.8992 if cv>=-0.3799735903739929\n",
      "   -1.2715 if cp>=-0.0027518722228705847\n",
      "Run episode 243 with rewards 16.0\n",
      "============ 244 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -3.2776 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +1.0764 if \n",
      "   +2.5049 if cp>=-0.03902865871787071 & cv<=-0.21990827918052674 & pav>=0.4386511385440827\n",
      "   +0.0000 if pav>=1.792494773864746\n",
      "   +4.7163 if cp<=-0.07690728455781934 & cp>=-0.17082376778125763 & cv<=-0.6186946630477902 & cv>=-0.8160397410392761\n",
      "--------------\n",
      "   -0.5056 if cv>=-0.1956001877784729\n",
      "   -2.8193 if cp>=-0.03902865871787071 & pav>=0.4386511385440827\n",
      "   -2.3147 if cv>=-0.3799735903739929\n",
      "   +0.0000 if cp>=-0.0027518722228705847\n",
      "   +0.4435 if cp>=-0.07690728455781934 & cv<=-0.4236404299736023\n",
      "Run episode 244 with rewards 8.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 245 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +0.6500 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +0.1300 if \n",
      "   +0.6500 if cp>=-0.03902865871787071 & cv<=-0.21990827918052674 & pav>=0.4386511385440827\n",
      "   +0.0000 if cp<=-0.07690728455781934 & cp>=-0.17082376778125763 & cv<=-0.6186946630477902 & cv>=-0.8160397410392761\n",
      "   +0.9096 if cp>=0.020525609701871873\n",
      "--------------\n",
      "   -0.6778 if cv>=-0.1956001877784729\n",
      "   -1.3475 if cp>=-0.03902865871787071 & pav>=0.4386511385440827\n",
      "   -0.9618 if cv>=-0.3799735903739929\n",
      "   -0.7077 if cp>=-0.07690728455781934 & cv<=-0.4236404299736023\n",
      "   -1.4434 if cp>=-0.0026517412683460823\n",
      "Run episode 245 with rewards 10.0\n",
      "============ 246 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0757 if cv<=-0.19157974421977997 & pa<=0.15566210448741913 & pav>=0.583642840385437\n",
      "   +2.6664 if \n",
      "   +0.2388 if cp>=-0.03902865871787071 & cv<=-0.21990827918052674 & pav>=0.4386511385440827\n",
      "   +0.2037 if cp>=0.020525609701871873\n",
      "   +2.4449 if pa>=0.18643324077129364\n",
      "--------------\n",
      "   -0.9165 if cp>=-0.03902865871787071 & pav>=0.4386511385440827\n",
      "   -1.2026 if cv>=-0.3799735903739929\n",
      "   -1.2297 if cp>=-0.07690728455781934 & cv<=-0.4236404299736023\n",
      "   -1.5812 if cp>=-0.0026517412683460823\n",
      "   -2.2516 if pa>=0.18643324077129364\n",
      "Run episode 246 with rewards 8.0\n",
      "============ 247 ===========\n",
      "11 actions [0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1]\n",
      "   +0.9492 if \n",
      "   +1.1172 if cp>=-0.03902865871787071 & cv<=-0.21990827918052674 & pav>=0.4386511385440827\n",
      "   -0.0000 if cp>=0.020525609701871873\n",
      "   -0.0000 if pa>=0.18643324077129364\n",
      "   -1.8551 if pa>=0.1680329144001007\n",
      "--------------\n",
      "   -0.4891 if cv>=-0.3799735903739929\n",
      "   -0.7220 if cp>=-0.07690728455781934 & cv<=-0.4236404299736023\n",
      "   -0.4891 if cp>=-0.0026517412683460823\n",
      "   +0.0000 if pa>=0.18643324077129364\n",
      "   -0.8432 if cp>=-0.011729464679956428\n",
      "Run episode 247 with rewards 11.0\n",
      "============ 248 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1]\n",
      "   +1.8171 if \n",
      "   -3.1986 if cp>=-0.03902865871787071 & cv<=-0.21990827918052674 & pav>=0.4386511385440827\n",
      "   -0.0000 if pa>=0.18643324077129364\n",
      "   +1.9283 if pa>=0.1680329144001007\n",
      "   +3.1402 if cp<=-0.0005182931199669838 & cv>=-0.5909072160720825\n",
      "--------------\n",
      "   -0.8314 if cv>=-0.3799735903739929\n",
      "   -0.6802 if cp>=-0.07690728455781934 & cv<=-0.4236404299736023\n",
      "   -1.0924 if cp>=-0.0026517412683460823\n",
      "   -1.4293 if cp>=-0.011729464679956428\n",
      "   +4.0312 if cp<=-0.020259829238057126 & pa<=0.002990087028592825\n",
      "Run episode 248 with rewards 12.0\n",
      "============ 249 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 1, 0, 0]\n",
      "   +2.6102 if \n",
      "   -1.0847 if cp>=-0.03902865871787071 & cv<=-0.21990827918052674 & pav>=0.4386511385440827\n",
      "   +2.6271 if pa>=0.1680329144001007\n",
      "   +4.2153 if cp<=-0.0005182931199669838 & cv>=-0.5909072160720825\n",
      "   -2.4003 if cp<=-0.07934917956590652 & cp>=-0.11967403292655944\n",
      "--------------\n",
      "   -0.1471 if cv>=-0.3799735903739929\n",
      "   -0.0000 if cp>=-0.0026517412683460823\n",
      "   -0.0000 if cp>=-0.011729464679956428\n",
      "   +0.7852 if cp<=-0.020259829238057126 & pa<=0.002990087028592825\n",
      "   -1.8191 if cp>=-0.02845750302076339\n",
      "Run episode 249 with rewards 10.0\n",
      "============ 250 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 1, 0]\n",
      "   +2.0160 if \n",
      "   -2.4925 if pa>=0.1680329144001007\n",
      "   +0.8233 if cp<=-0.0005182931199669838 & cv>=-0.5909072160720825\n",
      "   -0.4464 if cp<=-0.07934917956590652 & cp>=-0.11967403292655944\n",
      "   -3.1761 if cv<=-1.1715060472488403\n",
      "--------------\n",
      "   -0.0360 if cv>=-0.3799735903739929\n",
      "   -0.0076 if cp>=-0.011729464679956428\n",
      "   -0.0000 if cp<=-0.020259829238057126 & pa<=0.002990087028592825\n",
      "   -0.0531 if cp>=-0.02845750302076339\n",
      "   -1.2281 if cp>=-0.054706879705190656\n",
      "Run episode 250 with rewards 9.0\n",
      "============ 251 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +0.4576 if \n",
      "   -1.2538 if pa>=0.1680329144001007\n",
      "   +0.8685 if cp<=-0.0005182931199669838 & cv>=-0.5909072160720825\n",
      "   -1.3237 if cv<=-1.1715060472488403\n",
      "   +1.7332 if cp>=-0.04412382766604423\n",
      "--------------\n",
      "   -0.2487 if cv>=-0.3799735903739929\n",
      "   -0.3737 if cp>=-0.011729464679956428\n",
      "   -0.7037 if cp>=-0.02845750302076339\n",
      "   -1.5437 if cp>=-0.054706879705190656\n",
      "   +0.4083 if \n",
      "Run episode 251 with rewards 10.0\n",
      "============ 252 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 1, 0, 0, 0]\n",
      "   +2.5294 if pa>=0.1680329144001007\n",
      "   -0.0000 if cp<=-0.0005182931199669838 & cv>=-0.5909072160720825\n",
      "   +2.4658 if cv<=-1.1715060472488403\n",
      "   +2.0199 if cp>=-0.04412382766604423\n",
      "   -0.1721 if pav>=2.3458900451660156\n",
      "--------------\n",
      "   -0.2408 if cp>=-0.011729464679956428\n",
      "   -0.2723 if cp>=-0.02845750302076339\n",
      "   -0.5862 if cp>=-0.054706879705190656\n",
      "   -2.8668 if \n",
      "   -2.4553 if pa>=0.1845792829990387\n",
      "Run episode 252 with rewards 9.0\n",
      "============ 253 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   -0.0108 if pa>=0.1680329144001007\n",
      "   -0.0000 if cv<=-1.1715060472488403\n",
      "   +0.9206 if cp>=-0.04412382766604423\n",
      "   -0.0000 if pav>=2.3458900451660156\n",
      "   -2.5244 if cp<=-0.059460674226284024 & cp>=-0.08738023787736893\n",
      "--------------\n",
      "   -0.3576 if cp>=-0.02845750302076339\n",
      "   -1.5945 if cp>=-0.054706879705190656\n",
      "   -0.9637 if \n",
      "   +0.0692 if pa>=0.1845792829990387\n",
      "   +1.0467 if cp<=-0.059460674226284024 & cp>=-0.08738023787736893\n",
      "Run episode 253 with rewards 8.0\n",
      "============ 254 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.7140 if pa>=0.1680329144001007\n",
      "   +2.7140 if cv<=-1.1715060472488403\n",
      "   +1.2700 if cp>=-0.04412382766604423\n",
      "   +2.7140 if cp<=-0.059460674226284024 & cp>=-0.08738023787736893\n",
      "   +2.7125 if cp<=-0.011223205178976054\n",
      "--------------\n",
      "   -0.3864 if cp>=-0.02845750302076339\n",
      "   -0.3873 if cp>=-0.054706879705190656\n",
      "   -3.0946 if \n",
      "   -2.7072 if cp<=-0.059460674226284024 & cp>=-0.08738023787736893\n",
      "   -2.7318 if cp<=0.011811462603509428\n",
      "Run episode 254 with rewards 10.0\n",
      "============ 255 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 0, 0]\n",
      "   -0.0096 if pa>=0.1680329144001007\n",
      "   -0.0090 if cv<=-1.1715060472488403\n",
      "   +0.0006 if cp<=-0.059460674226284024 & cp>=-0.08738023787736893\n",
      "   +0.0455 if cp<=-0.011223205178976054\n",
      "   +0.1591 if \n",
      "--------------\n",
      "   -1.0548 if cp>=-0.054706879705190656\n",
      "   -1.1069 if \n",
      "   -0.0001 if cp<=-0.059460674226284024 & cp>=-0.08738023787736893\n",
      "   -1.1069 if cp<=0.011811462603509428\n",
      "   -0.0699 if cp<=-0.017073611170053477\n",
      "Run episode 255 with rewards 9.0\n",
      "============ 256 ===========\n",
      "14 actions [0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1]\n",
      "   -0.0525 if pa>=0.1680329144001007\n",
      "   +0.0000 if cv<=-1.1715060472488403\n",
      "   -0.7655 if cp<=-0.011223205178976054\n",
      "   +0.6266 if \n",
      "   -2.1841 if cp>=-0.06848140954971313 & cv<=-1.0137367367744445\n",
      "--------------\n",
      "   -2.8609 if cp>=-0.054706879705190656\n",
      "   -0.4514 if \n",
      "   -0.4514 if cp<=0.011811462603509428\n",
      "   +1.1997 if cp<=-0.017073611170053477\n",
      "   +0.2847 if cp<=-0.06848140954971313\n",
      "Run episode 256 with rewards 14.0\n",
      "============ 257 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   -1.4007 if pa>=0.1680329144001007\n",
      "   -0.9237 if cp<=-0.011223205178976054\n",
      "   -0.9237 if \n",
      "   -0.0000 if cp>=-0.06848140954971313 & cv<=-1.0137367367744445\n",
      "   +3.2553 if cv>=-0.7035442590713501\n",
      "--------------\n",
      "   -3.7603 if cp>=-0.054706879705190656\n",
      "   +0.0785 if \n",
      "   +0.0785 if cp<=0.011811462603509428\n",
      "   +0.0785 if cp<=-0.017073611170053477\n",
      "   -0.9455 if cp<=-0.05325836166739464 & cv>=-0.6224732756614685\n",
      "Run episode 257 with rewards 10.0\n",
      "============ 258 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.7259 if pa>=0.1680329144001007\n",
      "   +2.7384 if cp<=-0.011223205178976054\n",
      "   +2.8870 if \n",
      "   +0.1254 if cv>=-0.7035442590713501\n",
      "   -0.0072 if pav>=2.365217924118042\n",
      "--------------\n",
      "   -0.3926 if cp>=-0.054706879705190656\n",
      "   -3.1543 if \n",
      "   -2.9977 if cp<=0.011811462603509428\n",
      "   -0.0000 if cp<=-0.05325836166739464 & cv>=-0.6224732756614685\n",
      "   -2.7169 if pa>=0.17350324988365173\n",
      "Run episode 258 with rewards 8.0\n",
      "============ 259 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0024 if pa>=0.1680329144001007\n",
      "   -0.0015 if cp<=-0.011223205178976054\n",
      "   +0.5410 if \n",
      "   +0.4524 if cv>=-0.7035442590713501\n",
      "   +0.5384 if cp>=0.017338381335139277\n",
      "--------------\n",
      "   -0.7893 if cp>=-0.054706879705190656\n",
      "   -0.7893 if \n",
      "   -0.0545 if cp<=0.011811462603509428\n",
      "   +0.0000 if pa>=0.17350324988365173\n",
      "   -0.2945 if cp<=0.044763692468404774 & cp>=0.017338381335139277\n",
      "Run episode 259 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 260 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   -4.1049 if pa>=0.1680329144001007\n",
      "   -1.2021 if \n",
      "   +1.0618 if cv>=-0.7035442590713501\n",
      "   +0.0000 if cp>=0.017338381335139277\n",
      "   +3.0170 if cp>=-0.11279532611370087\n",
      "--------------\n",
      "   -0.9343 if cp>=-0.054706879705190656\n",
      "   -1.4663 if \n",
      "   -1.4663 if cp<=0.011811462603509428\n",
      "   -0.0000 if cp<=0.044763692468404774 & cp>=0.017338381335139277\n",
      "   +0.1520 if cp<=-0.11279532611370087\n",
      "Run episode 260 with rewards 10.0\n",
      "============ 261 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +4.1136 if pa>=0.1680329144001007\n",
      "   +4.1603 if \n",
      "   +0.0296 if cv>=-0.7035442590713501\n",
      "   +0.0469 if cp>=-0.11279532611370087\n",
      "   +2.4114 if pa>=0.2018057405948639\n",
      "--------------\n",
      "   -0.6237 if cp>=-0.054706879705190656\n",
      "   -1.0651 if \n",
      "   -1.0651 if cp<=0.011811462603509428\n",
      "   -0.2250 if cp<=-0.11279532611370087\n",
      "   -0.2613 if pa>=0.2018057405948639\n",
      "Run episode 261 with rewards 8.0\n",
      "============ 262 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0489 if pa>=0.1680329144001007\n",
      "   +0.8411 if \n",
      "   +0.8411 if cp>=-0.11279532611370087\n",
      "   -0.0000 if pa>=0.2018057405948639\n",
      "   +0.3283 if cp<=-8.289625402539778e-05\n",
      "--------------\n",
      "   -0.3868 if cp>=-0.054706879705190656\n",
      "   -0.3930 if \n",
      "   -0.3930 if cp<=0.011811462603509428\n",
      "   -0.0000 if pa>=0.2018057405948639\n",
      "   -0.0280 if cp<=-0.024278481304645536\n",
      "Run episode 262 with rewards 9.0\n",
      "============ 263 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if pa>=0.1680329144001007\n",
      "   +1.5560 if \n",
      "   +1.5560 if cp>=-0.11279532611370087\n",
      "   -0.0269 if cp<=-8.289625402539778e-05\n",
      "   +0.6164 if cp<=0.037796685844659804 & cp>=-0.025213143602013585\n",
      "--------------\n",
      "   -1.3003 if cp>=-0.054706879705190656\n",
      "   -1.2116 if \n",
      "   -0.0209 if cp<=0.011811462603509428\n",
      "   +0.0848 if cp<=-0.024278481304645536\n",
      "   -0.4683 if cp<=0.037796685844659804\n",
      "Run episode 263 with rewards 9.0\n",
      "============ 264 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8697 if \n",
      "   +0.8697 if cp>=-0.11279532611370087\n",
      "   -0.0975 if cp<=-8.289625402539778e-05\n",
      "   +0.2733 if cp<=0.037796685844659804 & cp>=-0.025213143602013585\n",
      "   +0.4498 if cp>=0.04271928071975708\n",
      "--------------\n",
      "   -0.7871 if cp>=-0.054706879705190656\n",
      "   -0.7285 if \n",
      "   +0.0557 if cp<=-0.024278481304645536\n",
      "   -0.0958 if cp<=0.037796685844659804\n",
      "   -0.2448 if cp<=0.04271928071975708\n",
      "Run episode 264 with rewards 9.0\n",
      "============ 265 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   -0.8070 if \n",
      "   +2.5671 if cp>=-0.11279532611370087\n",
      "   +0.8169 if cp<=0.037796685844659804 & cp>=-0.025213143602013585\n",
      "   +0.0000 if cp>=0.04271928071975708\n",
      "   -3.1323 if cp<=-0.08475320041179657\n",
      "--------------\n",
      "   -0.7220 if cp>=-0.054706879705190656\n",
      "   -0.7823 if \n",
      "   -0.7823 if cp<=0.037796685844659804\n",
      "   -0.7823 if cp<=0.04271928071975708\n",
      "   +0.1678 if cp<=-0.08475320041179657\n",
      "Run episode 265 with rewards 11.0\n",
      "============ 266 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.3782 if \n",
      "   -1.4050 if cp>=-0.11279532611370087\n",
      "   +0.5039 if cp<=0.037796685844659804 & cp>=-0.025213143602013585\n",
      "   -0.3848 if cp<=-0.08475320041179657\n",
      "   +2.9912 if cv>=-1.4054123163223267\n",
      "--------------\n",
      "   -1.2816 if cp>=-0.054706879705190656\n",
      "   -0.3518 if \n",
      "   -0.3518 if cp<=0.037796685844659804\n",
      "   -0.3518 if cp<=0.04271928071975708\n",
      "   -0.5387 if cv>=-1.4054123163223267 & pa>=0.035637006163597135\n",
      "Run episode 266 with rewards 10.0\n",
      "============ 267 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +1.2539 if cp>=-0.11279532611370087\n",
      "   -0.0000 if cp<=0.037796685844659804 & cp>=-0.025213143602013585\n",
      "   -2.6691 if cp<=-0.08475320041179657\n",
      "   +2.1851 if cv>=-1.4054123163223267\n",
      "   -4.1195 if pa>=0.1782267838716507\n",
      "--------------\n",
      "   -1.6278 if cp>=-0.054706879705190656\n",
      "   -0.2434 if cp<=0.037796685844659804\n",
      "   -0.2434 if cp<=0.04271928071975708\n",
      "   -0.5733 if cv>=-1.4054123163223267 & pa>=0.035637006163597135\n",
      "   +4.0157 if pa>=0.1782267838716507\n",
      "Run episode 267 with rewards 9.0\n",
      "============ 268 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.9375 if cp>=-0.11279532611370087\n",
      "   +3.6663 if cp<=-0.08475320041179657\n",
      "   +0.9375 if cv>=-1.4054123163223267\n",
      "   +3.6662 if pa>=0.1782267838716507\n",
      "   +3.6964 if cp<=-0.03355707302689552\n",
      "--------------\n",
      "   -0.5788 if cp>=-0.054706879705190656\n",
      "   -1.0502 if cp<=0.04271928071975708\n",
      "   -0.5044 if cv>=-1.4054123163223267 & pa>=0.035637006163597135\n",
      "   -0.0124 if pa>=0.1782267838716507\n",
      "   -0.0389 if cp<=-0.09851870238780976\n",
      "Run episode 268 with rewards 9.0\n",
      "============ 269 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.4871 if cp>=-0.11279532611370087\n",
      "   -0.3403 if cp<=-0.08475320041179657\n",
      "   -0.0000 if pa>=0.1782267838716507\n",
      "   +0.0059 if cp<=-0.03355707302689552\n",
      "   +1.1659 if cp>=-0.010104698687791817\n",
      "--------------\n",
      "   -1.2347 if cp>=-0.054706879705190656\n",
      "   -1.2349 if cp<=0.04271928071975708\n",
      "   -0.1390 if cv>=-1.4054123163223267 & pa>=0.035637006163597135\n",
      "   +0.0003 if cp<=-0.09851870238780976\n",
      "   -0.0037 if cp<=-0.03060951009392738\n",
      "Run episode 269 with rewards 9.0\n",
      "============ 270 ===========\n",
      "37 actions [0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.3855 if cp>=-0.11279532611370087\n",
      "   -3.6189 if cp<=-0.08475320041179657\n",
      "   -2.0258 if cp<=-0.03355707302689552\n",
      "   -0.0000 if cp>=-0.010104698687791817\n",
      "   -3.7889 if pa>=0.20631426572799683\n",
      "--------------\n",
      "   -2.3206 if cp>=-0.054706879705190656\n",
      "   +0.3420 if cp<=0.04271928071975708\n",
      "   -1.9309 if cv>=-1.4054123163223267 & pa>=0.035637006163597135\n",
      "   +2.0125 if cp<=-0.03060951009392738\n",
      "   +3.7844 if pa>=0.20631426572799683\n",
      "Run episode 270 with rewards 37.0\n",
      "============ 271 ===========\n",
      "40 actions [1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1]\n",
      "   +0.6629 if cp>=-0.11279532611370087\n",
      "   +1.4422 if cp<=-0.08475320041179657\n",
      "   -1.7879 if cp<=-0.03355707302689552\n",
      "   +0.0000 if pa>=0.20631426572799683\n",
      "   -4.2737 if cp<=-0.08099639117717743 & pa>=0.09297403991222382\n",
      "--------------\n",
      "   -2.0641 if cp>=-0.054706879705190656\n",
      "   -1.8699 if cv>=-1.4054123163223267 & pa>=0.035637006163597135\n",
      "   +1.3146 if cp<=-0.03060951009392738\n",
      "   +0.0000 if pa>=0.20631426572799683\n",
      "   +2.0970 if cp>=-0.08099639117717743\n",
      "Run episode 271 with rewards 40.0\n",
      "============ 272 ===========\n",
      "54 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1]\n",
      "   +0.5897 if cp>=-0.11279532611370087\n",
      "   +1.1396 if cp<=-0.08475320041179657\n",
      "   -2.3315 if cp<=-0.03355707302689552\n",
      "   +0.0000 if cp<=-0.08099639117717743 & pa>=0.09297403991222382\n",
      "   -4.3973 if cp>=-0.0903333842754364 & cv<=-0.022616906091570854 & pa>=-0.01969499886035919\n",
      "--------------\n",
      "   -0.3710 if cp>=-0.054706879705190656\n",
      "   +0.0000 if cv>=-1.4054123163223267 & pa>=0.035637006163597135\n",
      "   +2.2026 if cp<=-0.03060951009392738\n",
      "   +0.4894 if cp>=-0.08099639117717743\n",
      "   +4.3873 if cp>=-0.0903333842754364 & cv<=-0.022616906091570854 & pa>=-0.01969499886035919\n",
      "Run episode 272 with rewards 54.0\n",
      "============ 273 ===========\n",
      "24 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +3.1482 if cp>=-0.11279532611370087\n",
      "   +0.0000 if cp<=-0.08475320041179657\n",
      "   +0.0000 if cp<=-0.03355707302689552\n",
      "   -4.5246 if cp>=-0.0903333842754364 & cv<=-0.022616906091570854 & pa>=-0.01969499886035919\n",
      "   -2.4763 if cp<=-0.02046313099563122 & pav<=0.1402955144643786\n",
      "--------------\n",
      "   -2.0618 if cp>=-0.054706879705190656\n",
      "   +4.5525 if cp<=-0.03060951009392738\n",
      "   -2.0618 if cp>=-0.08099639117717743\n",
      "   +5.9252 if cp>=-0.0903333842754364 & cv<=-0.022616906091570854 & pa>=-0.01969499886035919\n",
      "   +3.5993 if cv>=-0.1890313982963562 & pa>=0.026955819875001914\n",
      "Run episode 273 with rewards 24.0\n",
      "============ 274 ===========\n",
      "27 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0]\n",
      "   +2.5183 if cp>=-0.11279532611370087\n",
      "   +0.0000 if cp<=-0.03355707302689552\n",
      "   -3.4725 if cp>=-0.0903333842754364 & cv<=-0.022616906091570854 & pa>=-0.01969499886035919\n",
      "   +0.0000 if cp<=-0.02046313099563122 & pav<=0.1402955144643786\n",
      "   +1.4778 if cp>=-0.001516864215955138\n",
      "--------------\n",
      "   -0.0000 if cp<=-0.03060951009392738\n",
      "   -0.3824 if cp>=-0.08099639117717743\n",
      "   +4.0420 if cp>=-0.0903333842754364 & cv<=-0.022616906091570854 & pa>=-0.01969499886035919\n",
      "   -0.4261 if cv>=-0.1890313982963562 & pa>=0.026955819875001914\n",
      "   -1.3879 if cv>=0.022743523493409162\n",
      "Run episode 274 with rewards 27.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 275 ===========\n",
      "51 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +1.6577 if cp>=-0.11279532611370087\n",
      "   -3.3407 if cp>=-0.0903333842754364 & cv<=-0.022616906091570854 & pa>=-0.01969499886035919\n",
      "   +1.1653 if cp<=-0.02046313099563122 & pav<=0.1402955144643786\n",
      "   +0.0000 if cp>=-0.001516864215955138\n",
      "   +2.2695 if cv>=-0.006811957526952023\n",
      "--------------\n",
      "   +0.7565 if cp>=-0.08099639117717743\n",
      "   +3.7539 if cp>=-0.0903333842754364 & cv<=-0.022616906091570854 & pa>=-0.01969499886035919\n",
      "   -0.6675 if cv>=-0.1890313982963562 & pa>=0.026955819875001914\n",
      "   +0.0000 if cv>=0.022743523493409162\n",
      "   -2.8119 if cv>=-0.006811957526952023\n",
      "Run episode 275 with rewards 51.0\n",
      "============ 276 ===========\n",
      "28 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +4.0169 if cp>=-0.11279532611370087\n",
      "   -6.1296 if cp>=-0.0903333842754364 & cv<=-0.022616906091570854 & pa>=-0.01969499886035919\n",
      "   -0.0000 if cp<=-0.02046313099563122 & pav<=0.1402955144643786\n",
      "   +0.7360 if cv>=-0.006811957526952023\n",
      "   +0.7385 if cp<=0.02772759087383747 & cv<=0.1343117952346802 & pav<=0.2446259856224061\n",
      "--------------\n",
      "   -1.6772 if cp>=-0.08099639117717743\n",
      "   +6.4685 if cp>=-0.0903333842754364 & cv<=-0.022616906091570854 & pa>=-0.01969499886035919\n",
      "   -0.0206 if cv>=-0.1890313982963562 & pa>=0.026955819875001914\n",
      "   -1.2895 if cv>=-0.006811957526952023\n",
      "   -0.9333 if cp<=0.03870861977338791 & cv<=0.1343117952346802 & pav<=0.3900669813156128\n",
      "Run episode 276 with rewards 28.0\n",
      "============ 277 ===========\n",
      "36 actions [1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0]\n",
      "   -0.1090 if cp>=-0.11279532611370087\n",
      "   -1.6519 if cp>=-0.0903333842754364 & cv<=-0.022616906091570854 & pa>=-0.01969499886035919\n",
      "   +1.5429 if cv>=-0.006811957526952023\n",
      "   +0.8320 if cp<=0.02772759087383747 & cv<=0.1343117952346802 & pav<=0.2446259856224061\n",
      "   +0.5157 if cp<=-0.054499171674251556 & cv>=-0.15299256443977355 & pav<=0.3895665764808655\n",
      "--------------\n",
      "   +0.6564 if cp>=-0.08099639117717743\n",
      "   +2.0850 if cp>=-0.0903333842754364 & cv<=-0.022616906091570854 & pa>=-0.01969499886035919\n",
      "   -1.4519 if cv>=-0.006811957526952023\n",
      "   -0.0334 if cp<=0.03870861977338791 & cv<=0.1343117952346802 & pav<=0.3900669813156128\n",
      "   +1.0183 if cv<=0.025913040339946757 & cv>=-0.16134010553359984\n",
      "Run episode 277 with rewards 36.0\n",
      "============ 278 ===========\n",
      "41 actions [0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0]\n",
      "   -0.0001 if cp>=-0.0903333842754364 & cv<=-0.022616906091570854 & pa>=-0.01969499886035919\n",
      "   +3.9595 if cv>=-0.006811957526952023\n",
      "   +2.7056 if cp<=0.02772759087383747 & cv<=0.1343117952346802 & pav<=0.2446259856224061\n",
      "   +0.7552 if cp<=-0.054499171674251556 & cv>=-0.15299256443977355 & pav<=0.3895665764808655\n",
      "   -3.1169 if cp<=-0.0392732135951519\n",
      "--------------\n",
      "   +1.4813 if cp>=-0.08099639117717743\n",
      "   -0.0001 if cp>=-0.0903333842754364 & cv<=-0.022616906091570854 & pa>=-0.01969499886035919\n",
      "   -1.9366 if cv>=-0.006811957526952023\n",
      "   +0.7115 if cv<=0.025913040339946757 & cv>=-0.16134010553359984\n",
      "   -2.2081 if cp>=-0.0392732135951519 & pa<=-0.0469292514026165 & pa>=-0.08339634537696836\n",
      "Run episode 278 with rewards 41.0\n",
      "============ 279 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1]\n",
      "   +7.4648 if cv>=-0.006811957526952023\n",
      "   +4.4240 if cp<=0.02772759087383747 & cv<=0.1343117952346802 & pav<=0.2446259856224061\n",
      "   +1.6214 if cp<=-0.054499171674251556 & cv>=-0.15299256443977355 & pav<=0.3895665764808655\n",
      "   -6.9124 if cp<=-0.0392732135951519\n",
      "   +3.0034 if cp>=-0.0627727210521698 & pa<=-0.04627456888556479\n",
      "--------------\n",
      "   +1.3444 if cp>=-0.08099639117717743\n",
      "   -2.3351 if cv>=-0.006811957526952023\n",
      "   +0.7881 if cv<=0.025913040339946757 & cv>=-0.16134010553359984\n",
      "   -4.5788 if cp>=-0.0392732135951519 & pa<=-0.0469292514026165 & pa>=-0.08339634537696836\n",
      "   -3.0026 if cp>=-0.014123460277915001\n",
      "Run episode 279 with rewards 12.0\n",
      "============ 280 ===========\n",
      "14 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1]\n",
      "   +0.1332 if cv>=-0.006811957526952023\n",
      "   -0.0000 if cp<=0.02772759087383747 & cv<=0.1343117952346802 & pav<=0.2446259856224061\n",
      "   -1.9086 if cp<=-0.0392732135951519\n",
      "   -0.0000 if cp>=-0.0627727210521698 & pa<=-0.04627456888556479\n",
      "   +2.2446 if cp>=0.0023463560268283104\n",
      "--------------\n",
      "   -0.6881 if cp>=-0.08099639117717743\n",
      "   -0.0005 if cv>=-0.006811957526952023\n",
      "   +0.0000 if cp>=-0.0392732135951519 & pa<=-0.0469292514026165 & pa>=-0.08339634537696836\n",
      "   -3.0071 if cp>=-0.014123460277915001\n",
      "   +2.2807 if pav>=1.7944064140319824\n",
      "Run episode 280 with rewards 14.0\n",
      "============ 281 ===========\n",
      "24 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cv>=-0.006811957526952023\n",
      "   -0.0000 if cp<=0.02772759087383747 & cv<=0.1343117952346802 & pav<=0.2446259856224061\n",
      "   -1.0160 if cp<=-0.0392732135951519\n",
      "   +1.3068 if cp>=0.0023463560268283104\n",
      "   -2.8169 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "--------------\n",
      "   -1.2642 if cp>=-0.08099639117717743\n",
      "   -0.0000 if cv>=-0.006811957526952023\n",
      "   -1.4139 if cp>=-0.014123460277915001\n",
      "   -0.0000 if pav>=1.7944064140319824\n",
      "   +3.1051 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "Run episode 281 with rewards 24.0\n",
      "============ 282 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1]\n",
      "   -0.1897 if cv>=-0.006811957526952023\n",
      "   +0.0000 if cp<=-0.0392732135951519\n",
      "   +2.5446 if cp>=0.0023463560268283104\n",
      "   -3.2447 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   -0.6992 if cp<=0.0038555560167878927 & pav>=1.0275235295295722\n",
      "--------------\n",
      "   -0.8384 if cp>=-0.08099639117717743\n",
      "   -2.1517 if cp>=-0.014123460277915001\n",
      "   +0.0286 if pav>=1.7944064140319824\n",
      "   +3.8586 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   -0.3261 if cp<=0.021788688004016885 & pav<=1.0275235295295722\n",
      "Run episode 282 with rewards 11.0\n",
      "============ 283 ===========\n",
      "11 actions [0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cv>=-0.006811957526952023\n",
      "   +1.3368 if cp>=0.0023463560268283104\n",
      "   -1.5651 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   +0.6425 if cp<=0.0038555560167878927 & pav>=1.0275235295295722\n",
      "   +0.9779 if cp<=0.0009900524746626728\n",
      "--------------\n",
      "   -0.8936 if cp>=-0.08099639117717743\n",
      "   -1.5254 if cp>=-0.014123460277915001\n",
      "   +1.5849 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   -0.0504 if cp<=0.021788688004016885 & pav<=1.0275235295295722\n",
      "   -1.3626 if cp<=0.0009900524746626728\n",
      "Run episode 283 with rewards 11.0\n",
      "============ 284 ===========\n",
      "13 actions [0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1]\n",
      "   +1.6928 if cp>=0.0023463560268283104\n",
      "   +0.5669 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   -3.2943 if cp<=0.0038555560167878927 & pav>=1.0275235295295722\n",
      "   +0.0132 if cp<=0.0009900524746626728\n",
      "   +3.3966 if cp<=-0.02979903668165207\n",
      "--------------\n",
      "   -2.6363 if cp>=-0.08099639117717743\n",
      "   +2.4405 if cp>=-0.014123460277915001\n",
      "   -0.4520 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   +1.8498 if cp<=0.0009900524746626728\n",
      "   -2.5084 if cv>=-0.5931488871574402\n",
      "Run episode 284 with rewards 13.0\n",
      "============ 285 ===========\n",
      "13 actions [0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8142 if cp>=0.0023463560268283104\n",
      "   +0.4457 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   -0.0523 if cp<=0.0038555560167878927 & pav>=1.0275235295295722\n",
      "   +3.8028 if cp<=-0.02979903668165207\n",
      "   -2.9574 if cv<=-0.5515098571777344\n",
      "--------------\n",
      "   +0.1989 if cp>=-0.08099639117717743\n",
      "   +0.1264 if cp>=-0.014123460277915001\n",
      "   -3.2944 if cp<=0.0009900524746626728\n",
      "   -2.5828 if cv>=-0.5931488871574402\n",
      "   +3.4454 if cp>=-0.03523021936416625 & cv<=-0.5515098571777344\n",
      "Run episode 285 with rewards 13.0\n",
      "============ 286 ===========\n",
      "17 actions [1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1]\n",
      "   +1.7938 if cp>=0.0023463560268283104\n",
      "   -1.9306 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   +2.6982 if cp<=-0.02979903668165207\n",
      "   -2.4035 if cv<=-0.5515098571777344\n",
      "   +0.0297 if cp<=0.0034468579106032952 & cp>=-0.039940269291400904 & cv<=-0.3623745501041412 & cv>=-0.5185580074787138\n",
      "--------------\n",
      "   -2.5523 if cp>=-0.08099639117717743\n",
      "   +1.2225 if cp<=0.0009900524746626728\n",
      "   -0.9116 if cv>=-0.5931488871574402\n",
      "   +2.6161 if cp>=-0.03523021936416625 & cv<=-0.5515098571777344\n",
      "   +4.3613 if pa>=0.18061141669750214\n",
      "Run episode 286 with rewards 17.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 287 ===========\n",
      "30 actions [1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1]\n",
      "   +1.0915 if cp>=0.0023463560268283104\n",
      "   -3.2801 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   +2.1723 if cp<=-0.02979903668165207\n",
      "   -1.5634 if cv<=-0.5515098571777344\n",
      "   +3.4878 if cv>=0.4282839894294739\n",
      "--------------\n",
      "   -2.5056 if cp>=-0.08099639117717743\n",
      "   +1.6279 if cp<=0.0009900524746626728\n",
      "   +0.0000 if cp>=-0.03523021936416625 & cv<=-0.5515098571777344\n",
      "   -0.5674 if pa>=0.18061141669750214\n",
      "   -3.4986 if cv>=0.4282839894294739\n",
      "Run episode 287 with rewards 30.0\n",
      "============ 288 ===========\n",
      "20 actions [0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0]\n",
      "   -2.5972 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   -0.2992 if cp<=-0.02979903668165207\n",
      "   -0.7518 if cv<=-0.5515098571777344\n",
      "   -3.3666 if cv>=0.4282839894294739\n",
      "   +4.2855 if cv>=0.7767402529716492\n",
      "--------------\n",
      "   -3.8283 if cp>=-0.08099639117717743\n",
      "   +3.3308 if cp<=0.0009900524746626728\n",
      "   +0.0000 if pa>=0.18061141669750214\n",
      "   +2.8035 if cv>=0.4282839894294739\n",
      "   -4.6978 if cv>=0.7767402529716492\n",
      "Run episode 288 with rewards 20.0\n",
      "============ 289 ===========\n",
      "14 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1]\n",
      "   -4.4098 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   -0.7428 if cv<=-0.5515098571777344\n",
      "   +2.0077 if cv>=0.4282839894294739\n",
      "   +0.0000 if cv>=0.7767402529716492\n",
      "   +2.5755 if cp<=0.0011459880159236523 & pa<=0.03864565938711166\n",
      "--------------\n",
      "   -4.3461 if cp>=-0.08099639117717743\n",
      "   +1.2209 if cp<=0.0009900524746626728\n",
      "   -2.0375 if cv>=0.4282839894294739\n",
      "   -0.0000 if cv>=0.7767402529716492\n",
      "   +3.6706 if cp<=0.0011459880159236523 & pa>=0.03864565938711166\n",
      "Run episode 289 with rewards 14.0\n",
      "============ 290 ===========\n",
      "38 actions [1, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1]\n",
      "   -2.4753 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   -0.5200 if cv<=-0.5515098571777344\n",
      "   +0.0000 if cv>=0.4282839894294739\n",
      "   +0.0000 if cp<=0.0011459880159236523 & pa<=0.03864565938711166\n",
      "   +1.9914 if cp<=-0.051288959383964536 & cv>=-0.16756957173347467 & pav<=0.3533070981502533\n",
      "--------------\n",
      "   -3.6236 if cp>=-0.08099639117717743\n",
      "   +2.3720 if cp<=0.0009900524746626728\n",
      "   -0.0000 if cv>=0.4282839894294739\n",
      "   +2.3720 if cp<=0.0011459880159236523 & pa>=0.03864565938711166\n",
      "   -2.6155 if cp<=-0.051288959383964536 & cv>=-0.16756957173347467\n",
      "Run episode 290 with rewards 38.0\n",
      "============ 291 ===========\n",
      "40 actions [1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0]\n",
      "   -1.2013 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   -4.6052 if cv<=-0.5515098571777344\n",
      "   -1.2013 if cp<=0.0011459880159236523 & pa<=0.03864565938711166\n",
      "   -0.0000 if cp<=-0.051288959383964536 & cv>=-0.16756957173347467 & pav<=0.3533070981502533\n",
      "   -6.1857 if cp>=0.015538278967142107 & cv>=-0.4311076164245605 & pav>=-0.07366576939821223\n",
      "--------------\n",
      "   -3.3816 if cp>=-0.08099639117717743\n",
      "   +2.1146 if cp<=0.0009900524746626728\n",
      "   +0.0000 if cp<=0.0011459880159236523 & pa>=0.03864565938711166\n",
      "   +0.0000 if cp<=-0.051288959383964536 & cv>=-0.16756957173347467\n",
      "   +5.9800 if cp>=0.015538278967142107 & pa>=-0.19708524346351625 & pav>=-0.07366576939821223\n",
      "Run episode 291 with rewards 40.0\n",
      "============ 292 ===========\n",
      "37 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.6033 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   +0.0000 if cv<=-0.5515098571777344\n",
      "   -1.6033 if cp<=0.0011459880159236523 & pa<=0.03864565938711166\n",
      "   -3.0766 if cp>=0.015538278967142107 & cv>=-0.4311076164245605 & pav>=-0.07366576939821223\n",
      "   -3.2577 if cv<=0.04350157827138901 & pa>=-0.03408206403255463 & pav<=-0.07486550956964493\n",
      "--------------\n",
      "   -3.9154 if cp>=-0.08099639117717743\n",
      "   +3.3608 if cp<=0.0009900524746626728\n",
      "   +0.0000 if cp<=-0.051288959383964536 & cv>=-0.16756957173347467\n",
      "   +3.3264 if cp>=0.015538278967142107 & pa>=-0.19708524346351625 & pav>=-0.07366576939821223\n",
      "   +3.7800 if cv<=0.04350157827138901 & pa>=-0.03408206403255463 & pav<=-0.07486550956964493\n",
      "Run episode 292 with rewards 37.0\n",
      "============ 293 ===========\n",
      "40 actions [1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -4.1131 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   -2.2989 if cp<=0.0011459880159236523 & pa<=0.03864565938711166\n",
      "   -4.1300 if cp>=0.015538278967142107 & cv>=-0.4311076164245605 & pav>=-0.07366576939821223\n",
      "   +0.0000 if cv<=0.04350157827138901 & pa>=-0.03408206403255463 & pav<=-0.07486550956964493\n",
      "   +5.5973 if cp>=0.04282323867082596 & pa<=-0.13602356612682343\n",
      "--------------\n",
      "   -4.1325 if cp>=-0.08099639117717743\n",
      "   +6.0166 if cp<=0.0009900524746626728\n",
      "   +4.5859 if cp>=0.015538278967142107 & pa>=-0.19708524346351625 & pav>=-0.07366576939821223\n",
      "   +0.0000 if cv<=0.04350157827138901 & pa>=-0.03408206403255463 & pav<=-0.07486550956964493\n",
      "   -5.5882 if cp>=0.04282323867082596 & pa<=-0.13602356612682343\n",
      "Run episode 293 with rewards 40.0\n",
      "============ 294 ===========\n",
      "29 actions [1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -1.3727 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   -1.3727 if cp<=0.0011459880159236523 & pa<=0.03864565938711166\n",
      "   -2.0403 if cp>=0.015538278967142107 & cv>=-0.4311076164245605 & pav>=-0.07366576939821223\n",
      "   -0.0000 if cp>=0.04282323867082596 & pa<=-0.13602356612682343\n",
      "   -6.7649 if cp>=0.047200937569141385 & cv<=0.18223719596862792 & cv>=-0.005970613844692703 & pa>=-0.052626480162143704\n",
      "--------------\n",
      "   -4.2233 if cp>=-0.08099639117717743\n",
      "   +2.0400 if cp<=0.0009900524746626728\n",
      "   +2.5792 if cp>=0.015538278967142107 & pa>=-0.19708524346351625 & pav>=-0.07366576939821223\n",
      "   -0.0000 if cp>=0.04282323867082596 & pa<=-0.13602356612682343\n",
      "   +6.8434 if cp>=0.047200937569141385 & cv<=0.18223719596862792 & cv>=-0.005970613844692703 & pa>=-0.052626480162143704\n",
      "Run episode 294 with rewards 29.0\n",
      "============ 295 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -3.0413 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   -3.0413 if cp<=0.0011459880159236523 & pa<=0.03864565938711166\n",
      "   -5.1240 if cp>=0.015538278967142107 & cv>=-0.4311076164245605 & pav>=-0.07366576939821223\n",
      "   -0.0000 if cp>=0.047200937569141385 & cv<=0.18223719596862792 & cv>=-0.005970613844692703 & pa>=-0.052626480162143704\n",
      "   +6.3395 if pa>=-0.017351703718304634\n",
      "--------------\n",
      "   -3.6760 if cp>=-0.08099639117717743\n",
      "   +4.6687 if cp<=0.0009900524746626728\n",
      "   +5.1170 if cp>=0.015538278967142107 & pa>=-0.19708524346351625 & pav>=-0.07366576939821223\n",
      "   -0.0000 if cp>=0.047200937569141385 & cv<=0.18223719596862792 & cv>=-0.005970613844692703 & pa>=-0.052626480162143704\n",
      "   -6.2021 if pa>=-0.017351703718304634\n",
      "Run episode 295 with rewards 9.0\n",
      "============ 296 ===========\n",
      "35 actions [1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +1.1646 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   +0.8639 if cp<=0.0011459880159236523 & pa<=0.03864565938711166\n",
      "   -0.0000 if cp>=0.015538278967142107 & cv>=-0.4311076164245605 & pav>=-0.07366576939821223\n",
      "   -3.2742 if pa>=-0.017351703718304634\n",
      "   -4.8120 if pa>=0.16187560558319092\n",
      "--------------\n",
      "   -0.9423 if cp>=-0.08099639117717743\n",
      "   -0.8802 if cp<=0.0009900524746626728\n",
      "   -0.0000 if cp>=0.015538278967142107 & pa>=-0.19708524346351625 & pav>=-0.07366576939821223\n",
      "   -0.9409 if pa>=-0.017351703718304634\n",
      "   -0.9250 if cp>=-0.033666057512164116\n",
      "Run episode 296 with rewards 35.0\n",
      "============ 297 ===========\n",
      "22 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1]\n",
      "   +0.8109 if cp<=0.000398847181350007 & cp>=-0.05523159652948379\n",
      "   +0.8110 if cp<=0.0011459880159236523 & pa<=0.03864565938711166\n",
      "   -3.8936 if pa>=-0.017351703718304634\n",
      "   +7.9295 if pa>=0.16187560558319092\n",
      "   +3.9446 if cv>=0.9473289251327515\n",
      "--------------\n",
      "   -0.7822 if cp>=-0.08099639117717743\n",
      "   +1.1904 if cp<=0.0009900524746626728\n",
      "   -0.7136 if pa>=-0.017351703718304634\n",
      "   -0.6153 if cp>=-0.033666057512164116\n",
      "   -4.0060 if cv>=0.9473289251327515\n",
      "Run episode 297 with rewards 22.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 298 ===========\n",
      "57 actions [1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1]\n",
      "   -0.5354 if cp<=0.0011459880159236523 & pa<=0.03864565938711166\n",
      "   -5.3531 if pa>=-0.017351703718304634\n",
      "   +0.0000 if pa>=0.16187560558319092\n",
      "   +1.7972 if cv>=0.9473289251327515\n",
      "   +2.9606 if cp>=0.019229778647422792 & cv<=0.07964958816301085\n",
      "--------------\n",
      "   +0.1570 if cp>=-0.08099639117717743\n",
      "   +1.6387 if cp<=0.0009900524746626728\n",
      "   +0.4249 if pa>=-0.017351703718304634\n",
      "   -2.6641 if cv>=0.9473289251327515\n",
      "   -4.1679 if cp>=0.019229778647422792 & cv<=0.07964958816301085\n",
      "Run episode 298 with rewards 57.0\n",
      "============ 299 ===========\n",
      "32 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0]\n",
      "   -0.0364 if cp<=0.0011459880159236523 & pa<=0.03864565938711166\n",
      "   -4.9349 if pa>=-0.017351703718304634\n",
      "   +0.9040 if cv>=0.9473289251327515\n",
      "   +1.0319 if cp>=0.019229778647422792 & cv<=0.07964958816301085\n",
      "   +1.9785 if cp>=0.023992419615387936\n",
      "--------------\n",
      "   +1.2428 if cp<=0.0009900524746626728\n",
      "   +1.5233 if pa>=-0.017351703718304634\n",
      "   -2.1557 if cv>=0.9473289251327515\n",
      "   -1.7206 if cp>=0.019229778647422792 & cv<=0.07964958816301085\n",
      "   -1.8276 if cp>=0.023992419615387936\n",
      "Run episode 299 with rewards 32.0\n",
      "============ 300 ===========\n",
      "38 actions [1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -2.7341 if pa>=-0.017351703718304634\n",
      "   +1.5026 if cv>=0.9473289251327515\n",
      "   +0.5972 if cp>=0.019229778647422792 & cv<=0.07964958816301085\n",
      "   +5.5211 if cp>=0.023992419615387936\n",
      "   -3.2551 if cp>=0.004421115014702081\n",
      "--------------\n",
      "   +1.0761 if pa>=-0.017351703718304634\n",
      "   -1.5310 if cv>=0.9473289251327515\n",
      "   -0.8547 if cp>=0.019229778647422792 & cv<=0.07964958816301085\n",
      "   -5.4462 if cp>=0.023992419615387936\n",
      "   +3.2589 if cp>=0.004421115014702081\n",
      "Run episode 300 with rewards 38.0\n",
      "============ 301 ===========\n",
      "83 actions [0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1]\n",
      "   -3.9763 if pa>=-0.017351703718304634\n",
      "   -0.0000 if cv>=0.9473289251327515\n",
      "   +3.2905 if cp>=0.023992419615387936\n",
      "   -0.4198 if cp>=0.004421115014702081\n",
      "   +3.2984 if cv>=0.5991621613502502 & pav>=-1.2170824527740478\n",
      "--------------\n",
      "   +2.7055 if pa>=-0.017351703718304634\n",
      "   -0.0000 if cv>=0.9473289251327515\n",
      "   -3.3054 if cp>=0.023992419615387936\n",
      "   +0.4196 if cp>=0.004421115014702081\n",
      "   -3.2984 if cv>=0.5991621613502502 & pav>=-1.2170824527740478\n",
      "Run episode 301 with rewards 83.0\n",
      "============ 302 ===========\n",
      "27 actions [1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -5.3908 if pa>=-0.017351703718304634\n",
      "   +6.4934 if cp>=0.023992419615387936\n",
      "   +0.3271 if cp>=0.004421115014702081\n",
      "   +5.2514 if cv>=0.5991621613502502 & pav>=-1.2170824527740478\n",
      "   -4.3189 if cp>=-0.07237079292535782 & pa<=0.028423225134611145\n",
      "--------------\n",
      "   +4.2709 if pa>=-0.017351703718304634\n",
      "   -6.5497 if cp>=0.023992419615387936\n",
      "   -0.3352 if cp>=0.004421115014702081\n",
      "   -5.3992 if cv>=0.5991621613502502 & pav>=-1.2170824527740478\n",
      "   +4.3161 if cp>=-0.07237079292535782 & pa<=0.028423225134611145\n",
      "Run episode 302 with rewards 27.0\n",
      "============ 303 ===========\n",
      "16 actions [1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   -0.0502 if pa>=-0.017351703718304634\n",
      "   +2.4746 if cp>=0.023992419615387936\n",
      "   +1.7792 if cv>=0.5991621613502502 & pav>=-1.2170824527740478\n",
      "   -0.0221 if cp>=-0.07237079292535782 & pa<=0.028423225134611145\n",
      "   +1.2445 if cv>=0.5812965512275696\n",
      "--------------\n",
      "   +0.0174 if pa>=-0.017351703718304634\n",
      "   -2.5044 if cp>=0.023992419615387936\n",
      "   -1.8410 if cv>=0.5991621613502502 & pav>=-1.2170824527740478\n",
      "   -0.0034 if cp>=-0.07237079292535782 & pa<=0.028423225134611145\n",
      "   -1.2765 if cv>=0.5812965512275696\n",
      "Run episode 303 with rewards 16.0\n",
      "============ 304 ===========\n",
      "18 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +6.2171 if pa>=-0.017351703718304634\n",
      "   +1.9596 if cp>=0.023992419615387936\n",
      "   +0.0001 if cv>=0.5991621613502502 & pav>=-1.2170824527740478\n",
      "   +0.0001 if cv>=0.5812965512275696\n",
      "   -1.3442 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "--------------\n",
      "   -6.2216 if pa>=-0.017351703718304634\n",
      "   -1.9962 if cp>=0.023992419615387936\n",
      "   -0.0000 if cv>=0.5991621613502502 & pav>=-1.2170824527740478\n",
      "   -0.0000 if cv>=0.5812965512275696\n",
      "   +1.3201 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "Run episode 304 with rewards 18.0\n",
      "============ 305 ===========\n",
      "12 actions [0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   +0.0007 if pa>=-0.017351703718304634\n",
      "   +2.5674 if cp>=0.023992419615387936\n",
      "   +0.3217 if cv>=0.5991621613502502 & pav>=-1.2170824527740478\n",
      "   -2.6731 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "   +2.4203 if cv<=-0.7793434023857115\n",
      "--------------\n",
      "   -0.0008 if pa>=-0.017351703718304634\n",
      "   -2.5934 if cp>=0.023992419615387936\n",
      "   -0.3242 if cv>=0.5991621613502502 & pav>=-1.2170824527740478\n",
      "   +2.6557 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "   -2.4203 if cv<=-0.7793434023857115\n",
      "Run episode 305 with rewards 12.0\n",
      "============ 306 ===========\n",
      "13 actions [0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8792 if cp>=0.023992419615387936\n",
      "   -0.4154 if cv>=0.5991621613502502 & pav>=-1.2170824527740478\n",
      "   -0.6535 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "   +0.0000 if cv<=-0.7793434023857115\n",
      "   +3.2905 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "--------------\n",
      "   -0.8911 if cp>=0.023992419615387936\n",
      "   +0.4118 if cv>=0.5991621613502502 & pav>=-1.2170824527740478\n",
      "   +0.6392 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "   +0.0000 if cv<=-0.7793434023857115\n",
      "   -3.2934 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "Run episode 306 with rewards 13.0\n",
      "============ 307 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0]\n",
      "   +2.7195 if cp>=0.023992419615387936\n",
      "   -0.0000 if cv>=0.5991621613502502 & pav>=-1.2170824527740478\n",
      "   +2.6619 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "   +0.4885 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   -3.0838 if cp>=-0.012137975171208378 & cv<=-0.4209617614746094\n",
      "--------------\n",
      "   -2.7281 if cp>=0.023992419615387936\n",
      "   +0.0000 if cv>=0.5991621613502502 & pav>=-1.2170824527740478\n",
      "   -2.6720 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "   -0.4896 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   +3.0838 if cp>=-0.012137975171208378 & cv<=-0.4209617614746094\n",
      "Run episode 307 with rewards 12.0\n",
      "============ 308 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=0.023992419615387936\n",
      "   +1.7930 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "   -1.5874 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   -0.2747 if cp>=-0.012137975171208378 & cv<=-0.4209617614746094\n",
      "   +3.2565 if cp<=-0.02264549210667609 & cp>=-0.0490520916879177\n",
      "--------------\n",
      "   -0.0000 if cp>=0.023992419615387936\n",
      "   -1.7993 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "   +1.5861 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   +0.2748 if cp>=-0.012137975171208378 & cv<=-0.4209617614746094\n",
      "   -3.2564 if cp<=-0.02264549210667609 & cp>=-0.0490520916879177\n",
      "Run episode 308 with rewards 11.0\n",
      "============ 309 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8033 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "   +3.0177 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   -0.0000 if cp>=-0.012137975171208378 & cv<=-0.4209617614746094\n",
      "   +0.2034 if cp<=-0.02264549210667609 & cp>=-0.0490520916879177\n",
      "   -2.9812 if cp<=-0.08888379484415054\n",
      "--------------\n",
      "   -0.8020 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "   -3.0189 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   +0.0000 if cp>=-0.012137975171208378 & cv<=-0.4209617614746094\n",
      "   -0.2037 if cp<=-0.02264549210667609 & cp>=-0.0490520916879177\n",
      "   +2.9814 if cp<=-0.08888379484415054\n",
      "Run episode 309 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 310 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +0.8884 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "   +0.0529 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   +0.0852 if cp<=-0.02264549210667609 & cp>=-0.0490520916879177\n",
      "   +0.0000 if cp<=-0.08888379484415054\n",
      "   +2.6149 if cp>=-0.01406213957816362\n",
      "--------------\n",
      "   -0.8879 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "   -0.0530 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   -0.0854 if cp<=-0.02264549210667609 & cp>=-0.0490520916879177\n",
      "   -0.0000 if cp<=-0.08888379484415054\n",
      "   -2.6147 if cp>=-0.01406213957816362\n",
      "Run episode 310 with rewards 9.0\n",
      "============ 311 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "   +5.9525 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   +1.7062 if cp<=-0.02264549210667609 & cp>=-0.0490520916879177\n",
      "   +1.5309 if cp>=-0.01406213957816362\n",
      "   +4.2462 if pa>=0.17625679075717926\n",
      "--------------\n",
      "   -0.0000 if cp<=0.022497572004795078 & cv>=-0.40636923909187284\n",
      "   -5.9523 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   -1.7062 if cp<=-0.02264549210667609 & cp>=-0.0490520916879177\n",
      "   -1.5312 if cp>=-0.01406213957816362\n",
      "   -4.2459 if pa>=0.17625679075717926\n",
      "Run episode 311 with rewards 9.0\n",
      "============ 312 ===========\n",
      "20 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0]\n",
      "   +0.0349 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   +0.0078 if cp<=-0.02264549210667609 & cp>=-0.0490520916879177\n",
      "   +1.1096 if cp>=-0.01406213957816362\n",
      "   -0.0000 if pa>=0.17625679075717926\n",
      "   +1.1063 if cp>=-0.006037170439958571\n",
      "--------------\n",
      "   -0.0349 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   -0.0078 if cp<=-0.02264549210667609 & cp>=-0.0490520916879177\n",
      "   -1.1097 if cp>=-0.01406213957816362\n",
      "   +0.0000 if pa>=0.17625679075717926\n",
      "   -1.1064 if cp>=-0.006037170439958571\n",
      "Run episode 312 with rewards 20.0\n",
      "============ 313 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 1, 0, 1, 0, 1]\n",
      "   -0.6750 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   +2.4012 if cp<=-0.02264549210667609 & cp>=-0.0490520916879177\n",
      "   +2.6523 if cp>=-0.01406213957816362\n",
      "   +0.6507 if cp>=-0.006037170439958571\n",
      "   -3.9754 if pav>=1.4021705389022827\n",
      "--------------\n",
      "   +0.6750 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   -2.4012 if cp<=-0.02264549210667609 & cp>=-0.0490520916879177\n",
      "   -2.6522 if cp>=-0.01406213957816362\n",
      "   -0.6514 if cp>=-0.006037170439958571\n",
      "   +3.9753 if pav>=1.4021705389022827\n",
      "Run episode 313 with rewards 10.0\n",
      "============ 314 ===========\n",
      "25 actions [1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +0.3493 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   -0.0011 if cp<=-0.02264549210667609 & cp>=-0.0490520916879177\n",
      "   +0.6935 if cp>=-0.01406213957816362\n",
      "   -1.6601 if pav>=1.4021705389022827\n",
      "   -0.0746 if cv<=-0.9413479566574097\n",
      "--------------\n",
      "   -0.3491 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   +0.0010 if cp<=-0.02264549210667609 & cp>=-0.0490520916879177\n",
      "   -0.6939 if cp>=-0.01406213957816362\n",
      "   +1.6600 if pav>=1.4021705389022827\n",
      "   +0.0746 if cv<=-0.9413479566574097\n",
      "Run episode 314 with rewards 25.0\n",
      "============ 315 ===========\n",
      "30 actions [1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0]\n",
      "   -2.6580 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   +4.9450 if cp>=-0.01406213957816362\n",
      "   -0.7371 if pav>=1.4021705389022827\n",
      "   -2.4197 if cv<=-0.9413479566574097\n",
      "   +4.8948 if cp<=-0.020977539196610447 & cv<=-0.3246115565299984\n",
      "--------------\n",
      "   +2.6581 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   -4.9452 if cp>=-0.01406213957816362\n",
      "   +0.7371 if pav>=1.4021705389022827\n",
      "   +2.4197 if cv<=-0.9413479566574097\n",
      "   -4.8948 if cp<=-0.020977539196610447 & cv<=-0.3246115565299984\n",
      "Run episode 315 with rewards 30.0\n",
      "============ 316 ===========\n",
      "13 actions [0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1]\n",
      "   -1.5950 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   +3.2337 if cp>=-0.01406213957816362\n",
      "   -3.7838 if cv<=-0.9413479566574097\n",
      "   +0.6842 if cp<=-0.020977539196610447 & cv<=-0.3246115565299984\n",
      "   +3.1434 if cp<=-0.017740741744637488 & pa<=0.006769537553191192\n",
      "--------------\n",
      "   +1.5950 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   -3.2339 if cp>=-0.01406213957816362\n",
      "   +3.7837 if cv<=-0.9413479566574097\n",
      "   -0.6841 if cp<=-0.020977539196610447 & cv<=-0.3246115565299984\n",
      "   -3.1434 if cp<=-0.017740741744637488 & pa<=0.006769537553191192\n",
      "Run episode 316 with rewards 13.0\n",
      "============ 317 ===========\n",
      "12 actions [1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0]\n",
      "   -0.8182 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   +0.7083 if cp>=-0.01406213957816362\n",
      "   -2.1978 if cv<=-0.9413479566574097\n",
      "   +0.0000 if cp<=-0.017740741744637488 & pa<=0.006769537553191192\n",
      "   +3.3409 if cp<=-0.03559884876012801 & cp>=-0.05851826518774032\n",
      "--------------\n",
      "   +0.8183 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   -0.7084 if cp>=-0.01406213957816362\n",
      "   +2.1977 if cv<=-0.9413479566574097\n",
      "   -0.0000 if cp<=-0.017740741744637488 & pa<=0.006769537553191192\n",
      "   -3.3409 if cp<=-0.03559884876012801 & cp>=-0.05851826518774032\n",
      "Run episode 317 with rewards 12.0\n",
      "============ 318 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 0, 0, 1]\n",
      "   -0.0000 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   -0.6293 if cp>=-0.01406213957816362\n",
      "   -0.0000 if cv<=-0.9413479566574097\n",
      "   -0.0000 if cp<=-0.03559884876012801 & cp>=-0.05851826518774032\n",
      "   -3.3741 if cp<=0.037648145109415054\n",
      "--------------\n",
      "   +0.0000 if cp<=-0.0060994777828454975 & cv<=0.06378469131886963\n",
      "   +0.6292 if cp>=-0.01406213957816362\n",
      "   +0.0000 if cv<=-0.9413479566574097\n",
      "   +0.0000 if cp<=-0.03559884876012801 & cp>=-0.05851826518774032\n",
      "   +3.3741 if cp<=0.037648145109415054\n",
      "Run episode 318 with rewards 10.0\n",
      "============ 319 ===========\n",
      "42 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   +1.9746 if cp>=-0.01406213957816362\n",
      "   -0.0000 if cv<=-0.9413479566574097\n",
      "   -0.0000 if cp<=-0.03559884876012801 & cp>=-0.05851826518774032\n",
      "   -1.5738 if cp<=0.037648145109415054\n",
      "   +1.8558 if cp>=0.11010701209306717\n",
      "--------------\n",
      "   -1.9747 if cp>=-0.01406213957816362\n",
      "   -0.0000 if cv<=-0.9413479566574097\n",
      "   -0.0000 if cp<=-0.03559884876012801 & cp>=-0.05851826518774032\n",
      "   +1.5738 if cp<=0.037648145109415054\n",
      "   -1.8558 if cp>=0.11010701209306717\n",
      "Run episode 319 with rewards 42.0\n",
      "============ 320 ===========\n",
      "44 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   -1.6317 if cp>=-0.01406213957816362\n",
      "   -0.4233 if cp<=-0.03559884876012801 & cp>=-0.05851826518774032\n",
      "   -1.1905 if cp<=0.037648145109415054\n",
      "   -0.0000 if cp>=0.11010701209306717\n",
      "   +6.6275 if cp>=-0.009362631477415501 & pa<=-0.02657882720232007\n",
      "--------------\n",
      "   +1.6318 if cp>=-0.01406213957816362\n",
      "   +0.4221 if cp<=-0.03559884876012801 & cp>=-0.05851826518774032\n",
      "   +1.1905 if cp<=0.037648145109415054\n",
      "   +0.0000 if cp>=0.11010701209306717\n",
      "   -6.6279 if cp>=-0.009362631477415501 & pa<=-0.02657882720232007\n",
      "Run episode 320 with rewards 44.0\n",
      "============ 321 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -0.2356 if cp>=-0.01406213957816362\n",
      "   -0.0000 if cp<=-0.03559884876012801 & cp>=-0.05851826518774032\n",
      "   -3.6781 if cp<=0.037648145109415054\n",
      "   +3.5662 if cp>=-0.009362631477415501 & pa<=-0.02657882720232007\n",
      "   -1.6166 if cp>=0.0413067735731602\n",
      "--------------\n",
      "   +0.2355 if cp>=-0.01406213957816362\n",
      "   -0.0000 if cp<=-0.03559884876012801 & cp>=-0.05851826518774032\n",
      "   +3.6782 if cp<=0.037648145109415054\n",
      "   -3.5665 if cp>=-0.009362631477415501 & pa<=-0.02657882720232007\n",
      "   +1.6166 if cp>=0.0413067735731602\n",
      "Run episode 321 with rewards 9.0\n",
      "============ 322 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.2136 if cp>=-0.01406213957816362\n",
      "   -0.9489 if cp<=0.037648145109415054\n",
      "   -2.2136 if cp>=-0.009362631477415501 & pa<=-0.02657882720232007\n",
      "   -2.1738 if cp>=0.0413067735731602\n",
      "   -2.5549 if cp>=0.07005753368139267\n",
      "--------------\n",
      "   +2.2135 if cp>=-0.01406213957816362\n",
      "   +0.9490 if cp<=0.037648145109415054\n",
      "   +2.2135 if cp>=-0.009362631477415501 & pa<=-0.02657882720232007\n",
      "   +2.1738 if cp>=0.0413067735731602\n",
      "   +2.5549 if cp>=0.07005753368139267\n",
      "Run episode 322 with rewards 9.0\n",
      "============ 323 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1]\n",
      "   -0.9000 if cp>=-0.01406213957816362\n",
      "   -0.0840 if cp>=-0.009362631477415501 & pa<=-0.02657882720232007\n",
      "   -0.0020 if cp>=0.0413067735731602\n",
      "   +0.0001 if cp>=0.07005753368139267\n",
      "   -0.4962 if cp<=0.003137091267853976\n",
      "--------------\n",
      "   +0.9000 if cp>=-0.01406213957816362\n",
      "   +0.0840 if cp>=-0.009362631477415501 & pa<=-0.02657882720232007\n",
      "   +0.0020 if cp>=0.0413067735731602\n",
      "   -0.0001 if cp>=0.07005753368139267\n",
      "   +0.4962 if cp<=0.003137091267853976\n",
      "Run episode 323 with rewards 11.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 324 ===========\n",
      "27 actions [1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1]\n",
      "   -2.1078 if cp>=-0.01406213957816362\n",
      "   -0.7886 if cp>=-0.009362631477415501 & pa<=-0.02657882720232007\n",
      "   +3.7842 if cp>=0.0413067735731602\n",
      "   +0.0000 if cp<=0.003137091267853976\n",
      "   -2.1989 if cp<=0.10423237830400467 & pa<=-0.052472516894340515\n",
      "--------------\n",
      "   +2.1078 if cp>=-0.01406213957816362\n",
      "   +0.7886 if cp>=-0.009362631477415501 & pa<=-0.02657882720232007\n",
      "   -3.7842 if cp>=0.0413067735731602\n",
      "   +0.0000 if cp<=0.003137091267853976\n",
      "   +2.1989 if cp<=0.10423237830400467 & pa<=-0.052472516894340515\n",
      "Run episode 324 with rewards 27.0\n",
      "============ 325 ===========\n",
      "17 actions [0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1]\n",
      "   -2.2301 if cp>=-0.01406213957816362\n",
      "   +0.4765 if cp>=-0.009362631477415501 & pa<=-0.02657882720232007\n",
      "   +3.9330 if cp>=0.0413067735731602\n",
      "   -3.2729 if cp<=0.10423237830400467 & pa<=-0.052472516894340515\n",
      "   -5.6289 if cp<=0.05581433027982712 & cp>=0.04346144050359726 & cv<=-0.1877691149711609\n",
      "--------------\n",
      "   +2.2301 if cp>=-0.01406213957816362\n",
      "   -0.4765 if cp>=-0.009362631477415501 & pa<=-0.02657882720232007\n",
      "   -3.9330 if cp>=0.0413067735731602\n",
      "   +3.2729 if cp<=0.10423237830400467 & pa<=-0.052472516894340515\n",
      "   +5.6288 if cp<=0.05581433027982712 & cp>=0.04346144050359726 & cv<=-0.1877691149711609\n",
      "Run episode 325 with rewards 17.0\n",
      "============ 326 ===========\n",
      "13 actions [0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1]\n",
      "   +0.0000 if cp>=-0.01406213957816362\n",
      "   +0.0000 if cp>=0.0413067735731602\n",
      "   +0.0000 if cp<=0.10423237830400467 & pa<=-0.052472516894340515\n",
      "   +0.0000 if cp<=0.05581433027982712 & cp>=0.04346144050359726 & cv<=-0.1877691149711609\n",
      "   +3.5601 if cp>=-0.08105124086141585 & cv>=-0.1833589106798172\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.01406213957816362\n",
      "   -0.0000 if cp>=0.0413067735731602\n",
      "   -0.0000 if cp<=0.10423237830400467 & pa<=-0.052472516894340515\n",
      "   -0.0000 if cp<=0.05581433027982712 & cp>=0.04346144050359726 & cv<=-0.1877691149711609\n",
      "   -3.5601 if cp>=-0.08105124086141585 & cv>=-0.1833589106798172\n",
      "Run episode 326 with rewards 13.0\n",
      "============ 327 ===========\n",
      "17 actions [0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +0.0000 if cp>=0.0413067735731602\n",
      "   +0.0000 if cp<=0.10423237830400467 & pa<=-0.052472516894340515\n",
      "   +0.0000 if cp<=0.05581433027982712 & cp>=0.04346144050359726 & cv<=-0.1877691149711609\n",
      "   +1.1195 if cp>=-0.08105124086141585 & cv>=-0.1833589106798172\n",
      "   -2.8892 if cp>=-0.008618047088384621 & cv<=-0.16477275490760804\n",
      "--------------\n",
      "   +0.0000 if cp>=0.0413067735731602\n",
      "   +0.0000 if cp<=0.10423237830400467 & pa<=-0.052472516894340515\n",
      "   +0.0000 if cp<=0.05581433027982712 & cp>=0.04346144050359726 & cv<=-0.1877691149711609\n",
      "   -1.1195 if cp>=-0.08105124086141585 & cv>=-0.1833589106798172\n",
      "   +2.8892 if cp>=-0.008618047088384621 & cv<=-0.16477275490760804\n",
      "Run episode 327 with rewards 17.0\n",
      "============ 328 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1]\n",
      "   -0.0000 if cp>=0.0413067735731602\n",
      "   -0.0000 if cp<=0.05581433027982712 & cp>=0.04346144050359726 & cv<=-0.1877691149711609\n",
      "   +2.7750 if cp>=-0.08105124086141585 & cv>=-0.1833589106798172\n",
      "   -0.0000 if cp>=-0.008618047088384621 & cv<=-0.16477275490760804\n",
      "   +2.7486 if cp>=-0.008789596147835255\n",
      "--------------\n",
      "   -0.0000 if cp>=0.0413067735731602\n",
      "   -0.0000 if cp<=0.05581433027982712 & cp>=0.04346144050359726 & cv<=-0.1877691149711609\n",
      "   -2.7750 if cp>=-0.08105124086141585 & cv>=-0.1833589106798172\n",
      "   -0.0000 if cp>=-0.008618047088384621 & cv<=-0.16477275490760804\n",
      "   -2.7486 if cp>=-0.008789596147835255\n",
      "Run episode 328 with rewards 12.0\n",
      "============ 329 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   +0.3496 if cp>=0.0413067735731602\n",
      "   +0.0710 if cp>=-0.08105124086141585 & cv>=-0.1833589106798172\n",
      "   +1.3680 if cp>=-0.008618047088384621 & cv<=-0.16477275490760804\n",
      "   +1.4390 if cp>=-0.008789596147835255\n",
      "   -1.2036 if cp>=-0.0342368297278881\n",
      "--------------\n",
      "   -0.3496 if cp>=0.0413067735731602\n",
      "   -0.0710 if cp>=-0.08105124086141585 & cv>=-0.1833589106798172\n",
      "   -1.3680 if cp>=-0.008618047088384621 & cv<=-0.16477275490760804\n",
      "   -1.4390 if cp>=-0.008789596147835255\n",
      "   +1.2036 if cp>=-0.0342368297278881\n",
      "Run episode 329 with rewards 9.0\n",
      "============ 330 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 1, 0, 0]\n",
      "   -0.0000 if cp>=0.0413067735731602\n",
      "   +0.5388 if cp>=-0.008618047088384621 & cv<=-0.16477275490760804\n",
      "   +1.7221 if cp>=-0.008789596147835255\n",
      "   +0.9926 if cp>=-0.0342368297278881\n",
      "   +3.1616 if pa>=0.1959518939256668\n",
      "--------------\n",
      "   -0.0000 if cp>=0.0413067735731602\n",
      "   -0.5388 if cp>=-0.008618047088384621 & cv<=-0.16477275490760804\n",
      "   -1.7221 if cp>=-0.008789596147835255\n",
      "   -0.9926 if cp>=-0.0342368297278881\n",
      "   -3.1616 if pa>=0.1959518939256668\n",
      "Run episode 330 with rewards 10.0\n",
      "============ 331 ===========\n",
      "40 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.1094 if cp>=-0.008618047088384621 & cv<=-0.16477275490760804\n",
      "   +0.1785 if cp>=-0.008789596147835255\n",
      "   +3.1250 if cp>=-0.0342368297278881\n",
      "   -5.8499 if pa>=0.1959518939256668\n",
      "   -4.4617 if cp<=-0.004689938668161629\n",
      "--------------\n",
      "   -0.1094 if cp>=-0.008618047088384621 & cv<=-0.16477275490760804\n",
      "   -0.1785 if cp>=-0.008789596147835255\n",
      "   -3.1250 if cp>=-0.0342368297278881\n",
      "   +5.8499 if pa>=0.1959518939256668\n",
      "   +4.4617 if cp<=-0.004689938668161629\n",
      "Run episode 331 with rewards 40.0\n",
      "============ 332 ===========\n",
      "29 actions [0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +6.3263 if cp>=-0.008789596147835255\n",
      "   +1.4780 if cp>=-0.0342368297278881\n",
      "   +8.4386 if pa>=0.1959518939256668\n",
      "   -4.2004 if cp<=-0.004689938668161629\n",
      "   +1.0000 if cp<=0.05595003142952921 & pa>=0.0813248246908188\n",
      "--------------\n",
      "   -6.1695 if cp>=-0.008789596147835255\n",
      "   -1.9376 if cp>=-0.0342368297278881\n",
      "   -9.3559 if pa>=0.1959518939256668\n",
      "   +3.6595 if cp<=-0.004689938668161629\n",
      "   +0.1132 if cp<=0.05595003142952921 & pa>=0.0813248246908188\n",
      "Run episode 332 with rewards 29.0\n",
      "============ 333 ===========\n",
      "25 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   +0.0556 if cp>=-0.008789596147835255\n",
      "   +0.9783 if cp>=-0.0342368297278881\n",
      "   -0.0000 if pa>=0.1959518939256668\n",
      "   +0.7881 if cp<=-0.004689938668161629\n",
      "   -4.3844 if cp<=-0.019171951711177825\n",
      "--------------\n",
      "   -0.0466 if cp>=-0.008789596147835255\n",
      "   -1.4655 if cp>=-0.0342368297278881\n",
      "   +0.0000 if pa>=0.1959518939256668\n",
      "   -1.2884 if cp<=-0.004689938668161629\n",
      "   +4.3730 if cp<=-0.019171951711177825\n",
      "Run episode 333 with rewards 25.0\n",
      "============ 334 ===========\n",
      "32 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +0.9159 if cp>=-0.008789596147835255\n",
      "   +0.7003 if cp>=-0.0342368297278881\n",
      "   -0.7993 if cp<=-0.004689938668161629\n",
      "   -2.3925 if cp<=-0.019171951711177825\n",
      "   +2.3589 if cp>=-0.021425632759928696\n",
      "--------------\n",
      "   -0.8981 if cp>=-0.008789596147835255\n",
      "   -1.0507 if cp>=-0.0342368297278881\n",
      "   +0.4407 if cp<=-0.004689938668161629\n",
      "   +2.2230 if cp<=-0.019171951711177825\n",
      "   -2.5243 if cp>=-0.021425632759928696\n",
      "Run episode 334 with rewards 32.0\n",
      "============ 335 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +0.1565 if cp>=-0.008789596147835255\n",
      "   -0.7274 if cp<=-0.004689938668161629\n",
      "   -0.9486 if cp<=-0.019171951711177825\n",
      "   +4.7541 if cp>=-0.021425632759928696\n",
      "   -0.6682 if \n",
      "--------------\n",
      "   -0.1125 if cp>=-0.008789596147835255\n",
      "   -0.5766 if cp>=-0.0342368297278881\n",
      "   +1.1707 if cp<=-0.019171951711177825\n",
      "   -4.1684 if cp>=-0.021425632759928696\n",
      "   +1.5605 if cp<=-0.036515137553215025\n",
      "Run episode 335 with rewards 9.0\n",
      "============ 336 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +5.4338 if cp<=-0.004689938668161629\n",
      "   +5.3300 if cp<=-0.019171951711177825\n",
      "   -2.2230 if cp>=-0.021425632759928696\n",
      "   +5.4682 if \n",
      "   +1.0000 if cp<=0.022835540771484385\n",
      "--------------\n",
      "   -0.4730 if cp>=-0.0342368297278881\n",
      "   -7.9367 if cp<=-0.019171951711177825\n",
      "   -0.5125 if cp>=-0.021425632759928696\n",
      "   -7.9540 if cp<=-0.036515137553215025\n",
      "   -1.4766 if pa>=0.19643020629882812\n",
      "Run episode 336 with rewards 10.0\n",
      "============ 337 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 0, 0]\n",
      "   +0.0819 if cp<=-0.004689938668161629\n",
      "   +0.0002 if cp<=-0.019171951711177825\n",
      "   +1.5196 if cp>=-0.021425632759928696\n",
      "   +1.5198 if \n",
      "   +0.5869 if cp<=0.028962263464927675 & cp>=-0.012997983675450086\n",
      "--------------\n",
      "   +0.0000 if cp<=-0.019171951711177825\n",
      "   -0.9599 if cp>=-0.021425632759928696\n",
      "   +0.0000 if cp<=-0.036515137553215025\n",
      "   +0.0000 if pa>=0.19643020629882812\n",
      "   -0.4841 if cp>=0.028962263464927675\n",
      "Run episode 337 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 338 ===========\n",
      "27 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -4.4905 if cp<=-0.004689938668161629\n",
      "   +4.2248 if cp>=-0.021425632759928696\n",
      "   -2.2605 if \n",
      "   +2.1418 if cp<=0.028962263464927675 & cp>=-0.012997983675450086\n",
      "   -5.4048 if pa>=0.19310349225997925\n",
      "--------------\n",
      "   +6.4944 if cp<=-0.019171951711177825\n",
      "   -0.9352 if cp>=-0.021425632759928696\n",
      "   +6.4847 if cp<=-0.036515137553215025\n",
      "   -0.6386 if cp>=0.028962263464927675\n",
      "   +2.5496 if pa>=0.19310349225997925\n",
      "Run episode 338 with rewards 27.0\n",
      "============ 339 ===========\n",
      "21 actions [0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   -0.2603 if cp<=-0.004689938668161629\n",
      "   +2.6421 if cp>=-0.021425632759928696\n",
      "   +1.7508 if \n",
      "   +0.0000 if pa>=0.19310349225997925\n",
      "   -0.4450 if cp<=-0.02724060416221618\n",
      "--------------\n",
      "   +0.3595 if cp<=-0.019171951711177825\n",
      "   -3.6811 if cp>=-0.021425632759928696\n",
      "   +0.2205 if cp<=-0.036515137553215025\n",
      "   +0.0000 if pa>=0.19310349225997925\n",
      "   -2.1837 if cp>=-0.02724060416221618 & pav<=-1.1382731080055237\n",
      "Run episode 339 with rewards 21.0\n",
      "============ 340 ===========\n",
      "11 actions [0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0]\n",
      "   +2.4540 if cp<=-0.004689938668161629\n",
      "   +0.2704 if cp>=-0.021425632759928696\n",
      "   +2.4540 if \n",
      "   -3.5491 if cp<=-0.02724060416221618\n",
      "   -2.4378 if cp>=-0.0591566301882267\n",
      "--------------\n",
      "   +0.9657 if cp<=-0.019171951711177825\n",
      "   -1.3091 if cp>=-0.021425632759928696\n",
      "   -3.6559 if cp<=-0.036515137553215025\n",
      "   -0.0000 if cp>=-0.02724060416221618 & pav<=-1.1382731080055237\n",
      "   +5.5265 if cp<=-0.04726061224937439 & cv<=-0.0514153353869915 & pa<=0.06377492845058441\n",
      "Run episode 340 with rewards 11.0\n",
      "============ 341 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.0018 if cp<=-0.004689938668161629\n",
      "   -2.2747 if \n",
      "   -4.3995 if cp<=-0.02724060416221618\n",
      "   +4.2290 if cp>=-0.0591566301882267\n",
      "   -4.8294 if cp>=0.0019177517388015985\n",
      "--------------\n",
      "   +2.6793 if cp<=-0.019171951711177825\n",
      "   -2.4277 if cp>=-0.021425632759928696\n",
      "   +3.2983 if cp<=-0.036515137553215025\n",
      "   -0.0000 if cp<=-0.04726061224937439 & cv<=-0.0514153353869915 & pa<=0.06377492845058441\n",
      "   +4.3936 if cp>=0.0019177517388015985\n",
      "Run episode 341 with rewards 9.0\n",
      "============ 342 ===========\n",
      "12 actions [1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.9048 if \n",
      "   -0.0000 if cp<=-0.02724060416221618\n",
      "   -0.9048 if cp>=-0.0591566301882267\n",
      "   -0.9048 if cp>=0.0019177517388015985\n",
      "   -0.0583 if cp>=0.04631521627306939\n",
      "--------------\n",
      "   +0.0000 if cp<=-0.019171951711177825\n",
      "   +0.8493 if cp>=-0.021425632759928696\n",
      "   +0.0000 if cp<=-0.036515137553215025\n",
      "   +0.8493 if cp>=0.0019177517388015985\n",
      "   +0.3660 if cp>=0.00978351142257452\n",
      "Run episode 342 with rewards 12.0\n",
      "============ 343 ===========\n",
      "15 actions [1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1]\n",
      "   -0.0673 if \n",
      "   -0.0673 if cp>=-0.0591566301882267\n",
      "   -0.0673 if cp>=0.0019177517388015985\n",
      "   +0.8943 if cp>=0.04631521627306939\n",
      "   -1.9418 if cp<=0.049164246022701266\n",
      "--------------\n",
      "   -0.6939 if cp>=-0.021425632759928696\n",
      "   -0.0000 if cp<=-0.036515137553215025\n",
      "   -0.6939 if cp>=0.0019177517388015985\n",
      "   -0.6939 if cp>=0.00978351142257452\n",
      "   +3.0981 if cv<=0.6285897493362428\n",
      "Run episode 343 with rewards 15.0\n",
      "============ 344 ===========\n",
      "17 actions [1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0]\n",
      "   -0.0971 if \n",
      "   -0.0971 if cp>=-0.0591566301882267\n",
      "   +1.1184 if cp>=0.04631521627306939\n",
      "   -1.2155 if cp<=0.049164246022701266\n",
      "   -0.9992 if cv>=0.6292034149169922\n",
      "--------------\n",
      "   +1.1810 if cp>=-0.021425632759928696\n",
      "   -0.4728 if cp>=0.0019177517388015985\n",
      "   -1.1581 if cp>=0.00978351142257452\n",
      "   +1.0140 if cv<=0.6285897493362428\n",
      "   -3.5528 if cv>=1.0150601863861084\n",
      "Run episode 344 with rewards 17.0\n",
      "============ 345 ===========\n",
      "10 actions [1, 1, 1, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -1.4103 if cp>=-0.0591566301882267\n",
      "   +0.3119 if cp>=0.04631521627306939\n",
      "   -2.3919 if cp<=0.049164246022701266\n",
      "   +3.4897 if cv>=0.6292034149169922\n",
      "   +4.4178 if cp<=0.12645374536514284 & cp>=0.09458535015583039\n",
      "--------------\n",
      "   -1.1529 if cp>=-0.021425632759928696\n",
      "   -1.1529 if cp>=0.00978351142257452\n",
      "   +5.1918 if cv<=0.6285897493362428\n",
      "   +0.0001 if cv>=1.0150601863861084\n",
      "   -2.3183 if cp>=0.09458535015583039\n",
      "Run episode 345 with rewards 10.0\n",
      "============ 346 ===========\n",
      "15 actions [1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0]\n",
      "   -0.3023 if cp>=-0.0591566301882267\n",
      "   -0.2202 if cp<=0.049164246022701266\n",
      "   +1.1506 if cv>=0.6292034149169922\n",
      "   -0.0000 if cp<=0.12645374536514284 & cp>=0.09458535015583039\n",
      "   +0.0414 if cv>=0.7965694069862366\n",
      "--------------\n",
      "   -0.4946 if cp>=-0.021425632759928696\n",
      "   -1.3094 if cp>=0.00978351142257452\n",
      "   +1.4189 if cv<=0.6285897493362428\n",
      "   -0.0000 if cp>=0.09458535015583039\n",
      "   -1.8674 if cv<=0.7911309361457824 & cv>=0.6014715194702148\n",
      "Run episode 346 with rewards 15.0\n",
      "============ 347 ===========\n",
      "17 actions [1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0]\n",
      "   +0.6155 if cp>=-0.0591566301882267\n",
      "   +1.3081 if cp<=0.049164246022701266\n",
      "   -0.0000 if cv>=0.6292034149169922\n",
      "   -0.0000 if cv>=0.7965694069862366\n",
      "   -3.4339 if cp<=0.048826619982719435 & cv<=0.4210139513015747\n",
      "--------------\n",
      "   -0.3187 if cp>=-0.021425632759928696\n",
      "   -2.7968 if cp>=0.00978351142257452\n",
      "   +3.6075 if cv<=0.6285897493362428\n",
      "   -5.1473 if cv<=0.7911309361457824 & cv>=0.6014715194702148\n",
      "   -1.3262 if cp<=0.028522142767906208 & pav>=-0.9341952443122864\n",
      "Run episode 347 with rewards 17.0\n",
      "============ 348 ===========\n",
      "11 actions [1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.7203 if cp>=-0.0591566301882267\n",
      "   -2.0991 if cp<=0.049164246022701266\n",
      "   +0.0027 if cv>=0.6292034149169922\n",
      "   -1.8143 if cp<=0.048826619982719435 & cv<=0.4210139513015747\n",
      "   +2.9148 if cp<=0.03634631410241127 & cv>=0.21344271302223208\n",
      "--------------\n",
      "   -3.5009 if cp>=0.00978351142257452\n",
      "   +4.9505 if cv<=0.6285897493362428\n",
      "   -0.0242 if cv<=0.7911309361457824 & cv>=0.6014715194702148\n",
      "   -3.7345 if cp<=0.028522142767906208 & pav>=-0.9341952443122864\n",
      "   -2.7419 if cp<=0.07386630326509477 & cv>=0.5625986218452453\n",
      "Run episode 348 with rewards 11.0\n",
      "============ 349 ===========\n",
      "11 actions [1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1]\n",
      "   -1.5808 if cp>=-0.0591566301882267\n",
      "   -0.9491 if cp<=0.049164246022701266\n",
      "   -0.7198 if cp<=0.048826619982719435 & cv<=0.4210139513015747\n",
      "   -0.1852 if cp<=0.03634631410241127 & cv>=0.21344271302223208\n",
      "   +0.9565 if cp<=0.10003259778022766 & pav<=-1.1191586256027222\n",
      "--------------\n",
      "   -0.7545 if cp>=0.00978351142257452\n",
      "   +3.7087 if cv<=0.6285897493362428\n",
      "   -0.0000 if cp<=0.028522142767906208 & pav>=-0.9341952443122864\n",
      "   -2.4360 if cp<=0.07386630326509477 & cv>=0.5625986218452453\n",
      "   +0.8208 if cp>=0.1256619095802307\n",
      "Run episode 349 with rewards 11.0\n",
      "============ 350 ===========\n",
      "14 actions [1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1]\n",
      "   -0.8883 if cp>=-0.0591566301882267\n",
      "   -3.1928 if cp<=0.049164246022701266\n",
      "   -0.0371 if cp<=0.048826619982719435 & cv<=0.4210139513015747\n",
      "   +3.6706 if cp<=0.10003259778022766 & pav<=-1.1191586256027222\n",
      "   +0.4514 if pa>=-0.07962553203105925\n",
      "--------------\n",
      "   -0.9127 if cp>=0.00978351142257452\n",
      "   +1.5946 if cv<=0.6285897493362428\n",
      "   -0.1922 if cp<=0.07386630326509477 & cv>=0.5625986218452453\n",
      "   -0.0000 if cp>=0.1256619095802307\n",
      "   -2.9810 if cp<=0.06985729187726974 & cv>=0.6330425143241882\n",
      "Run episode 350 with rewards 14.0\n",
      "============ 351 ===========\n",
      "12 actions [1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +0.5243 if cp>=-0.0591566301882267\n",
      "   -2.3004 if cp<=0.049164246022701266\n",
      "   +2.1842 if cp<=0.10003259778022766 & pav<=-1.1191586256027222\n",
      "   -0.7700 if pa>=-0.07962553203105925\n",
      "   -1.4506 if cp>=0.03896013796329499 & cv<=0.6070688605308533\n",
      "--------------\n",
      "   -0.9194 if cp>=0.00978351142257452\n",
      "   +1.2559 if cv<=0.6285897493362428\n",
      "   -2.1320 if cp<=0.07386630326509477 & cv>=0.5625986218452453\n",
      "   -1.3117 if cp<=0.06985729187726974 & cv>=0.6330425143241882\n",
      "   +1.4131 if cp>=-0.03041258379817009 & cv<=0.6070688605308533\n",
      "Run episode 351 with rewards 12.0\n",
      "============ 352 ===========\n",
      "16 actions [1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1]\n",
      "   +0.8438 if cp<=0.049164246022701266\n",
      "   -0.0000 if cp<=0.10003259778022766 & pav<=-1.1191586256027222\n",
      "   -0.3413 if pa>=-0.07962553203105925\n",
      "   -1.1889 if cp>=0.03896013796329499 & cv<=0.6070688605308533\n",
      "   -2.5377 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "--------------\n",
      "   -0.3512 if cv<=0.6285897493362428\n",
      "   -4.1501 if cp<=0.07386630326509477 & cv>=0.5625986218452453\n",
      "   -0.0000 if cp<=0.06985729187726974 & cv>=0.6330425143241882\n",
      "   +2.3667 if cp>=-0.03041258379817009 & cv<=0.6070688605308533\n",
      "   -1.9177 if cp>=0.11693211644887924\n",
      "Run episode 352 with rewards 16.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 353 ===========\n",
      "12 actions [1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0]\n",
      "   +0.7755 if cp<=0.049164246022701266\n",
      "   +0.9545 if pa>=-0.07962553203105925\n",
      "   -3.1943 if cp>=0.03896013796329499 & cv<=0.6070688605308533\n",
      "   -2.4611 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   -3.5818 if cp<=0.033396828919649145 & cv<=0.5623753070831299\n",
      "--------------\n",
      "   -0.8763 if cv<=0.6285897493362428\n",
      "   -3.2333 if cp<=0.07386630326509477 & cv>=0.5625986218452453\n",
      "   +3.7514 if cp>=-0.03041258379817009 & cv<=0.6070688605308533\n",
      "   +0.0000 if cp>=0.11693211644887924\n",
      "   +2.6876 if cp<=-0.037992581725120544 & cv<=0.5623753070831299\n",
      "Run episode 353 with rewards 12.0\n",
      "============ 354 ===========\n",
      "10 actions [1, 1, 1, 0, 1, 1, 1, 1, 0, 1]\n",
      "   +0.1256 if pa>=-0.07962553203105925\n",
      "   -2.7265 if cp>=0.03896013796329499 & cv<=0.6070688605308533\n",
      "   -1.9026 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   -1.1229 if cp<=0.033396828919649145 & cv<=0.5623753070831299\n",
      "   +1.3701 if cp<=0.03899315372109413\n",
      "--------------\n",
      "   +1.2402 if cv<=0.6285897493362428\n",
      "   -1.7975 if cp<=0.07386630326509477 & cv>=0.5625986218452453\n",
      "   +1.2402 if cp>=-0.03041258379817009 & cv<=0.6070688605308533\n",
      "   -0.0000 if cp<=-0.037992581725120544 & cv<=0.5623753070831299\n",
      "   -0.8860 if cp<=0.03899315372109413\n",
      "Run episode 354 with rewards 10.0\n",
      "============ 355 ===========\n",
      "12 actions [1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0]\n",
      "   -1.4474 if cp>=0.03896013796329499 & cv<=0.6070688605308533\n",
      "   -1.7426 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   -1.7426 if cp<=0.033396828919649145 & cv<=0.5623753070831299\n",
      "   +1.3968 if cp<=0.03899315372109413\n",
      "   -0.0507 if cp<=0.055652286112308505\n",
      "--------------\n",
      "   -0.1032 if cv<=0.6285897493362428\n",
      "   -1.3712 if cp<=0.07386630326509477 & cv>=0.5625986218452453\n",
      "   -0.1032 if cp>=-0.03041258379817009 & cv<=0.6070688605308533\n",
      "   -0.5753 if cp<=0.03899315372109413\n",
      "   +2.3429 if cp<=0.08188644200563432\n",
      "Run episode 355 with rewards 12.0\n",
      "============ 356 ===========\n",
      "10 actions [1, 1, 1, 0, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp>=0.03896013796329499 & cv<=0.6070688605308533\n",
      "   -2.4791 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   -2.4791 if cp<=0.033396828919649145 & cv<=0.5623753070831299\n",
      "   +0.1584 if cp<=0.03899315372109413\n",
      "   +2.4268 if cp<=0.025460057705640797\n",
      "--------------\n",
      "   -1.9564 if cp<=0.07386630326509477 & cv>=0.5625986218452453\n",
      "   +0.7579 if cp>=-0.03041258379817009 & cv<=0.6070688605308533\n",
      "   -0.8787 if cp<=0.03899315372109413\n",
      "   +2.0553 if cp<=0.08188644200563432\n",
      "   +3.7410 if cp>=0.025460057705640797\n",
      "Run episode 356 with rewards 10.0\n",
      "============ 357 ===========\n",
      "13 actions [1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7342 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   -2.1639 if cp<=0.033396828919649145 & cv<=0.5623753070831299\n",
      "   -0.0746 if cp<=0.03899315372109413\n",
      "   +0.6403 if cp<=0.025460057705640797\n",
      "   +0.3314 if cp<=0.06110185235738755 & cp>=-0.003091528033837676\n",
      "--------------\n",
      "   -0.0936 if cp<=0.07386630326509477 & cv>=0.5625986218452453\n",
      "   +0.8059 if cp<=0.03899315372109413\n",
      "   +2.1465 if cp<=0.08188644200563432\n",
      "   -0.0677 if cp>=0.025460057705640797\n",
      "   -2.2215 if cp<=0.014091908931732178 & cv>=0.551794171333313\n",
      "Run episode 357 with rewards 13.0\n",
      "============ 358 ===========\n",
      "13 actions [1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0]\n",
      "   -1.2192 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   -1.2192 if cp<=0.033396828919649145 & cv<=0.5623753070831299\n",
      "   +0.7571 if cp<=0.025460057705640797\n",
      "   -1.8263 if cp<=0.06110185235738755 & cp>=-0.003091528033837676\n",
      "   +2.9228 if cp<=0.028535769879817974 & cv>=0.5649913311004638\n",
      "--------------\n",
      "   +0.3540 if cp<=0.07386630326509477 & cv>=0.5625986218452453\n",
      "   +0.3813 if cp<=0.03899315372109413\n",
      "   +1.7693 if cp<=0.08188644200563432\n",
      "   -3.5005 if cp<=0.014091908931732178 & cv>=0.551794171333313\n",
      "   +3.5067 if cp>=-0.001709474608651357 & cv<=0.5649913311004638\n",
      "Run episode 358 with rewards 13.0\n",
      "============ 359 ===========\n",
      "10 actions [1, 1, 1, 1, 0, 1, 1, 1, 1, 1]\n",
      "   -0.8058 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   -0.8058 if cp<=0.033396828919649145 & cv<=0.5623753070831299\n",
      "   +1.4529 if cp<=0.06110185235738755 & cp>=-0.003091528033837676\n",
      "   +3.7995 if cp<=0.028535769879817974 & cv>=0.5649913311004638\n",
      "   -1.3178 if \n",
      "--------------\n",
      "   -0.5166 if cp<=0.03899315372109413\n",
      "   +0.6285 if cp<=0.08188644200563432\n",
      "   -2.2672 if cp<=0.014091908931732178 & cv>=0.551794171333313\n",
      "   +0.1078 if cp>=-0.001709474608651357 & cv<=0.5649913311004638\n",
      "   +1.6724 if cv<=0.5699054718017578\n",
      "Run episode 359 with rewards 10.0\n",
      "============ 360 ===========\n",
      "13 actions [1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -1.2300 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   -1.5486 if cp<=0.06110185235738755 & cp>=-0.003091528033837676\n",
      "   +2.5817 if cp<=0.028535769879817974 & cv>=0.5649913311004638\n",
      "   +0.5818 if \n",
      "   +3.9926 if cp>=0.10487756878137589\n",
      "--------------\n",
      "   +0.0835 if cp<=0.03899315372109413\n",
      "   +1.6557 if cp<=0.08188644200563432\n",
      "   -0.0000 if cp<=0.014091908931732178 & cv>=0.551794171333313\n",
      "   +1.5043 if cv<=0.5699054718017578\n",
      "   -3.6895 if cp>=0.10487756878137589\n",
      "Run episode 360 with rewards 13.0\n",
      "============ 361 ===========\n",
      "10 actions [1, 1, 1, 0, 1, 1, 1, 1, 0, 0]\n",
      "   -1.1255 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   -0.4045 if cp<=0.06110185235738755 & cp>=-0.003091528033837676\n",
      "   +3.6889 if cp<=0.028535769879817974 & cv>=0.5649913311004638\n",
      "   -0.1186 if cp>=0.10487756878137589\n",
      "   +4.9024 if cp<=-0.0011078261770307986 & cv>=0.30543713271617895\n",
      "--------------\n",
      "   -1.2454 if cp<=0.03899315372109413\n",
      "   +1.5384 if cp<=0.08188644200563432\n",
      "   -0.0707 if cv<=0.5699054718017578\n",
      "   +0.0463 if cp>=0.10487756878137589\n",
      "   +2.5198 if cv<=0.30543713271617895\n",
      "Run episode 361 with rewards 10.0\n",
      "============ 362 ===========\n",
      "12 actions [0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1]\n",
      "   -0.5940 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   -1.1448 if cp<=0.06110185235738755 & cp>=-0.003091528033837676\n",
      "   +3.0205 if cp<=0.028535769879817974 & cv>=0.5649913311004638\n",
      "   -0.0000 if cp<=-0.0011078261770307986 & cv>=0.30543713271617895\n",
      "   -1.3386 if cp<=0.03453342840075493 & cp>=0.017335251718759537 & cv<=0.5519150376319886\n",
      "--------------\n",
      "   -0.6730 if cp<=0.03899315372109413\n",
      "   +1.8722 if cp<=0.08188644200563432\n",
      "   +1.5935 if cv<=0.5699054718017578\n",
      "   +0.4465 if cv<=0.30543713271617895\n",
      "   +2.9913 if cp>=0.12228837609291077\n",
      "Run episode 362 with rewards 12.0\n",
      "============ 363 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1]\n",
      "   +2.5742 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   -2.7678 if cp<=0.06110185235738755 & cp>=-0.003091528033837676\n",
      "   +2.1729 if cp<=0.028535769879817974 & cv>=0.5649913311004638\n",
      "   +0.0000 if cp<=0.03453342840075493 & cp>=0.017335251718759537 & cv<=0.5519150376319886\n",
      "   -2.7459 if cp<=-0.022813060879707338\n",
      "--------------\n",
      "   +2.1574 if cp<=0.03899315372109413\n",
      "   +0.1266 if cp<=0.08188644200563432\n",
      "   +0.2333 if cv<=0.5699054718017578\n",
      "   +0.0000 if cp>=0.12228837609291077\n",
      "   -4.8955 if cp>=-0.022813060879707338 & pa>=-0.01905742846429348\n",
      "Run episode 363 with rewards 11.0\n",
      "============ 364 ===========\n",
      "62 actions [0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.6025 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   +0.8222 if cp<=0.06110185235738755 & cp>=-0.003091528033837676\n",
      "   -0.0000 if cp<=0.028535769879817974 & cv>=0.5649913311004638\n",
      "   -1.4259 if cp<=-0.022813060879707338\n",
      "   +0.7998 if cv>=-0.57942134141922\n",
      "--------------\n",
      "   +0.6681 if cp<=0.03899315372109413\n",
      "   +0.6681 if cp<=0.08188644200563432\n",
      "   +0.6681 if cv<=0.5699054718017578\n",
      "   -3.4748 if cp>=-0.022813060879707338 & pa>=-0.01905742846429348\n",
      "   -2.0537 if cv>=-0.38366845250129683\n",
      "Run episode 364 with rewards 62.0\n",
      "============ 365 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   +0.8934 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   +1.4713 if cp<=0.06110185235738755 & cp>=-0.003091528033837676\n",
      "   -0.5012 if cp<=-0.022813060879707338\n",
      "   -0.5375 if cv>=-0.57942134141922\n",
      "   -4.6714 if cp<=-0.040008373558521264 & cp>=-0.0688414305448532 & pa>=0.015934531018137955\n",
      "--------------\n",
      "   +1.8654 if cp<=0.08188644200563432\n",
      "   -0.1470 if cv<=0.5699054718017578\n",
      "   -4.6494 if cp>=-0.022813060879707338 & pa>=-0.01905742846429348\n",
      "   -0.4628 if cv>=-0.38366845250129683\n",
      "   -2.1359 if cv>=-0.22060306966304777 & pa<=-0.0179064685478806\n",
      "Run episode 365 with rewards 9.0\n",
      "============ 366 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +4.2684 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   +0.0441 if cp<=0.06110185235738755 & cp>=-0.003091528033837676\n",
      "   +0.0373 if cv>=-0.57942134141922\n",
      "   +5.1579 if cp<=-0.040008373558521264 & cp>=-0.0688414305448532 & pa>=0.015934531018137955\n",
      "   +3.7978 if pa>=0.19936834275722504\n",
      "--------------\n",
      "   -0.8009 if cp<=0.08188644200563432\n",
      "   -1.2878 if cp>=-0.022813060879707338 & pa>=-0.01905742846429348\n",
      "   -0.6580 if cv>=-0.38366845250129683\n",
      "   -0.0000 if cv>=-0.22060306966304777 & pa<=-0.0179064685478806\n",
      "   +0.6413 if pav>=1.8786249160766602\n",
      "Run episode 366 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 367 ===========\n",
      "33 actions [0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0]\n",
      "   -0.1130 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   +0.0000 if cp<=0.06110185235738755 & cp>=-0.003091528033837676\n",
      "   +0.9495 if cp<=-0.040008373558521264 & cp>=-0.0688414305448532 & pa>=0.015934531018137955\n",
      "   +0.0000 if pa>=0.19936834275722504\n",
      "  -10.4172 if cp<=-0.07443822771310807\n",
      "--------------\n",
      "   -0.2656 if cp<=0.08188644200563432\n",
      "   -0.3221 if cp>=-0.022813060879707338 & pa>=-0.01905742846429348\n",
      "   -0.2527 if cv>=-0.38366845250129683\n",
      "   +0.1263 if pav>=1.8786249160766602\n",
      "   -0.3914 if cp>=-0.043339595943689344\n",
      "Run episode 367 with rewards 33.0\n",
      "============ 368 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   +1.6059 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   +2.7521 if cp<=-0.040008373558521264 & cp>=-0.0688414305448532 & pa>=0.015934531018137955\n",
      "   -0.0494 if pa>=0.19936834275722504\n",
      "   -6.4002 if cp<=-0.07443822771310807\n",
      "   -4.6264 if cp<=-0.03404654264450073 & cv<=-0.575925600528717 & pa<=0.039409229159355165\n",
      "--------------\n",
      "   +2.2411 if cp<=0.08188644200563432\n",
      "   -0.2404 if cp>=-0.022813060879707338 & pa>=-0.01905742846429348\n",
      "   -4.9479 if cv>=-0.38366845250129683\n",
      "   -2.1194 if cp>=-0.043339595943689344\n",
      "   -5.6410 if cp<=-0.03404654264450073 & cv<=-0.3856007754802704 & cv>=-0.575925600528717 & pav<=1.1169506072998048\n",
      "Run episode 368 with rewards 11.0\n",
      "============ 369 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +7.1228 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   +0.3936 if cp<=-0.040008373558521264 & cp>=-0.0688414305448532 & pa>=0.015934531018137955\n",
      "   +8.1158 if cp<=-0.07443822771310807\n",
      "   +0.6747 if cp<=-0.03404654264450073 & cv<=-0.575925600528717 & pa<=0.039409229159355165\n",
      "   +1.1754 if pa>=0.1987810879945755\n",
      "--------------\n",
      "   -2.1589 if cp<=0.08188644200563432\n",
      "   -0.4621 if cv>=-0.38366845250129683\n",
      "   -0.9556 if cp>=-0.043339595943689344\n",
      "   -0.0000 if cp<=-0.03404654264450073 & cv<=-0.3856007754802704 & cv>=-0.575925600528717 & pav<=1.1169506072998048\n",
      "   -0.6358 if pav>=2.2878594398498535\n",
      "Run episode 369 with rewards 9.0\n",
      "============ 370 ===========\n",
      "14 actions [1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0]\n",
      "   -0.6439 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "  -11.1585 if cp<=-0.07443822771310807\n",
      "   +0.0001 if cp<=-0.03404654264450073 & cv<=-0.575925600528717 & pa<=0.039409229159355165\n",
      "   +0.0001 if pa>=0.1987810879945755\n",
      "   -7.8038 if pa>=0.19120833277702332\n",
      "--------------\n",
      "   -0.0624 if cp<=0.08188644200563432\n",
      "   -0.0305 if cv>=-0.38366845250129683\n",
      "   -0.0619 if cp>=-0.043339595943689344\n",
      "   +0.0000 if pav>=2.2878594398498535\n",
      "   -0.0515 if cp>=-0.008232972119003526\n",
      "Run episode 370 with rewards 14.0\n",
      "============ 371 ===========\n",
      "16 actions [1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1]\n",
      "   -0.3236 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   -0.0000 if cp<=-0.07443822771310807\n",
      "   -0.0000 if pa>=0.1987810879945755\n",
      "   -0.0000 if pa>=0.19120833277702332\n",
      "   -3.1721 if cv<=0.15137543976306916\n",
      "--------------\n",
      "   -0.1407 if cp<=0.08188644200563432\n",
      "   -0.1406 if cv>=-0.38366845250129683\n",
      "   -0.1407 if cp>=-0.043339595943689344\n",
      "   -0.4815 if cp>=-0.008232972119003526\n",
      "   +3.1988 if cv<=0.15137543976306916\n",
      "Run episode 371 with rewards 16.0\n",
      "============ 372 ===========\n",
      "35 actions [1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1]\n",
      "   -1.3494 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   +0.0000 if cp<=-0.07443822771310807\n",
      "   +0.0000 if pa>=0.19120833277702332\n",
      "   -3.0272 if cv<=0.15137543976306916\n",
      "   +3.3627 if cv<=0.16462518274784088\n",
      "--------------\n",
      "   -0.0860 if cp<=0.08188644200563432\n",
      "   -0.0860 if cp>=-0.043339595943689344\n",
      "   -0.9179 if cp>=-0.008232972119003526\n",
      "   +1.8772 if cv<=0.15137543976306916\n",
      "   -0.9801 if pa>=-0.06725075840950011 & pav>=-0.4073075354099273\n",
      "Run episode 372 with rewards 35.0\n",
      "============ 373 ===========\n",
      "55 actions [1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1]\n",
      "   -4.6143 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   -0.0000 if cp<=-0.07443822771310807\n",
      "   +0.1079 if cv<=0.15137543976306916\n",
      "   +0.1079 if cv<=0.16462518274784088\n",
      "   +6.6262 if cp<=0.045123687386512755 & cv>=0.1841414213180542\n",
      "--------------\n",
      "   -1.6327 if cp>=-0.043339595943689344\n",
      "   -1.6344 if cp>=-0.008232972119003526\n",
      "   +5.3190 if cv<=0.15137543976306916\n",
      "   -1.6345 if pa>=-0.06725075840950011 & pav>=-0.4073075354099273\n",
      "   +3.8635 if cv>=-0.20255407094955444 & pa<=0.09680629819631577 & pa>=0.07280992269515991\n",
      "Run episode 373 with rewards 55.0\n",
      "============ 374 ===========\n",
      "70 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1]\n",
      "   -7.4711 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   +1.8195 if cv<=0.15137543976306916\n",
      "   +1.8194 if cv<=0.16462518274784088\n",
      "   +9.6413 if cp<=0.045123687386512755 & cv>=0.1841414213180542\n",
      "   -3.8649 if cp>=0.03836637958884239 & cv<=0.03616651371121407\n",
      "--------------\n",
      "   -0.9305 if cp>=-0.008232972119003526\n",
      "   +2.7484 if cv<=0.15137543976306916\n",
      "   -0.9305 if pa>=-0.06725075840950011 & pav>=-0.4073075354099273\n",
      "   +1.9825 if cv>=-0.20255407094955444 & pa<=0.09680629819631577 & pa>=0.07280992269515991\n",
      "   -2.7286 if cv>=0.03616651371121407\n",
      "Run episode 374 with rewards 70.0\n",
      "============ 375 ===========\n",
      "43 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -0.9916 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   -4.1734 if cv<=0.15137543976306916\n",
      "   +3.5437 if cp<=0.045123687386512755 & cv>=0.1841414213180542\n",
      "   +0.1210 if cp>=0.03836637958884239 & cv<=0.03616651371121407\n",
      "   +3.4129 if cp>=0.0680988907814026 & cv<=-0.0012299037072807544\n",
      "--------------\n",
      "   -1.2766 if cp>=-0.008232972119003526\n",
      "   +2.9087 if cv<=0.15137543976306916\n",
      "   +1.3860 if cv>=-0.20255407094955444 & pa<=0.09680629819631577 & pa>=0.07280992269515991\n",
      "   -4.4123 if cv>=0.03616651371121407\n",
      "   +3.0795 if cp<=0.0680988907814026 & cp>=0.042327406257390995 & cv<=0.1863972008228302\n",
      "Run episode 375 with rewards 43.0\n",
      "============ 376 ===========\n",
      "29 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.2851 if cp<=0.04191069379448891 & cv<=0.419805246591568\n",
      "   -1.4594 if cv<=0.15137543976306916\n",
      "   +0.9996 if cp<=0.045123687386512755 & cv>=0.1841414213180542\n",
      "   -0.7149 if cp>=0.0680988907814026 & cv<=-0.0012299037072807544\n",
      "   -4.4804 if cp<=0.05791991204023362 & cv<=0.17877845764160158\n",
      "--------------\n",
      "   +2.3231 if cv<=0.15137543976306916\n",
      "   -1.2068 if cv>=-0.20255407094955444 & pa<=0.09680629819631577 & pa>=0.07280992269515991\n",
      "   -3.1034 if cv>=0.03616651371121407\n",
      "   +2.8956 if cp<=0.0680988907814026 & cp>=0.042327406257390995 & cv<=0.1863972008228302\n",
      "   -2.8138 if cv>=0.17877845764160158 & pav>=0.11616250872612001\n",
      "Run episode 376 with rewards 29.0\n",
      "============ 377 ===========\n",
      "23 actions [1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -2.2520 if cv<=0.15137543976306916\n",
      "   +1.4299 if cp<=0.045123687386512755 & cv>=0.1841414213180542\n",
      "   -0.0000 if cp>=0.0680988907814026 & cv<=-0.0012299037072807544\n",
      "   -2.0185 if cp<=0.05791991204023362 & cv<=0.17877845764160158\n",
      "   +1.1742 if \n",
      "--------------\n",
      "   +1.5396 if cv<=0.15137543976306916\n",
      "   -3.8411 if cv>=0.03616651371121407\n",
      "   +1.0057 if cp<=0.0680988907814026 & cp>=0.042327406257390995 & cv<=0.1863972008228302\n",
      "   +0.0000 if cv>=0.17877845764160158 & pav>=0.11616250872612001\n",
      "   -1.0396 if cp<=0.06352734118700028 & cp>=0.03869664147496224 & cv>=0.017582559213042262\n",
      "Run episode 377 with rewards 23.0\n",
      "============ 378 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.4001 if cv<=0.15137543976306916\n",
      "   -1.8737 if cp<=0.045123687386512755 & cv>=0.1841414213180542\n",
      "   -2.1261 if cp<=0.05791991204023362 & cv<=0.17877845764160158\n",
      "   +2.0997 if \n",
      "   -2.9084 if cp>=0.010750044882297518\n",
      "--------------\n",
      "   -2.9435 if cv<=0.15137543976306916\n",
      "   +0.3960 if cv>=0.03616651371121407\n",
      "   -1.1327 if cp<=0.0680988907814026 & cp>=0.042327406257390995 & cv<=0.1863972008228302\n",
      "   -2.2269 if cp<=0.06352734118700028 & cp>=0.03869664147496224 & cv>=0.017582559213042262\n",
      "   +5.2914 if cv<=0.14919012486934663\n",
      "Run episode 378 with rewards 9.0\n",
      "============ 379 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0802 if cv<=0.15137543976306916\n",
      "   -0.0802 if cp<=0.05791991204023362 & cv<=0.17877845764160158\n",
      "   -1.6093 if \n",
      "   -0.9635 if cp>=0.010750044882297518\n",
      "   -1.6093 if \n",
      "--------------\n",
      "   +0.1487 if cv<=0.15137543976306916\n",
      "   -0.0000 if cp<=0.0680988907814026 & cp>=0.042327406257390995 & cv<=0.1863972008228302\n",
      "   +0.9580 if cp<=0.06352734118700028 & cp>=0.03869664147496224 & cv>=0.017582559213042262\n",
      "   +0.1487 if cv<=0.14919012486934663\n",
      "   +2.3836 if cp<=0.010191611200571061\n",
      "Run episode 379 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 380 ===========\n",
      "68 actions [1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   -0.2769 if cp<=0.05791991204023362 & cv<=0.17877845764160158\n",
      "   -1.5207 if \n",
      "   -0.4627 if cp>=0.010750044882297518\n",
      "   +2.5237 if cp>=0.03656812123954297\n",
      "   +5.3624 if cp>=0.10907566547393799\n",
      "--------------\n",
      "   +0.1606 if cv<=0.15137543976306916\n",
      "   +0.1231 if cp<=0.06352734118700028 & cp>=0.03869664147496224 & cv>=0.017582559213042262\n",
      "   +0.1606 if cv<=0.14919012486934663\n",
      "   +0.5755 if cp<=0.010191611200571061\n",
      "   +0.7519 if cp<=0.03656812123954297\n",
      "Run episode 380 with rewards 68.0\n",
      "============ 381 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   -3.7741 if \n",
      "   -0.3658 if cp>=0.010750044882297518\n",
      "   +4.0219 if cp>=0.03656812123954297\n",
      "   +5.7628 if cp>=0.10907566547393799\n",
      "   +4.7978 if cp>=0.07284396141767502 & pa>=-0.02522238940000534\n",
      "--------------\n",
      "   +0.4410 if cv<=0.15137543976306916\n",
      "   +0.4410 if cv<=0.14919012486934663\n",
      "   +1.3367 if cp<=0.010191611200571061\n",
      "   +5.2763 if cp<=0.03656812123954297\n",
      "   -2.5417 if cp<=0.04475419446825982\n",
      "Run episode 381 with rewards 10.0\n",
      "============ 382 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.5977 if \n",
      "   -0.4577 if cp>=0.03656812123954297\n",
      "   -2.1755 if cp>=0.10907566547393799\n",
      "   -0.0000 if cp>=0.07284396141767502 & pa>=-0.02522238940000534\n",
      "   +2.8136 if cv>=0.9684635162353515\n",
      "--------------\n",
      "   +0.0534 if cv<=0.15137543976306916\n",
      "   +0.0000 if cp<=0.010191611200571061\n",
      "   +0.2092 if cp<=0.03656812123954297\n",
      "   +0.2092 if cp<=0.04475419446825982\n",
      "   +1.6349 if cp<=0.05846913382411004\n",
      "Run episode 382 with rewards 9.0\n",
      "============ 383 ===========\n",
      "24 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   -1.2356 if \n",
      "   +7.1330 if cp>=0.03656812123954297\n",
      "   +0.0000 if cp>=0.10907566547393799\n",
      "   +2.8255 if cv>=0.9684635162353515\n",
      "   +5.6326 if cp>=0.0696534812450409\n",
      "--------------\n",
      "   +0.2669 if cv<=0.15137543976306916\n",
      "   +2.8827 if cp<=0.03656812123954297\n",
      "   +1.7719 if cp<=0.04475419446825982\n",
      "   +1.7719 if cp<=0.05846913382411004\n",
      "   -3.7809 if \n",
      "Run episode 383 with rewards 24.0\n",
      "============ 384 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -1.3033 if \n",
      "   +4.9980 if cp>=0.03656812123954297\n",
      "   +0.1039 if cv>=0.9684635162353515\n",
      "   +0.1038 if cp>=0.0696534812450409\n",
      "   +0.1305 if pa>=0.1783704161643982\n",
      "--------------\n",
      "   +2.4567 if cp<=0.03656812123954297\n",
      "   +0.4437 if cp<=0.04475419446825982\n",
      "   +0.4533 if cp<=0.05846913382411004\n",
      "   +0.4505 if \n",
      "   -0.0535 if pa>=0.1783704161643982\n",
      "Run episode 384 with rewards 9.0\n",
      "============ 385 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -4.3537 if \n",
      "   -6.2846 if cp>=0.03656812123954297\n",
      "   -3.6610 if cv>=0.9684635162353515\n",
      "   -0.0697 if pa>=0.1783704161643982\n",
      "   -0.5039 if cp>=0.06343476474285126\n",
      "--------------\n",
      "   +0.7746 if cp<=0.03656812123954297\n",
      "   +0.7746 if cp<=0.04475419446825982\n",
      "   +0.7746 if cp<=0.05846913382411004\n",
      "   +1.1689 if \n",
      "   +0.0720 if cp<=0.0221261564642191 & cp>=-0.009768184553831804 & cp>=-0.03147666454315185\n",
      "Run episode 385 with rewards 10.0\n",
      "============ 386 ===========\n",
      "13 actions [0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   -0.8212 if \n",
      "   +0.3313 if cp>=0.03656812123954297\n",
      "   +0.8356 if cv>=0.9684635162353515\n",
      "   +2.4516 if cp>=0.06343476474285126\n",
      "   +8.6945 if cp>=0.10433796048164368\n",
      "--------------\n",
      "   +0.3078 if cp<=0.03656812123954297\n",
      "   +0.3080 if cp<=0.04475419446825982\n",
      "   +0.3080 if cp<=0.05846913382411004\n",
      "   +0.3080 if \n",
      "   +0.1650 if cp<=0.017755144834518434\n",
      "Run episode 386 with rewards 13.0\n",
      "============ 387 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.8998 if \n",
      "   +1.3585 if cv>=0.9684635162353515\n",
      "   -2.4245 if cp>=0.06343476474285126\n",
      "   -3.3128 if cp>=0.10433796048164368\n",
      "   -2.7433 if pa>=-0.030563800409436227\n",
      "--------------\n",
      "   -0.7467 if cp<=0.03656812123954297\n",
      "   -0.7467 if cp<=0.04475419446825982\n",
      "   +0.4893 if cp<=0.05846913382411004\n",
      "   +0.4002 if \n",
      "   +2.9480 if pa>=-0.030563800409436227\n",
      "Run episode 387 with rewards 10.0\n",
      "============ 388 ===========\n",
      "31 actions [1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +1.6786 if cv>=0.9684635162353515\n",
      "   +1.0292 if cp>=0.06343476474285126\n",
      "   +6.8720 if cp>=0.10433796048164368\n",
      "   -1.2203 if pa>=-0.030563800409436227\n",
      "   +4.0709 if cp>=0.18228232860565186\n",
      "--------------\n",
      "   +0.0000 if cp<=0.03656812123954297\n",
      "   +0.0000 if cp<=0.04475419446825982\n",
      "   +0.6973 if cp<=0.05846913382411004\n",
      "   +0.7292 if pa>=-0.030563800409436227\n",
      "   +1.5849 if cp<=0.12991291284561157\n",
      "Run episode 388 with rewards 31.0\n",
      "============ 389 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +4.3123 if cv>=0.9684635162353515\n",
      "   +4.9063 if cp>=0.10433796048164368\n",
      "   -2.3006 if pa>=-0.030563800409436227\n",
      "   -0.0000 if cp>=0.18228232860565186\n",
      "   -1.9396 if cp>=0.013428708538413048 & pa>=-0.12422385811805725 & pav<=-1.1635535955429077 & pav>=-1.1635535955429077\n",
      "--------------\n",
      "   +0.3147 if cp<=0.03656812123954297\n",
      "   +1.6017 if cp<=0.05846913382411004\n",
      "   +2.4660 if pa>=-0.030563800409436227\n",
      "   +3.7707 if cp<=0.12991291284561157\n",
      "   -3.4429 if cv>=-0.14763273298740387 & pa>=-0.05089149996638298\n",
      "Run episode 389 with rewards 10.0\n",
      "============ 390 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   +3.2770 if cv>=0.9684635162353515\n",
      "   +1.8282 if cp>=0.10433796048164368\n",
      "   -0.1238 if pa>=-0.030563800409436227\n",
      "   +0.0000 if cp>=0.013428708538413048 & pa>=-0.12422385811805725 & pav<=-1.1635535955429077 & pav>=-1.1635535955429077\n",
      "   -1.8500 if cp<=0.0653747260570526\n",
      "--------------\n",
      "   +0.1441 if cp<=0.05846913382411004\n",
      "   +0.1441 if pa>=-0.030563800409436227\n",
      "   +1.8682 if cp<=0.12991291284561157\n",
      "   +0.5830 if cv>=-0.14763273298740387 & pa>=-0.05089149996638298\n",
      "   +1.1773 if cp<=0.09223462790250779 & cv<=0.7479923367500305\n",
      "Run episode 390 with rewards 9.0\n",
      "============ 391 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -6.9737 if cv>=0.9684635162353515\n",
      "   -0.0000 if cp>=0.10433796048164368\n",
      "   -0.2585 if pa>=-0.030563800409436227\n",
      "   -0.9900 if cp<=0.0653747260570526\n",
      "   -4.8679 if cp>=0.09874916076660156\n",
      "--------------\n",
      "   +0.0380 if cp<=0.05846913382411004\n",
      "   +6.9623 if cp<=0.12991291284561157\n",
      "   +0.0093 if cv>=-0.14763273298740387 & pa>=-0.05089149996638298\n",
      "   +0.0093 if cp<=0.09223462790250779 & cv<=0.7479923367500305\n",
      "   +4.8661 if cp>=0.09874916076660156\n",
      "Run episode 391 with rewards 10.0\n",
      "============ 392 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 0, 1, 1, 0, 0]\n",
      "   +7.2427 if cv>=0.9684635162353515\n",
      "   -0.0253 if pa>=-0.030563800409436227\n",
      "   -1.3797 if cp<=0.0653747260570526\n",
      "   +9.4216 if cp>=0.09874916076660156\n",
      "   +2.6599 if cp>=0.14110326766967773\n",
      "--------------\n",
      "   +1.2035 if cp<=0.05846913382411004\n",
      "   +1.2045 if cp<=0.12991291284561157\n",
      "   +0.9015 if cv>=-0.14763273298740387 & pa>=-0.05089149996638298\n",
      "   -0.0001 if cp>=0.09874916076660156\n",
      "   +0.3713 if cp<=0.0073036282323300835\n",
      "Run episode 392 with rewards 10.0\n",
      "============ 393 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.7856 if cv>=0.9684635162353515\n",
      "   +0.5926 if cp<=0.0653747260570526\n",
      "   -0.0000 if cp>=0.09874916076660156\n",
      "   -0.0000 if cp>=0.14110326766967773\n",
      "   -5.9076 if cp>=0.022265415824949748 & cv>=0.8636269807815552\n",
      "--------------\n",
      "   +1.6202 if cp<=0.05846913382411004\n",
      "   +1.6420 if cp<=0.12991291284561157\n",
      "   +0.3695 if cv>=-0.14763273298740387 & pa>=-0.05089149996638298\n",
      "   +0.4489 if cp<=0.0073036282323300835\n",
      "   +1.7371 if cp<=0.053675672411918646 & cp>=0.022265415824949748 & cv>=0.8636269807815552\n",
      "Run episode 393 with rewards 10.0\n",
      "============ 394 ===========\n",
      "13 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.3273 if cv>=0.9684635162353515\n",
      "   -2.6245 if cp<=0.0653747260570526\n",
      "   +7.9369 if cp>=0.09874916076660156\n",
      "   +1.3245 if cp>=0.022265415824949748 & cv>=0.8636269807815552\n",
      "   +0.7692 if cp>=0.037615477293729785\n",
      "--------------\n",
      "   +2.0796 if cp<=0.05846913382411004\n",
      "   +2.0968 if cp<=0.12991291284561157\n",
      "   -0.0000 if cp<=0.0073036282323300835\n",
      "   -0.0000 if cp<=0.053675672411918646 & cp>=0.022265415824949748 & cv>=0.8636269807815552\n",
      "   +0.7027 if cp<=0.02113799788057804\n",
      "Run episode 394 with rewards 13.0\n",
      "============ 395 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 0, 0, 1, 1]\n",
      "   +2.3695 if cv>=0.9684635162353515\n",
      "   -1.2771 if cp<=0.0653747260570526\n",
      "   +2.4112 if cp>=0.09874916076660156\n",
      "   +0.1160 if cp>=0.022265415824949748 & cv>=0.8636269807815552\n",
      "   +1.6702 if cv>=1.1633527278900146\n",
      "--------------\n",
      "   +0.4729 if cp<=0.05846913382411004\n",
      "   +3.2502 if cp<=0.12991291284561157\n",
      "   -0.0000 if cp<=0.053675672411918646 & cp>=0.022265415824949748 & cv>=0.8636269807815552\n",
      "   -0.0000 if cp<=0.02113799788057804\n",
      "   -1.8021 if cv>=1.1633527278900146\n",
      "Run episode 395 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 396 ===========\n",
      "26 actions [1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0]\n",
      "   +3.3494 if cv>=0.9684635162353515\n",
      "   -0.4436 if cp<=0.0653747260570526\n",
      "   +0.0000 if cp>=0.09874916076660156\n",
      "   +0.7683 if cv>=1.1633527278900146\n",
      "   -1.1356 if cp<=0.02564563043415547 & cv>=0.8965176343917848\n",
      "--------------\n",
      "   +2.3730 if cp<=0.05846913382411004\n",
      "   -2.0613 if cp<=0.12991291284561157\n",
      "   +2.6571 if cp<=0.02113799788057804\n",
      "   -0.2841 if cv>=1.1633527278900146\n",
      "   -0.2250 if cp>=0.02564563043415547 & cv<=1.0139300346374511\n",
      "Run episode 396 with rewards 26.0\n",
      "============ 397 ===========\n",
      "15 actions [0, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0]\n",
      "   +1.3304 if cv>=0.9684635162353515\n",
      "   +2.0674 if cp<=0.0653747260570526\n",
      "   -0.0000 if cv>=1.1633527278900146\n",
      "   -0.0000 if cp<=0.02564563043415547 & cv>=0.8965176343917848\n",
      "   -5.1862 if cp<=0.054408326745033264 & cp<=0.12786857783794403 & cv<=0.6056643128395081\n",
      "--------------\n",
      "   +0.7712 if cp<=0.05846913382411004\n",
      "   +1.6460 if cp<=0.12991291284561157\n",
      "   +3.3455 if cp<=0.02113799788057804\n",
      "   -0.0000 if cv>=1.1633527278900146\n",
      "   -2.0915 if cv>=-0.14371004700660706 & pa>=-0.15884847939014435\n",
      "Run episode 397 with rewards 15.0\n",
      "============ 398 ===========\n",
      "32 actions [0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1]\n",
      "   +1.5118 if cv>=0.9684635162353515\n",
      "   +1.5441 if cp<=0.0653747260570526\n",
      "   +0.0000 if cp<=0.02564563043415547 & cv>=0.8965176343917848\n",
      "   -1.1501 if cp<=0.054408326745033264 & cp<=0.12786857783794403 & cv<=0.6056643128395081\n",
      "   -3.4067 if pa>=0.0021245435811579247\n",
      "--------------\n",
      "   -3.1620 if cp<=0.05846913382411004\n",
      "   +2.3001 if cp<=0.12991291284561157\n",
      "   -0.0000 if cp<=0.02113799788057804\n",
      "   -2.1312 if cv>=-0.14371004700660706 & pa>=-0.15884847939014435\n",
      "   +3.2587 if pa>=0.0021245435811579247\n",
      "Run episode 398 with rewards 32.0\n",
      "============ 399 ===========\n",
      "30 actions [1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   +0.0463 if cv>=0.9684635162353515\n",
      "   +1.4849 if cp<=0.0653747260570526\n",
      "   -1.8514 if cp<=0.054408326745033264 & cp<=0.12786857783794403 & cv<=0.6056643128395081\n",
      "   -6.4998 if pa>=0.0021245435811579247\n",
      "   +2.2812 if cp<=2.357817720621976e-05\n",
      "--------------\n",
      "   -3.3518 if cp<=0.05846913382411004\n",
      "   +0.7434 if cp<=0.12991291284561157\n",
      "   -1.1413 if cv>=-0.14371004700660706 & pa>=-0.15884847939014435\n",
      "   +5.4421 if pa>=0.0021245435811579247\n",
      "   +5.6386 if cp>=2.357817720621976e-05 & cv<=-0.20287275910377503\n",
      "Run episode 399 with rewards 30.0\n",
      "============ 400 ===========\n",
      "57 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0]\n",
      "   +2.9474 if cp<=0.0653747260570526\n",
      "   +0.3476 if cp<=0.054408326745033264 & cp<=0.12786857783794403 & cv<=0.6056643128395081\n",
      "   -4.4918 if pa>=0.0021245435811579247\n",
      "   -0.2277 if cp<=2.357817720621976e-05\n",
      "   -1.4944 if cp<=0.07366606891155245\n",
      "--------------\n",
      "   -2.8162 if cp<=0.05846913382411004\n",
      "   -0.2522 if cv>=-0.14371004700660706 & pa>=-0.15884847939014435\n",
      "   +3.7527 if pa>=0.0021245435811579247\n",
      "   +0.0000 if cp>=2.357817720621976e-05 & cv<=-0.20287275910377503\n",
      "   +0.4873 if cp<=0.07366606891155245\n",
      "Run episode 400 with rewards 57.0\n",
      "============ 401 ===========\n",
      "38 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1]\n",
      "   +2.1179 if cp<=0.0653747260570526\n",
      "   -0.6292 if cp<=0.054408326745033264 & cp<=0.12786857783794403 & cv<=0.6056643128395081\n",
      "   -4.9510 if pa>=0.0021245435811579247\n",
      "   +2.1179 if cp<=0.07366606891155245\n",
      "   -3.1309 if cp>=-0.15073510706424711\n",
      "--------------\n",
      "   +0.3008 if cp<=0.05846913382411004\n",
      "   -5.0312 if cv>=-0.14371004700660706 & pa>=-0.15884847939014435\n",
      "   +4.6857 if pa>=0.0021245435811579247\n",
      "   +0.2879 if cp<=0.07366606891155245\n",
      "   -3.2661 if cp<=0.03709249496459964 & cv<=-0.20091741383075715\n",
      "Run episode 401 with rewards 38.0\n",
      "============ 402 ===========\n",
      "43 actions [1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 1]\n",
      "   +0.4982 if cp<=0.0653747260570526\n",
      "   -3.0472 if pa>=0.0021245435811579247\n",
      "   +0.3977 if cp<=0.07366606891155245\n",
      "   -2.4471 if cp>=-0.15073510706424711\n",
      "   -5.0807 if cp>=0.08948071151971818 & pa>=-0.054486496001482004 & pav>=-0.1699135154485702\n",
      "--------------\n",
      "   +3.3113 if cp<=0.05846913382411004\n",
      "   -6.3399 if cv>=-0.14371004700660706 & pa>=-0.15884847939014435\n",
      "   +3.3113 if pa>=0.0021245435811579247\n",
      "   -0.0000 if cp<=0.03709249496459964 & cv<=-0.20091741383075715\n",
      "   +5.5999 if cp>=0.08948071151971818 & pa>=-0.054486496001482004 & pav>=-0.1699135154485702\n",
      "Run episode 402 with rewards 43.0\n",
      "============ 403 ===========\n",
      "27 actions [1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 1]\n",
      "   -2.8104 if cp<=0.0653747260570526\n",
      "   -1.9787 if pa>=0.0021245435811579247\n",
      "   -0.0377 if cp>=-0.15073510706424711\n",
      "   +0.0000 if cp>=0.08948071151971818 & pa>=-0.054486496001482004 & pav>=-0.1699135154485702\n",
      "   +3.2558 if cv>=0.5837278962135315\n",
      "--------------\n",
      "   +4.1153 if cp<=0.05846913382411004\n",
      "   -6.0629 if cv>=-0.14371004700660706 & pa>=-0.15884847939014435\n",
      "   +2.3051 if pa>=0.0021245435811579247\n",
      "   -0.0000 if cp>=0.08948071151971818 & pa>=-0.054486496001482004 & pav>=-0.1699135154485702\n",
      "   -4.4857 if cp>=0.07105790078639984\n",
      "Run episode 403 with rewards 27.0\n",
      "============ 404 ===========\n",
      "40 actions [1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1]\n",
      "   -3.1383 if cp<=0.0653747260570526\n",
      "   -0.0000 if pa>=0.0021245435811579247\n",
      "   +1.6619 if cp>=-0.15073510706424711\n",
      "   -0.0000 if cv>=0.5837278962135315\n",
      "   -4.3432 if cp<=0.039748097956180575 & pa>=-0.052654109150171276 & pav>=-0.47196046710014344\n",
      "--------------\n",
      "   +2.4805 if cp<=0.05846913382411004\n",
      "   -4.5833 if cv>=-0.14371004700660706 & pa>=-0.15884847939014435\n",
      "   -0.0000 if pa>=0.0021245435811579247\n",
      "   -2.5321 if cp>=0.07105790078639984\n",
      "   -4.1695 if cp<=0.039748097956180575 & cv>=0.18841646909713747\n",
      "Run episode 404 with rewards 40.0\n",
      "============ 405 ===========\n",
      "29 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0]\n",
      "   -0.8467 if cp<=0.0653747260570526\n",
      "   -0.8467 if cp>=-0.15073510706424711\n",
      "   -0.0000 if cv>=0.5837278962135315\n",
      "   -5.1158 if cp<=0.039748097956180575 & pa>=-0.052654109150171276 & pav>=-0.47196046710014344\n",
      "   +2.6798 if pa>=0.03044209927320481\n",
      "--------------\n",
      "   +1.0439 if cp<=0.05846913382411004\n",
      "   -2.9598 if cv>=-0.14371004700660706 & pa>=-0.15884847939014435\n",
      "   -0.0000 if cp>=0.07105790078639984\n",
      "   -6.4768 if cp<=0.039748097956180575 & cv>=0.18841646909713747\n",
      "   -4.0414 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "Run episode 405 with rewards 29.0\n",
      "============ 406 ===========\n",
      "36 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0]\n",
      "   -1.2758 if cp<=0.0653747260570526\n",
      "   -2.4079 if cp>=-0.15073510706424711\n",
      "   -2.5704 if cp<=0.039748097956180575 & pa>=-0.052654109150171276 & pav>=-0.47196046710014344\n",
      "   -0.0000 if pa>=0.03044209927320481\n",
      "   +3.6861 if pa<=-0.11208502501249312 & pa>=-0.14062108099460602 & pav<=-0.07925299257040024\n",
      "--------------\n",
      "   +4.1655 if cp<=0.05846913382411004\n",
      "   -3.7848 if cv>=-0.14371004700660706 & pa>=-0.15884847939014435\n",
      "   -4.1170 if cp<=0.039748097956180575 & cv>=0.18841646909713747\n",
      "   -6.6303 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   +4.8078 if cv<=0.05177219510078432 & pa>=-0.11208502501249312 & pav<=-0.22525151669979088\n",
      "Run episode 406 with rewards 36.0\n",
      "============ 407 ===========\n",
      "12 actions [1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1]\n",
      "   -2.9079 if cp<=0.0653747260570526\n",
      "   -2.9079 if cp>=-0.15073510706424711\n",
      "   +0.3106 if cp<=0.039748097956180575 & pa>=-0.052654109150171276 & pav>=-0.47196046710014344\n",
      "   +0.0862 if pa<=-0.11208502501249312 & pa>=-0.14062108099460602 & pav<=-0.07925299257040024\n",
      "   +0.4472 if cp<=0.017757041379809393\n",
      "--------------\n",
      "   +0.4379 if cp<=0.05846913382411004\n",
      "   -7.9054 if cp<=0.039748097956180575 & cv>=0.18841646909713747\n",
      "   -3.5860 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   +0.3149 if cv<=0.05177219510078432 & pa>=-0.11208502501249312 & pav<=-0.22525151669979088\n",
      "   +3.1694 if pa<=-0.06270446628332138 & pav<=-0.32724449038505554\n",
      "Run episode 407 with rewards 12.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 408 ===========\n",
      "16 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0]\n",
      "   -2.6866 if cp<=0.0653747260570526\n",
      "   -1.5809 if cp>=-0.15073510706424711\n",
      "   -0.3857 if cp<=0.039748097956180575 & pa>=-0.052654109150171276 & pav>=-0.47196046710014344\n",
      "   -0.0000 if cp<=0.017757041379809393\n",
      "   -2.1161 if cp<=0.07158641666173937 & cp>=0.034048267453908924 & cv>=0.2175112009048462\n",
      "--------------\n",
      "   -0.0655 if cp<=0.05846913382411004\n",
      "   -3.9705 if cp<=0.039748097956180575 & cv>=0.18841646909713747\n",
      "   -3.5136 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   -1.2146 if pa<=-0.06270446628332138 & pav<=-0.32724449038505554\n",
      "   -6.2960 if cp>=0.15454915165901184\n",
      "Run episode 408 with rewards 16.0\n",
      "============ 409 ===========\n",
      "28 actions [1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0]\n",
      "   -1.6551 if cp<=0.0653747260570526\n",
      "   -1.9656 if cp>=-0.15073510706424711\n",
      "   -0.5320 if cp<=0.039748097956180575 & pa>=-0.052654109150171276 & pav>=-0.47196046710014344\n",
      "   -2.0733 if cp<=0.07158641666173937 & cp>=0.034048267453908924 & cv>=0.2175112009048462\n",
      "   -1.5645 if cv<=0.17791473865509033\n",
      "--------------\n",
      "   -4.1779 if cp<=0.039748097956180575 & cv>=0.18841646909713747\n",
      "   -3.0267 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   -0.5442 if pa<=-0.06270446628332138 & pav<=-0.32724449038505554\n",
      "   -0.0000 if cp>=0.15454915165901184\n",
      "   -1.3999 if cp<=0.031056124716997154 & cv>=0.17791473865509033\n",
      "Run episode 409 with rewards 28.0\n",
      "============ 410 ===========\n",
      "11 actions [0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1]\n",
      "   -0.5994 if cp<=0.0653747260570526\n",
      "   -5.1676 if cp>=-0.15073510706424711\n",
      "   -0.4540 if cp<=0.07158641666173937 & cp>=0.034048267453908924 & cv>=0.2175112009048462\n",
      "   -0.5746 if cv<=0.17791473865509033\n",
      "   +3.2680 if pa>=0.014674222096800804\n",
      "--------------\n",
      "   -3.2930 if cp<=0.039748097956180575 & cv>=0.18841646909713747\n",
      "   -4.6834 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   +1.1701 if pa<=-0.06270446628332138 & pav<=-0.32724449038505554\n",
      "   +0.3727 if cp<=0.031056124716997154 & cv>=0.17791473865509033\n",
      "   -4.0783 if pa>=0.014674222096800804\n",
      "Run episode 410 with rewards 11.0\n",
      "============ 411 ===========\n",
      "14 actions [0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   -0.4020 if cp<=0.0653747260570526\n",
      "   -0.4020 if cp>=-0.15073510706424711\n",
      "   -0.4020 if cv<=0.17791473865509033\n",
      "   -0.4020 if pa>=0.014674222096800804\n",
      "   -3.7712 if cv<=-0.8011940121650696\n",
      "--------------\n",
      "   -0.0000 if cp<=0.039748097956180575 & cv>=0.18841646909713747\n",
      "   -0.0000 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   -0.0000 if pa<=-0.06270446628332138 & pav<=-0.32724449038505554\n",
      "   -6.0218 if pa>=0.014674222096800804\n",
      "   +4.6074 if cp>=-0.08459462970495224 & cv<=-0.6099400520324707\n",
      "Run episode 411 with rewards 14.0\n",
      "============ 412 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.3719 if cp<=0.0653747260570526\n",
      "   +0.3619 if cv<=0.17791473865509033\n",
      "   -0.0000 if pa>=0.014674222096800804\n",
      "   -0.0000 if cv<=-0.8011940121650696\n",
      "   -3.0990 if pa>=-0.0048870470374822615\n",
      "--------------\n",
      "   -1.3614 if cp<=0.039748097956180575 & cv>=0.18841646909713747\n",
      "   +3.8502 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   -0.0000 if pa>=0.014674222096800804\n",
      "   -0.0000 if cp>=-0.08459462970495224 & cv<=-0.6099400520324707\n",
      "   -5.1080 if cp<=0.03696828559041024 & cv>=0.6120929479598999\n",
      "Run episode 412 with rewards 8.0\n",
      "============ 413 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   -1.7350 if cp<=0.0653747260570526\n",
      "   -1.1244 if cv<=0.17791473865509033\n",
      "   -0.0000 if cv<=-0.8011940121650696\n",
      "   -0.0000 if pa>=-0.0048870470374822615\n",
      "   +0.0031 if cp>=0.03713083826005459\n",
      "--------------\n",
      "   +1.8994 if cp<=0.039748097956180575 & cv>=0.18841646909713747\n",
      "   +0.7485 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   +0.0000 if pa>=0.014674222096800804\n",
      "   +0.0000 if cp<=0.03696828559041024 & cv>=0.6120929479598999\n",
      "   +2.1485 if pa>=-0.036416713148355484\n",
      "Run episode 413 with rewards 10.0\n",
      "============ 414 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.0150 if cp<=0.0653747260570526\n",
      "   -0.6013 if cv<=0.17791473865509033\n",
      "   -0.6579 if pa>=-0.0048870470374822615\n",
      "   -3.8450 if cp>=0.03713083826005459\n",
      "   -3.9101 if cv>=1.5416429042816162\n",
      "--------------\n",
      "   +0.0965 if cp<=0.039748097956180575 & cv>=0.18841646909713747\n",
      "   +3.8717 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   +0.0539 if cp<=0.03696828559041024 & cv>=0.6120929479598999\n",
      "   +1.0515 if pa>=-0.036416713148355484\n",
      "   +3.9092 if cv>=1.5416429042816162\n",
      "Run episode 414 with rewards 9.0\n",
      "============ 415 ===========\n",
      "12 actions [1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0]\n",
      "   -0.8108 if cp<=0.0653747260570526\n",
      "   +0.0000 if pa>=-0.0048870470374822615\n",
      "   -0.9003 if cp>=0.03713083826005459\n",
      "   +0.0013 if cv>=1.5416429042816162\n",
      "   -0.7134 if pa>=-0.02863243967294693\n",
      "--------------\n",
      "   +0.0000 if cp<=0.039748097956180575 & cv>=0.18841646909713747\n",
      "   +0.2732 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   +0.1811 if pa>=-0.036416713148355484\n",
      "   -0.0025 if cv>=1.5416429042816162\n",
      "   +0.3889 if cp<=0.11195867955684663\n",
      "Run episode 415 with rewards 12.0\n",
      "============ 416 ===========\n",
      "10 actions [1, 1, 0, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7839 if cp<=0.0653747260570526\n",
      "   -6.6593 if cp>=0.03713083826005459\n",
      "   -0.0000 if cv>=1.5416429042816162\n",
      "   +0.7918 if pa>=-0.02863243967294693\n",
      "   -2.7758 if cv<=0.22931289672851565\n",
      "--------------\n",
      "   -2.3774 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   +0.1436 if pa>=-0.036416713148355484\n",
      "   +0.0000 if cv>=1.5416429042816162\n",
      "   +0.0940 if cp<=0.11195867955684663\n",
      "   +6.8170 if cp>=-0.00813198760151863\n",
      "Run episode 416 with rewards 10.0\n",
      "============ 417 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   +0.0218 if cp<=0.0653747260570526\n",
      "   +8.0600 if cp>=0.03713083826005459\n",
      "   -1.7660 if pa>=-0.02863243967294693\n",
      "   -2.9022 if cv<=0.22931289672851565\n",
      "   +6.8878 if cp>=0.0839681327342987\n",
      "--------------\n",
      "   -0.3990 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   -1.9194 if pa>=-0.036416713148355484\n",
      "   +0.1504 if cp<=0.11195867955684663\n",
      "   +2.0697 if cp>=-0.00813198760151863\n",
      "   +2.0750 if cp<=-0.009995092265307903\n",
      "Run episode 417 with rewards 9.0\n",
      "============ 418 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -9.8809 if cp>=0.03713083826005459\n",
      "   -0.0016 if pa>=-0.02863243967294693\n",
      "   -1.2419 if cv<=0.22931289672851565\n",
      "   -0.0064 if cp>=0.0839681327342987\n",
      "   -2.0198 if cp<=0.004474838823080074\n",
      "--------------\n",
      "   +1.3015 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   +0.1858 if pa>=-0.036416713148355484\n",
      "   +0.5727 if cp>=-0.00813198760151863\n",
      "   +0.9146 if cp<=-0.009995092265307903\n",
      "   +1.4873 if \n",
      "Run episode 418 with rewards 10.0\n",
      "============ 419 ===========\n",
      "10 actions [1, 1, 1, 0, 1, 1, 1, 1, 1, 1]\n",
      "   -0.6613 if cp>=0.03713083826005459\n",
      "   -0.5878 if cv<=0.22931289672851565\n",
      "   +0.2504 if cp>=0.0839681327342987\n",
      "   +0.0000 if cp<=0.004474838823080074\n",
      "   -0.9473 if cp<=0.12150578498840332\n",
      "--------------\n",
      "   +0.0024 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   +0.0032 if cp>=-0.00813198760151863\n",
      "   -0.0000 if cp<=-0.009995092265307903\n",
      "   +0.0032 if \n",
      "   +0.0036 if cp<=0.08179659247398377\n",
      "Run episode 419 with rewards 10.0\n",
      "============ 420 ===========\n",
      "10 actions [1, 1, 1, 0, 1, 1, 1, 0, 0, 0]\n",
      "   +2.4325 if cp>=0.03713083826005459\n",
      "   -1.3047 if cv<=0.22931289672851565\n",
      "   +3.9989 if cp>=0.0839681327342987\n",
      "   -4.7416 if cp<=0.12150578498840332\n",
      "   +3.5682 if cp<=0.06456989496946335 & cv>=0.46514596939086916\n",
      "--------------\n",
      "   -1.5707 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   -1.0670 if cp>=-0.00813198760151863\n",
      "   -1.0670 if \n",
      "   +2.4271 if cp<=0.08179659247398377\n",
      "   +2.1034 if cp<=0.06456989496946335 & cv<=0.46514596939086916\n",
      "Run episode 420 with rewards 10.0\n",
      "============ 421 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -5.2228 if cp>=0.03713083826005459\n",
      "   +0.0000 if cp>=0.0839681327342987\n",
      "   -1.2536 if cp<=0.12150578498840332\n",
      "   +1.5134 if cp<=0.06456989496946335 & cv>=0.46514596939086916\n",
      "   -4.6426 if cp>=-0.011187520809471607 & cv>=0.48689550161361694\n",
      "--------------\n",
      "   -0.1140 if cv>=0.1896238148212433 & pa<=0.03044209927320481\n",
      "   +0.2751 if \n",
      "   +0.2751 if cp<=0.08179659247398377\n",
      "   +1.0367 if cp<=0.06456989496946335 & cv<=0.46514596939086916\n",
      "   -2.7802 if cp<=-0.011187520809471607\n",
      "Run episode 421 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 422 ===========\n",
      "33 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +6.2885 if cp>=0.03713083826005459\n",
      "   -0.8331 if cp<=0.12150578498840332\n",
      "   -6.1724 if cp<=0.06456989496946335 & cv>=0.46514596939086916\n",
      "   +4.7125 if cp>=-0.011187520809471607 & cv>=0.48689550161361694\n",
      "   +3.8569 if cp>=0.11627332121133804\n",
      "--------------\n",
      "   +0.8983 if \n",
      "   +0.8984 if cp<=0.08179659247398377\n",
      "   +0.8535 if cp<=0.06456989496946335 & cv<=0.46514596939086916\n",
      "   +0.0000 if cp<=-0.011187520809471607\n",
      "   +0.5223 if cp<=0.010753399692475796\n",
      "Run episode 422 with rewards 33.0\n",
      "============ 423 ===========\n",
      "50 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.1955 if cp>=0.03713083826005459\n",
      "   -1.5748 if cp<=0.06456989496946335 & cv>=0.46514596939086916\n",
      "   +1.8078 if cp>=-0.011187520809471607 & cv>=0.48689550161361694\n",
      "   -0.0000 if cp>=0.11627332121133804\n",
      "   +4.9354 if pa<=0.02632100582122803\n",
      "--------------\n",
      "   +0.0610 if \n",
      "   +0.6754 if cp<=0.08179659247398377\n",
      "   +1.8064 if cp<=0.06456989496946335 & cv<=0.46514596939086916\n",
      "   +1.3397 if cp<=0.010753399692475796\n",
      "   +5.2667 if cp<=0.08584630489349365 & cv<=-0.5616021156311035 & pa<=0.05126389190554619 & pa>=0.02632100582122803\n",
      "Run episode 423 with rewards 50.0\n",
      "============ 424 ===========\n",
      "41 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +1.6988 if cp>=0.03713083826005459\n",
      "   -2.3188 if cp<=0.06456989496946335 & cv>=0.46514596939086916\n",
      "   +1.8340 if cp>=-0.011187520809471607 & cv>=0.48689550161361694\n",
      "   +6.6433 if pa<=0.02632100582122803\n",
      "   +3.5835 if cv>=1.1551240682601929\n",
      "--------------\n",
      "   +1.3941 if cp<=0.08179659247398377\n",
      "   +0.4144 if cp<=0.06456989496946335 & cv<=0.46514596939086916\n",
      "   +3.9955 if cp<=0.010753399692475796\n",
      "   +3.5297 if cp<=0.08584630489349365 & cv<=-0.5616021156311035 & pa<=0.05126389190554619 & pa>=0.02632100582122803\n",
      "   -3.5377 if cv>=1.1551240682601929\n",
      "Run episode 424 with rewards 41.0\n",
      "============ 425 ===========\n",
      "37 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   -4.5920 if cp<=0.06456989496946335 & cv>=0.46514596939086916\n",
      "   +3.3059 if cp>=-0.011187520809471607 & cv>=0.48689550161361694\n",
      "   +8.7613 if pa<=0.02632100582122803\n",
      "   +8.3685 if cv>=1.1551240682601929\n",
      "   -2.2731 if cp>=-0.041792836040258345\n",
      "--------------\n",
      "   +0.0170 if cp<=0.08179659247398377\n",
      "   +3.7309 if cp<=0.010753399692475796\n",
      "   +0.8863 if cp<=0.08584630489349365 & cv<=-0.5616021156311035 & pa<=0.05126389190554619 & pa>=0.02632100582122803\n",
      "   -5.0186 if cv>=1.1551240682601929\n",
      "   +3.3510 if cp>=-0.07359480112791061 & cv>=0.7799454927444458\n",
      "Run episode 425 with rewards 37.0\n",
      "============ 426 ===========\n",
      "38 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   -0.1958 if cp<=0.06456989496946335 & cv>=0.46514596939086916\n",
      "   +1.4477 if cp>=-0.011187520809471607 & cv>=0.48689550161361694\n",
      "   +7.3403 if pa<=0.02632100582122803\n",
      "   -0.4662 if cv>=1.1551240682601929\n",
      "   -1.3205 if cv>=-0.5029662370681762\n",
      "--------------\n",
      "   +2.3294 if cp<=0.010753399692475796\n",
      "   +0.4995 if cp<=0.08584630489349365 & cv<=-0.5616021156311035 & pa<=0.05126389190554619 & pa>=0.02632100582122803\n",
      "   +1.6583 if cv>=1.1551240682601929\n",
      "   +0.9775 if cp>=-0.07359480112791061 & cv>=0.7799454927444458\n",
      "   +2.8724 if pa>=0.05105633437633516\n",
      "Run episode 426 with rewards 38.0\n",
      "============ 427 ===========\n",
      "22 actions [0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1]\n",
      "   +0.3468 if cp>=-0.011187520809471607 & cv>=0.48689550161361694\n",
      "   +6.1759 if pa<=0.02632100582122803\n",
      "   -0.1970 if cv>=1.1551240682601929\n",
      "   -0.2530 if cv>=-0.5029662370681762\n",
      "   -0.3329 if cv<=0.7657540440559387 & pa<=0.038968174159526844\n",
      "--------------\n",
      "   +6.3702 if cp<=0.010753399692475796\n",
      "   +1.1829 if cv>=1.1551240682601929\n",
      "   +1.3445 if cp>=-0.07359480112791061 & cv>=0.7799454927444458\n",
      "   -2.4903 if pa>=0.05105633437633516\n",
      "   +0.1276 if cp<=0.025987823680043223 & cv<=-0.8969947218894958 & pa<=0.038968174159526844\n",
      "Run episode 427 with rewards 22.0\n",
      "============ 428 ===========\n",
      "25 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +1.3251 if cp>=-0.011187520809471607 & cv>=0.48689550161361694\n",
      "   +2.8363 if pa<=0.02632100582122803\n",
      "   +0.7750 if cv>=-0.5029662370681762\n",
      "   -2.2273 if cv<=0.7657540440559387 & pa<=0.038968174159526844\n",
      "   +2.4260 if pa<=0.04479966461658478\n",
      "--------------\n",
      "   +4.9816 if cp<=0.010753399692475796\n",
      "   -0.0000 if cv>=1.1551240682601929\n",
      "   -0.0000 if cp>=-0.07359480112791061 & cv>=0.7799454927444458\n",
      "   -1.3160 if pa>=0.05105633437633516\n",
      "   -3.6935 if cp<=0.022423011437058455 & pa<=0.04479966461658478\n",
      "Run episode 428 with rewards 25.0\n",
      "============ 429 ===========\n",
      "22 actions [0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   -0.1214 if cp>=-0.011187520809471607 & cv>=0.48689550161361694\n",
      "   +1.7510 if pa<=0.02632100582122803\n",
      "   +2.9570 if cv<=0.7657540440559387 & pa<=0.038968174159526844\n",
      "   +1.4972 if pa<=0.04479966461658478\n",
      "   -3.0994 if cp<=0.007324641756713402 & pa<=0.056019283831119544\n",
      "--------------\n",
      "   +0.3693 if cp<=0.010753399692475796\n",
      "   -0.0674 if cp>=-0.07359480112791061 & cv>=0.7799454927444458\n",
      "   +0.2167 if pa>=0.05105633437633516\n",
      "   -1.6780 if cp<=0.022423011437058455 & pa<=0.04479966461658478\n",
      "   +6.1694 if cp<=0.007324641756713402\n",
      "Run episode 429 with rewards 22.0\n",
      "============ 430 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.1969 if pa<=0.02632100582122803\n",
      "   +0.2116 if cv<=0.7657540440559387 & pa<=0.038968174159526844\n",
      "   +6.4087 if pa<=0.04479966461658478\n",
      "   +0.0000 if cp<=0.007324641756713402 & pa<=0.056019283831119544\n",
      "   -3.2439 if cp<=0.04509247839450836 & cv>=-0.9345631122589111\n",
      "--------------\n",
      "   -6.5536 if cp<=0.010753399692475796\n",
      "   +0.0576 if pa>=0.05105633437633516\n",
      "   -2.0688 if cp<=0.022423011437058455 & pa<=0.04479966461658478\n",
      "  -13.7046 if cp<=0.007324641756713402\n",
      "   +2.3939 if cp<=0.03274640068411827\n",
      "Run episode 430 with rewards 9.0\n",
      "============ 431 ===========\n",
      "15 actions [1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0]\n",
      "   +0.0000 if pa<=0.02632100582122803\n",
      "   +0.0000 if cv<=0.7657540440559387 & pa<=0.038968174159526844\n",
      "   +0.0000 if pa<=0.04479966461658478\n",
      "   +0.0000 if cp<=0.04509247839450836 & cv>=-0.9345631122589111\n",
      "   +0.0000 if cp<=-0.08312169760465622\n",
      "--------------\n",
      "   -1.5305 if cp<=0.010753399692475796\n",
      "   -0.0229 if cp<=0.022423011437058455 & pa<=0.04479966461658478\n",
      "   -1.5305 if cp<=0.007324641756713402\n",
      "   -1.5305 if cp<=0.03274640068411827\n",
      "   +0.1776 if cp<=-0.08312169760465622\n",
      "Run episode 431 with rewards 15.0\n",
      "============ 432 ===========\n",
      "15 actions [0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1]\n",
      "   -0.6771 if pa<=0.02632100582122803\n",
      "   +1.2196 if cv<=0.7657540440559387 & pa<=0.038968174159526844\n",
      "   -0.6771 if pa<=0.04479966461658478\n",
      "   +0.0000 if cp<=0.04509247839450836 & cv>=-0.9345631122589111\n",
      "   -3.2283 if pa<=0.017547349631786346 & pa>=0.01215519066900015\n",
      "--------------\n",
      "   -0.0000 if cp<=0.010753399692475796\n",
      "   -0.0000 if cp<=0.007324641756713402\n",
      "   -0.0000 if cp<=0.03274640068411827\n",
      "   +0.0000 if cp<=-0.08312169760465622\n",
      "   +3.3306 if pa<=0.017547349631786346 & pa>=0.01215519066900015\n",
      "Run episode 432 with rewards 15.0\n",
      "============ 433 ===========\n",
      "32 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.7529 if pa<=0.02632100582122803\n",
      "   +0.2588 if cv<=0.7657540440559387 & pa<=0.038968174159526844\n",
      "   +2.2994 if pa<=0.04479966461658478\n",
      "   -2.0038 if pa<=0.017547349631786346 & pa>=0.01215519066900015\n",
      "   +3.7448 if cp>=0.024964621663093576\n",
      "--------------\n",
      "   +0.3901 if cp<=0.010753399692475796\n",
      "   +0.3901 if cp<=0.007324641756713402\n",
      "   -0.7405 if cp<=0.03274640068411827\n",
      "   +0.9453 if pa<=0.017547349631786346 & pa>=0.01215519066900015\n",
      "   -3.2791 if cp>=0.024964621663093576 & cv>=-0.24089364409446717\n",
      "Run episode 433 with rewards 32.0\n",
      "============ 434 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -1.9528 if pa<=0.02632100582122803\n",
      "   -1.9528 if pa<=0.04479966461658478\n",
      "   -0.0000 if pa<=0.017547349631786346 & pa>=0.01215519066900015\n",
      "   +7.2554 if cp>=0.024964621663093576\n",
      "   +3.0565 if cp<=-0.03214512392878532\n",
      "--------------\n",
      "   -0.3409 if cp<=0.007324641756713402\n",
      "   +2.0171 if cp<=0.03274640068411827\n",
      "   +0.0000 if pa<=0.017547349631786346 & pa>=0.01215519066900015\n",
      "   -3.2289 if cp>=0.024964621663093576 & cv>=-0.24089364409446717\n",
      "   -4.7248 if cp<=-0.03214512392878532 & cp>=-0.0874237984418869 & cv<=-0.33078291416168204 & cv>=-0.6083286881446839 & pa<=-0.06490335911512375\n",
      "Run episode 434 with rewards 8.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 435 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -4.8218 if pa<=0.02632100582122803\n",
      "   -4.8218 if pa<=0.04479966461658478\n",
      "   -8.8710 if cp>=0.024964621663093576\n",
      "   +0.0336 if cp<=-0.03214512392878532\n",
      "   -0.4233 if cp>=0.0445467010140419\n",
      "--------------\n",
      "   +0.9847 if cp<=0.007324641756713402\n",
      "   +0.9584 if cp<=0.03274640068411827\n",
      "   +7.6518 if cp>=0.024964621663093576 & cv>=-0.24089364409446717\n",
      "   -0.0000 if cp<=-0.03214512392878532 & cp>=-0.0874237984418869 & cv<=-0.33078291416168204 & cv>=-0.6083286881446839 & pa<=-0.06490335911512375\n",
      "   +0.9031 if cp<=-0.031632077693939206\n",
      "Run episode 435 with rewards 10.0\n",
      "============ 436 ===========\n",
      "12 actions [1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1]\n",
      "   -1.3067 if pa<=0.02632100582122803\n",
      "   -1.3067 if pa<=0.04479966461658478\n",
      "   +0.0002 if cp>=0.024964621663093576\n",
      "   +0.0004 if cp>=0.0445467010140419\n",
      "   -0.3612 if cp<=0.0015970207750797272\n",
      "--------------\n",
      "   +0.0045 if cp<=0.007324641756713402\n",
      "   +0.0062 if cp<=0.03274640068411827\n",
      "   -0.0000 if cp>=0.024964621663093576 & cv>=-0.24089364409446717\n",
      "   +0.0000 if cp<=-0.031632077693939206\n",
      "   +0.0032 if cp<=0.0015970207750797272\n",
      "Run episode 436 with rewards 12.0\n",
      "============ 437 ===========\n",
      "11 actions [1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -1.6566 if pa<=0.02632100582122803\n",
      "   -1.6566 if pa<=0.04479966461658478\n",
      "   +0.5130 if cp>=0.0445467010140419\n",
      "   -0.0000 if cp<=0.0015970207750797272\n",
      "   +4.1103 if cv>=0.5864701390266418\n",
      "--------------\n",
      "   -0.0000 if cp<=0.007324641756713402\n",
      "   -0.0000 if cp<=0.03274640068411827\n",
      "   -3.3695 if cp>=0.024964621663093576 & cv>=-0.24089364409446717\n",
      "   -0.0000 if cp<=0.0015970207750797272\n",
      "   +4.1293 if cv<=0.5864701390266418\n",
      "Run episode 437 with rewards 11.0\n",
      "============ 438 ===========\n",
      "12 actions [1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -0.3267 if pa<=0.02632100582122803\n",
      "   -0.3267 if pa<=0.04479966461658478\n",
      "   +0.2502 if cp>=0.0445467010140419\n",
      "   +1.9748 if cv>=0.5864701390266418\n",
      "   +0.5499 if cp<=-0.00035830060369335115\n",
      "--------------\n",
      "   -0.2840 if cp<=0.007324641756713402\n",
      "   -1.1356 if cp<=0.03274640068411827\n",
      "   -0.0596 if cp>=0.024964621663093576 & cv>=-0.24089364409446717\n",
      "   +1.2867 if cv<=0.5864701390266418\n",
      "   +1.2481 if cv<=0.5487783551216125\n",
      "Run episode 438 with rewards 12.0\n",
      "============ 439 ===========\n",
      "14 actions [1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1]\n",
      "   -1.0267 if pa<=0.02632100582122803\n",
      "   -1.0267 if pa<=0.04479966461658478\n",
      "   +3.1548 if cv>=0.5864701390266418\n",
      "   -0.2062 if cp<=-0.00035830060369335115\n",
      "   -0.1571 if cv<=0.5156859278678897 & cv>=0.3989398777484894\n",
      "--------------\n",
      "   +0.0045 if cp<=0.007324641756713402\n",
      "   -0.9355 if cp<=0.03274640068411827\n",
      "   +2.3258 if cv<=0.5864701390266418\n",
      "   +2.3258 if cv<=0.5487783551216125\n",
      "   +0.0735 if cv<=0.5935626864433289\n",
      "Run episode 439 with rewards 14.0\n",
      "============ 440 ===========\n",
      "11 actions [1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -0.4017 if pa<=0.02632100582122803\n",
      "   -1.1478 if pa<=0.04479966461658478\n",
      "   +1.5648 if cv>=0.5864701390266418\n",
      "   -0.0000 if cp<=-0.00035830060369335115\n",
      "   +2.3574 if cp<=0.07351673096418382 & cv>=0.7292433738708497\n",
      "--------------\n",
      "   +0.0113 if cp<=0.03274640068411827\n",
      "   +1.3969 if cv<=0.5864701390266418\n",
      "   +0.9100 if cv<=0.5487783551216125\n",
      "   +1.3969 if cv<=0.5935626864433289\n",
      "   -1.9299 if cp<=0.07351673096418382 & cv>=0.7292433738708497\n",
      "Run episode 440 with rewards 11.0\n",
      "============ 441 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.9834 if pa<=0.02632100582122803\n",
      "   -2.9834 if pa<=0.04479966461658478\n",
      "   -0.1646 if cv>=0.5864701390266418\n",
      "   -0.1076 if cp<=0.07351673096418382 & cv>=0.7292433738708497\n",
      "   +6.2003 if pa>=-0.04299029335379599\n",
      "--------------\n",
      "   +0.9965 if cv<=0.5864701390266418\n",
      "   +0.9965 if cv<=0.5487783551216125\n",
      "   +0.9965 if cv<=0.5935626864433289\n",
      "   +2.9349 if cp<=0.07351673096418382 & cv>=0.7292433738708497\n",
      "   -2.0637 if cv>=0.6093803644180298 & pa>=-0.04299029335379599\n",
      "Run episode 441 with rewards 9.0\n",
      "============ 442 ===========\n",
      "54 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +0.2672 if pa<=0.02632100582122803\n",
      "   +0.2672 if pa<=0.04479966461658478\n",
      "   +3.3133 if cv>=0.5864701390266418\n",
      "   -3.0461 if pa>=-0.04299029335379599\n",
      "  +10.8363 if cp>=0.0032348557375371564\n",
      "--------------\n",
      "   +1.2137 if cv<=0.5487783551216125\n",
      "   +2.4352 if cv<=0.5935626864433289\n",
      "   +0.0134 if cp<=0.07351673096418382 & cv>=0.7292433738708497\n",
      "   +0.0000 if cv>=0.6093803644180298 & pa>=-0.04299029335379599\n",
      "   +0.6973 if cp<=-0.02951752170920372\n",
      "Run episode 442 with rewards 54.0\n",
      "============ 443 ===========\n",
      "72 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0]\n",
      "   -0.8839 if pa<=0.04479966461658478\n",
      "   +1.6162 if cv>=0.5864701390266418\n",
      "   -0.2747 if pa>=-0.04299029335379599\n",
      "   +9.6610 if cp>=0.0032348557375371564\n",
      "   +3.9098 if cp<=0.016211983934044844 & cp>=-0.016528677940368653 & cv>=0.417055767774582\n",
      "--------------\n",
      "   +3.0452 if cv<=0.5487783551216125\n",
      "   +3.0452 if cv<=0.5935626864433289\n",
      "   -0.6271 if cp<=0.07351673096418382 & cv>=0.7292433738708497\n",
      "   +0.2655 if cp<=-0.02951752170920372\n",
      "   -2.9848 if cp>=-0.016528677940368653\n",
      "Run episode 443 with rewards 72.0\n",
      "============ 444 ===========\n",
      "32 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0]\n",
      "   -1.8039 if pa<=0.04479966461658478\n",
      "   +3.5982 if cv>=0.5864701390266418\n",
      "  +10.3276 if cp>=0.0032348557375371564\n",
      "   +2.1555 if cp<=0.016211983934044844 & cp>=-0.016528677940368653 & cv>=0.417055767774582\n",
      "   -4.4843 if cp>=-0.03621840476989745 & cv>=0.5433438420295715 & pa<=0.01998873390257361 & pa>=-0.027186436206102366\n",
      "--------------\n",
      "   +3.9716 if cv<=0.5487783551216125\n",
      "   +3.9716 if cv<=0.5935626864433289\n",
      "   +1.3124 if cp<=0.07351673096418382 & cv>=0.7292433738708497\n",
      "   -3.5985 if cp>=-0.016528677940368653\n",
      "   -2.6430 if cv>=-0.6327137351036072 & pa>=0.01998873390257361\n",
      "Run episode 444 with rewards 32.0\n",
      "============ 445 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0]\n",
      "   +2.0800 if cv>=0.5864701390266418\n",
      "   +8.4259 if cp>=0.0032348557375371564\n",
      "   -3.0527 if cp<=0.016211983934044844 & cp>=-0.016528677940368653 & cv>=0.417055767774582\n",
      "   -3.7049 if cp>=-0.03621840476989745 & cv>=0.5433438420295715 & pa<=0.01998873390257361 & pa>=-0.027186436206102366\n",
      "   +2.1427 if cv>=0.9249119758605957\n",
      "--------------\n",
      "   -0.7407 if cv<=0.5487783551216125\n",
      "   +4.6444 if cv<=0.5935626864433289\n",
      "   +0.2967 if cp>=-0.016528677940368653\n",
      "   +0.8453 if cv>=-0.6327137351036072 & pa>=0.01998873390257361\n",
      "   -0.6661 if cv<=0.5559707403182983\n",
      "Run episode 445 with rewards 12.0\n",
      "============ 446 ===========\n",
      "49 actions [0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1]\n",
      "   +6.5350 if cp>=0.0032348557375371564\n",
      "   -0.0000 if cp<=0.016211983934044844 & cp>=-0.016528677940368653 & cv>=0.417055767774582\n",
      "   -0.0000 if cp>=-0.03621840476989745 & cv>=0.5433438420295715 & pa<=0.01998873390257361 & pa>=-0.027186436206102366\n",
      "   -0.0000 if cv>=0.9249119758605957\n",
      "   -2.5647 if pa>=0.20913422107696533\n",
      "--------------\n",
      "   +1.3249 if cv<=0.5487783551216125\n",
      "   +1.3249 if cv<=0.5935626864433289\n",
      "   +2.5725 if cv>=-0.6327137351036072 & pa>=0.01998873390257361\n",
      "   +1.3249 if cv<=0.5559707403182983\n",
      "   +2.5716 if pa>=0.20913422107696533\n",
      "Run episode 446 with rewards 49.0\n",
      "============ 447 ===========\n",
      "26 actions [0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +7.0405 if cp>=0.0032348557375371564\n",
      "   -0.1143 if cp<=0.016211983934044844 & cp>=-0.016528677940368653 & cv>=0.417055767774582\n",
      "   +0.0000 if cp>=-0.03621840476989745 & cv>=0.5433438420295715 & pa<=0.01998873390257361 & pa>=-0.027186436206102366\n",
      "   +0.0000 if pa>=0.20913422107696533\n",
      "   -5.6561 if cp<=0.04573825225234032 & cp>=-0.0010418455814942642 & cv<=-0.24821975827217102 & pa>=0.02413535751402378 & pa>=0.04427661895751953 & pav>=0.8056353807449341\n",
      "--------------\n",
      "   +1.8297 if cv<=0.5487783551216125\n",
      "   +1.5685 if cv>=-0.6327137351036072 & pa>=0.01998873390257361\n",
      "   +2.6756 if cv<=0.5559707403182983\n",
      "   -0.0000 if pa>=0.20913422107696533\n",
      "   +3.8281 if cp<=0.02085765451192857 & cv<=-0.24821975827217102 & pa<=0.04427661895751953\n",
      "Run episode 447 with rewards 26.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 448 ===========\n",
      "14 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0]\n",
      "   +7.1210 if cp>=0.0032348557375371564\n",
      "   -2.8373 if cp<=0.016211983934044844 & cp>=-0.016528677940368653 & cv>=0.417055767774582\n",
      "   -0.0000 if pa>=0.20913422107696533\n",
      "   -0.0000 if cp<=0.04573825225234032 & cp>=-0.0010418455814942642 & cv<=-0.24821975827217102 & pa>=0.02413535751402378 & pa>=0.04427661895751953 & pav>=0.8056353807449341\n",
      "   -4.7810 if cv<=-0.34424278140068054 & pa<=0.10854633897542953\n",
      "--------------\n",
      "   +3.3265 if cv<=0.5487783551216125\n",
      "   +2.5449 if cv>=-0.6327137351036072 & pa>=0.01998873390257361\n",
      "   +3.3265 if cv<=0.5559707403182983\n",
      "   -0.0000 if cp<=0.02085765451192857 & cv<=-0.24821975827217102 & pa<=0.04427661895751953\n",
      "   -2.4098 if cv<=0.41497159004211426\n",
      "Run episode 448 with rewards 14.0\n",
      "============ 449 ===========\n",
      "15 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1]\n",
      "   +2.9717 if cp>=0.0032348557375371564\n",
      "   -2.7043 if cp<=0.016211983934044844 & cp>=-0.016528677940368653 & cv>=0.417055767774582\n",
      "   +0.0000 if cp<=0.04573825225234032 & cp>=-0.0010418455814942642 & cv<=-0.24821975827217102 & pa>=0.02413535751402378 & pa>=0.04427661895751953 & pav>=0.8056353807449341\n",
      "   +0.0000 if cv<=-0.34424278140068054 & pa<=0.10854633897542953\n",
      "   -4.0734 if cp>=0.0911550223827362\n",
      "--------------\n",
      "   +1.8139 if cv<=0.5487783551216125\n",
      "   +0.1163 if cv>=-0.6327137351036072 & pa>=0.01998873390257361\n",
      "   +3.0552 if cv<=0.5559707403182983\n",
      "   +1.8139 if cv<=0.41497159004211426\n",
      "   +4.0609 if cp>=0.0911550223827362\n",
      "Run episode 449 with rewards 15.0\n",
      "============ 450 ===========\n",
      "30 actions [1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +5.3066 if cp>=0.0032348557375371564\n",
      "   -2.0798 if cp<=0.016211983934044844 & cp>=-0.016528677940368653 & cv>=0.417055767774582\n",
      "   -0.0000 if cv<=-0.34424278140068054 & pa<=0.10854633897542953\n",
      "   +7.8838 if cp>=0.0911550223827362\n",
      "   -2.4389 if cp<=0.017242443561553966 & cp>=-0.0256837323307991 & cv<=0.6304874897003174\n",
      "--------------\n",
      "   +0.8259 if cv<=0.5487783551216125\n",
      "   +0.8259 if cv<=0.5559707403182983\n",
      "   +1.9779 if cv<=0.41497159004211426\n",
      "   -7.8695 if cp>=0.0911550223827362\n",
      "   +1.4206 if cv<=0.8222731351852417\n",
      "Run episode 450 with rewards 30.0\n",
      "============ 451 ===========\n",
      "31 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +5.5371 if cp>=0.0032348557375371564\n",
      "   -2.2195 if cp<=0.016211983934044844 & cp>=-0.016528677940368653 & cv>=0.417055767774582\n",
      "   +0.0063 if cp>=0.0911550223827362\n",
      "   -3.3106 if cp<=0.017242443561553966 & cp>=-0.0256837323307991 & cv<=0.6304874897003174\n",
      "   +3.7762 if cp>=0.021721605956554434 & cv<=-0.11098241806030251 & pa<=0.13823647797107697\n",
      "--------------\n",
      "   +0.5544 if cv<=0.5559707403182983\n",
      "   +1.9306 if cv<=0.41497159004211426\n",
      "   -0.0067 if cp>=0.0911550223827362\n",
      "   +2.3823 if cv<=0.8222731351852417\n",
      "   -3.8138 if cp>=0.021721605956554434 & cv<=-0.11098241806030251 & pa<=0.10694646239280702\n",
      "Run episode 451 with rewards 31.0\n",
      "============ 452 ===========\n",
      "23 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0]\n",
      "   +5.5309 if cp>=0.0032348557375371564\n",
      "   +0.7274 if cp<=0.016211983934044844 & cp>=-0.016528677940368653 & cv>=0.417055767774582\n",
      "   -3.5731 if cp<=0.017242443561553966 & cp>=-0.0256837323307991 & cv<=0.6304874897003174\n",
      "   +0.9339 if cp>=0.021721605956554434 & cv<=-0.11098241806030251 & pa<=0.13823647797107697\n",
      "   -3.5871 if cp<=0.044689234346151366 & cv<=-0.5689799189567566 & pa<=0.04663300514221192 & pa>=0.008187416940927505\n",
      "--------------\n",
      "   +3.8069 if cv<=0.5559707403182983\n",
      "   +3.8069 if cv<=0.41497159004211426\n",
      "   +0.5093 if cv<=0.8222731351852417\n",
      "   -1.5811 if cp>=0.021721605956554434 & cv<=-0.11098241806030251 & pa<=0.10694646239280702\n",
      "   -3.7933 if pa<=0.008187416940927505\n",
      "Run episode 452 with rewards 23.0\n",
      "============ 453 ===========\n",
      "32 actions [0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +7.2014 if cp>=0.0032348557375371564\n",
      "   -2.5282 if cp<=0.017242443561553966 & cp>=-0.0256837323307991 & cv<=0.6304874897003174\n",
      "   +0.5026 if cp>=0.021721605956554434 & cv<=-0.11098241806030251 & pa<=0.13823647797107697\n",
      "   +0.0000 if cp<=0.044689234346151366 & cv<=-0.5689799189567566 & pa<=0.04663300514221192 & pa>=0.008187416940927505\n",
      "   -2.5784 if pav>=0.8101928234100342\n",
      "--------------\n",
      "   +1.7315 if cv<=0.5559707403182983\n",
      "   +1.4943 if cv<=0.41497159004211426\n",
      "   -0.3339 if cp>=0.021721605956554434 & cv<=-0.11098241806030251 & pa<=0.10694646239280702\n",
      "   -1.7937 if pa<=0.008187416940927505\n",
      "   +2.7068 if pav>=0.8101928234100342\n",
      "Run episode 453 with rewards 32.0\n",
      "============ 454 ===========\n",
      "35 actions [1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1]\n",
      "   +8.4547 if cp>=0.0032348557375371564\n",
      "   -4.7300 if cp<=0.017242443561553966 & cp>=-0.0256837323307991 & cv<=0.6304874897003174\n",
      "   +0.9166 if cp>=0.021721605956554434 & cv<=-0.11098241806030251 & pa<=0.13823647797107697\n",
      "   -2.1378 if pav>=0.8101928234100342\n",
      "   -3.4819 if cp>=0.011691604182124138\n",
      "--------------\n",
      "   +2.8278 if cv<=0.5559707403182983\n",
      "   +2.8278 if cv<=0.41497159004211426\n",
      "   -1.1845 if pa<=0.008187416940927505\n",
      "   +0.9882 if pav>=0.8101928234100342\n",
      "   -2.1885 if cv<=0.192336043715477 & cv>=-0.39261813163757325\n",
      "Run episode 454 with rewards 35.0\n",
      "============ 455 ===========\n",
      "27 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0]\n",
      "   +7.3846 if cp>=0.0032348557375371564\n",
      "   -3.2680 if cp<=0.017242443561553966 & cp>=-0.0256837323307991 & cv<=0.6304874897003174\n",
      "   -1.0032 if pav>=0.8101928234100342\n",
      "   -1.6412 if cp>=0.011691604182124138\n",
      "   +2.8445 if pa>=-0.04019965007901192 & pav<=-0.7331143379211426\n",
      "--------------\n",
      "   +4.8086 if cv<=0.5559707403182983\n",
      "   +2.9933 if cv<=0.41497159004211426\n",
      "   -3.2849 if pa<=0.008187416940927505\n",
      "   -3.2001 if cv<=0.192336043715477 & cv>=-0.39261813163757325\n",
      "   -2.7458 if cv>=0.24392422139644623 & pav>=-0.4994829118251799\n",
      "Run episode 455 with rewards 27.0\n",
      "============ 456 ===========\n",
      "48 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0]\n",
      "   +4.1448 if cp>=0.0032348557375371564\n",
      "   -5.6782 if cp<=0.017242443561553966 & cp>=-0.0256837323307991 & cv<=0.6304874897003174\n",
      "   +4.2254 if cp>=0.011691604182124138\n",
      "   +0.0000 if pa>=-0.04019965007901192 & pav<=-0.7331143379211426\n",
      "   -2.2067 if cp<=-0.034141418710350986 & pa>=-0.030271454155445097\n",
      "--------------\n",
      "   +3.1350 if cv<=0.5559707403182983\n",
      "   +0.6339 if cv<=0.41497159004211426\n",
      "   -1.4672 if pa<=0.008187416940927505\n",
      "   +0.2298 if cv<=0.192336043715477 & cv>=-0.39261813163757325\n",
      "   +3.1144 if pav>=1.164414405822754\n",
      "Run episode 456 with rewards 48.0\n",
      "============ 457 ===========\n",
      "22 actions [0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.0914 if cp>=0.0032348557375371564\n",
      "   -6.3737 if cp<=0.017242443561553966 & cp>=-0.0256837323307991 & cv<=0.6304874897003174\n",
      "   +3.9221 if cp>=0.011691604182124138\n",
      "   -3.1947 if cp<=-0.034141418710350986 & pa>=-0.030271454155445097\n",
      "   +1.7850 if cp>=-0.023651875555515286\n",
      "--------------\n",
      "   +4.3317 if cv<=0.5559707403182983\n",
      "   +0.6726 if cv<=0.41497159004211426\n",
      "   -3.5772 if pa<=0.008187416940927505\n",
      "   +0.0682 if pav>=1.164414405822754\n",
      "   +2.6447 if cp<=0.0013343197293579612 & cp>=-0.04303167387843132 & pa<=0.008624317310750501 & pav<=0.4660482048988343 & pav>=-0.9894907593727111\n",
      "Run episode 457 with rewards 22.0\n",
      "============ 458 ===========\n",
      "24 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +2.9164 if cp>=0.0032348557375371564\n",
      "   -5.4354 if cp<=0.017242443561553966 & cp>=-0.0256837323307991 & cv<=0.6304874897003174\n",
      "   +5.0143 if cp>=0.011691604182124138\n",
      "   +0.0000 if cp<=-0.034141418710350986 & pa>=-0.030271454155445097\n",
      "   -2.9221 if cv<=-0.17943775355815886 & pa<=0.07523108720779419\n",
      "--------------\n",
      "   +2.1608 if cv<=0.5559707403182983\n",
      "   +2.1608 if cv<=0.41497159004211426\n",
      "   -0.0000 if pa<=0.008187416940927505\n",
      "   -0.0000 if cp<=0.0013343197293579612 & cp>=-0.04303167387843132 & pa<=0.008624317310750501 & pav<=0.4660482048988343 & pav>=-0.9894907593727111\n",
      "   +3.2349 if cv<=0.018164076656103152\n",
      "Run episode 458 with rewards 24.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 459 ===========\n",
      "41 actions [1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0]\n",
      "   +2.2663 if cp>=0.0032348557375371564\n",
      "   -2.7492 if cp<=0.017242443561553966 & cp>=-0.0256837323307991 & cv<=0.6304874897003174\n",
      "   +5.2601 if cp>=0.011691604182124138\n",
      "   +2.0874 if cv<=-0.17943775355815886 & pa<=0.07523108720779419\n",
      "   -4.4852 if pa<=0.06382297724485397 & pav>=0.6960279107093812\n",
      "--------------\n",
      "   +1.9983 if cv<=0.5559707403182983\n",
      "   +1.6325 if cv<=0.41497159004211426\n",
      "   +0.0000 if pa<=0.008187416940927505\n",
      "   +4.2883 if cv<=0.018164076656103152\n",
      "   -5.2424 if cv<=-0.16757909953594208 & cv<=0.03295904062688351 & pa<=0.06382297724485397 & pav<=0.6960279107093812\n",
      "Run episode 459 with rewards 41.0\n",
      "============ 460 ===========\n",
      "28 actions [1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1]\n",
      "   +1.3699 if cp>=0.0032348557375371564\n",
      "   -1.1539 if cp<=0.017242443561553966 & cp>=-0.0256837323307991 & cv<=0.6304874897003174\n",
      "   +4.4477 if cp>=0.011691604182124138\n",
      "   -1.9901 if pa<=0.06382297724485397 & pav>=0.6960279107093812\n",
      "   +4.7646 if cp>=0.05950666964054108\n",
      "--------------\n",
      "   +2.7342 if cv<=0.5559707403182983\n",
      "   +2.7342 if cv<=0.41497159004211426\n",
      "   +4.0994 if cv<=0.018164076656103152\n",
      "   -3.8738 if cv<=-0.16757909953594208 & cv<=0.03295904062688351 & pa<=0.06382297724485397 & pav<=0.6960279107093812\n",
      "   -4.7156 if cp>=0.05950666964054108\n",
      "Run episode 460 with rewards 28.0\n",
      "============ 461 ===========\n",
      "22 actions [0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0]\n",
      "   +3.2286 if cp>=0.0032348557375371564\n",
      "   +3.2311 if cp>=0.011691604182124138\n",
      "   -0.0001 if pa<=0.06382297724485397 & pav>=0.6960279107093812\n",
      "   +1.7441 if cp>=0.05950666964054108\n",
      "   -4.0170 if cp>=0.028403618559241305 & cv<=-0.3610952258110046 & pa>=-0.11634602695703507\n",
      "--------------\n",
      "   +2.5507 if cv<=0.41497159004211426\n",
      "   +1.8966 if cv<=0.018164076656103152\n",
      "   +1.6169 if cv<=-0.16757909953594208 & cv<=0.03295904062688351 & pa<=0.06382297724485397 & pav<=0.6960279107093812\n",
      "   -0.5969 if cp>=0.05950666964054108\n",
      "   +5.5004 if cp>=0.028403618559241305 & cv<=0.2130426168441773 & pa>=-0.09084345400333403\n",
      "Run episode 461 with rewards 22.0\n",
      "============ 462 ===========\n",
      "34 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +2.5997 if cp>=0.0032348557375371564\n",
      "   +5.9303 if cp>=0.011691604182124138\n",
      "   +0.0000 if cp>=0.05950666964054108\n",
      "   +0.0000 if cp>=0.028403618559241305 & cv<=-0.3610952258110046 & pa>=-0.11634602695703507\n",
      "   +4.3883 if cp>=-0.00985839832574129 & cv<=-0.020345222577452658 & cv>=-0.21598108112812042 & pa>=-0.07890328615903854\n",
      "--------------\n",
      "   +2.9955 if cv<=0.41497159004211426\n",
      "   -3.4601 if cv<=0.018164076656103152\n",
      "   +4.5290 if cv<=-0.16757909953594208 & cv<=0.03295904062688351 & pa<=0.06382297724485397 & pav<=0.6960279107093812\n",
      "   +0.0000 if cp>=0.028403618559241305 & cv<=0.2130426168441773 & pa>=-0.09084345400333403\n",
      "   +3.2277 if pa>=-0.043268293142318726\n",
      "Run episode 462 with rewards 34.0\n",
      "============ 463 ===========\n",
      "25 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +5.2510 if cp>=0.0032348557375371564\n",
      "   +5.2510 if cp>=0.011691604182124138\n",
      "   +2.0696 if cp>=0.028403618559241305 & cv<=-0.3610952258110046 & pa>=-0.11634602695703507\n",
      "   +2.0985 if cp>=-0.00985839832574129 & cv<=-0.020345222577452658 & cv>=-0.21598108112812042 & pa>=-0.07890328615903854\n",
      "   -1.5900 if \n",
      "--------------\n",
      "   +0.8278 if cv<=0.41497159004211426\n",
      "   +0.4480 if cv<=0.018164076656103152\n",
      "   -0.3759 if cv<=-0.16757909953594208 & cv<=0.03295904062688351 & pa<=0.06382297724485397 & pav<=0.6960279107093812\n",
      "   +2.2051 if pa>=-0.043268293142318726\n",
      "   +2.6718 if cv>=-0.7817498922348023 & pa>=0.05621699318289764\n",
      "Run episode 463 with rewards 25.0\n",
      "============ 464 ===========\n",
      "58 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0]\n",
      "   -0.9725 if cp>=0.0032348557375371564\n",
      "   -0.8365 if cp>=0.011691604182124138\n",
      "   +1.2635 if cp>=0.028403618559241305 & cv<=-0.3610952258110046 & pa>=-0.11634602695703507\n",
      "   +1.1693 if cp>=-0.00985839832574129 & cv<=-0.020345222577452658 & cv>=-0.21598108112812042 & pa>=-0.07890328615903854\n",
      "   +9.3194 if cp>=0.024442286789417268\n",
      "--------------\n",
      "   +3.8124 if cv<=0.41497159004211426\n",
      "   +4.0779 if cv<=0.018164076656103152\n",
      "   +5.5809 if pa>=-0.043268293142318726\n",
      "   +0.9393 if cv>=-0.7817498922348023 & pa>=0.05621699318289764\n",
      "   -6.5044 if cp>=0.024442286789417268\n",
      "Run episode 464 with rewards 58.0\n",
      "============ 465 ===========\n",
      "55 actions [0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0]\n",
      "   +1.6987 if cp>=0.0032348557375371564\n",
      "   -1.2305 if cp>=0.028403618559241305 & cv<=-0.3610952258110046 & pa>=-0.11634602695703507\n",
      "   +2.6707 if cp>=-0.00985839832574129 & cv<=-0.020345222577452658 & cv>=-0.21598108112812042 & pa>=-0.07890328615903854\n",
      "   +6.9814 if cp>=0.024442286789417268\n",
      "   -4.9646 if cv<=-0.45395070910453794 & pav<=0.9214514017105103\n",
      "--------------\n",
      "   +2.2468 if cv<=0.41497159004211426\n",
      "   +1.9027 if cv<=0.018164076656103152\n",
      "   +4.2945 if pa>=-0.043268293142318726\n",
      "   -1.9066 if cp>=0.024442286789417268\n",
      "   +2.9370 if cp<=0.07895713150501252 & cv<=-0.23600178360939025 & pa<=0.010498513188213114\n",
      "Run episode 465 with rewards 55.0\n",
      "============ 466 ===========\n",
      "13 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.4618 if cp>=0.0032348557375371564\n",
      "   +3.1834 if cp>=-0.00985839832574129 & cv<=-0.020345222577452658 & cv>=-0.21598108112812042 & pa>=-0.07890328615903854\n",
      "   +6.1969 if cp>=0.024442286789417268\n",
      "   -4.9863 if cv<=-0.45395070910453794 & pav<=0.9214514017105103\n",
      "   -3.1216 if cv<=-0.3377564370632172 & pa>=-0.03464720025658605\n",
      "--------------\n",
      "   +3.3871 if cv<=0.41497159004211426\n",
      "   +7.5856 if pa>=-0.043268293142318726\n",
      "   -3.0978 if cp>=0.024442286789417268\n",
      "   +5.0138 if cp<=0.07895713150501252 & cv<=-0.23600178360939025 & pa<=0.010498513188213114\n",
      "   -2.0487 if cv>=-0.3377564370632172 & pa>=-0.0497795782983303\n",
      "Run episode 466 with rewards 13.0\n",
      "============ 467 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 0, 1, 1, 1, 1]\n",
      "   -0.0000 if cp>=-0.00985839832574129 & cv<=-0.020345222577452658 & cv>=-0.21598108112812042 & pa>=-0.07890328615903854\n",
      "   -0.5711 if cp>=0.024442286789417268\n",
      "   -0.0000 if cv<=-0.45395070910453794 & pav<=0.9214514017105103\n",
      "   -0.0000 if cv<=-0.3377564370632172 & pa>=-0.03464720025658605\n",
      "   -3.4754 if cp>=0.1212937980890274\n",
      "--------------\n",
      "   +1.0793 if cv<=0.41497159004211426\n",
      "   +3.3765 if pa>=-0.043268293142318726\n",
      "   -0.0247 if cp>=0.024442286789417268\n",
      "   -0.0000 if cp<=0.07895713150501252 & cv<=-0.23600178360939025 & pa<=0.010498513188213114\n",
      "   +0.8622 if cp>=0.013779091089963924\n",
      "Run episode 467 with rewards 10.0\n",
      "============ 468 ===========\n",
      "65 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.0000 if cp>=-0.00985839832574129 & cv<=-0.020345222577452658 & cv>=-0.21598108112812042 & pa>=-0.07890328615903854\n",
      "  +14.5240 if cp>=0.024442286789417268\n",
      "   +0.0000 if cv<=-0.45395070910453794 & pav<=0.9214514017105103\n",
      "   +0.4883 if cp>=0.1212937980890274\n",
      "   +1.0397 if cp>=0.08313257247209549\n",
      "--------------\n",
      "   +2.5427 if cv<=0.41497159004211426\n",
      "   +2.3529 if pa>=-0.043268293142318726\n",
      "   -9.9747 if cp>=0.024442286789417268\n",
      "   -8.3435 if cp>=0.013779091089963924\n",
      "   +1.0000 if cp>=0.08313257247209549\n",
      "Run episode 468 with rewards 65.0\n",
      "============ 469 ===========\n",
      "34 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +0.0009 if cp>=0.024442286789417268\n",
      "   -0.7685 if cv<=-0.45395070910453794 & pav<=0.9214514017105103\n",
      "   +0.0001 if cp>=0.1212937980890274\n",
      "   +0.0001 if cp>=0.08313257247209549\n",
      "   +2.6170 if cp>=-0.002485810266807661\n",
      "--------------\n",
      "   +4.0888 if cv<=0.41497159004211426\n",
      "   +2.3452 if pa>=-0.043268293142318726\n",
      "   -0.0000 if cp>=0.024442286789417268\n",
      "   -6.4020 if cp>=0.013779091089963924\n",
      "   -3.0945 if cp>=-0.002485810266807661\n",
      "Run episode 469 with rewards 34.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 470 ===========\n",
      "48 actions [0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0]\n",
      "   +0.0798 if cp>=0.024442286789417268\n",
      "   -3.1776 if cv<=-0.45395070910453794 & pav<=0.9214514017105103\n",
      "   +0.0000 if cp>=0.08313257247209549\n",
      "   +2.0351 if cp>=-0.002485810266807661\n",
      "   +3.7674 if cv<=-0.3942896962165833 & pa<=-0.06120980605483055 & pa>=-0.09238835722208023\n",
      "--------------\n",
      "   +3.4213 if cv<=0.41497159004211426\n",
      "   +1.7992 if pa>=-0.043268293142318726\n",
      "   -2.7866 if cp>=0.013779091089963924\n",
      "   -3.8190 if cp>=-0.002485810266807661\n",
      "   +5.0620 if cv<=-0.3942896962165833 & pa>=-0.05049029365181923\n",
      "Run episode 470 with rewards 48.0\n",
      "============ 471 ===========\n",
      "42 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0]\n",
      "   -0.0886 if cp>=0.024442286789417268\n",
      "   +0.0000 if cv<=-0.45395070910453794 & pav<=0.9214514017105103\n",
      "   +2.1882 if cp>=-0.002485810266807661\n",
      "   +0.0000 if cv<=-0.3942896962165833 & pa<=-0.06120980605483055 & pa>=-0.09238835722208023\n",
      "   -4.6336 if cp<=0.01298898439854384 & cp>=-0.003375707799568772 & pa<=0.06016263067722321 & pav>=0.343337655067444\n",
      "--------------\n",
      "   +4.5079 if cv<=0.41497159004211426\n",
      "   -2.5357 if cp>=0.013779091089963924\n",
      "   -3.4335 if cp>=-0.002485810266807661\n",
      "   +6.9113 if cv<=-0.3942896962165833 & pa>=-0.05049029365181923\n",
      "   +4.7771 if cp<=0.01298898439854384 & cp>=-0.003375707799568772 & pa<=0.06016263067722321 & pav>=0.343337655067444\n",
      "Run episode 471 with rewards 42.0\n",
      "origin 73.55210564877498 new 86.40176198955525 not updated\n",
      "============ 472 ===========\n",
      "42 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   +3.4287 if cp>=0.024442286789417268\n",
      "   +2.4293 if cp>=-0.002485810266807661\n",
      "   +1.7820 if cv<=-0.3942896962165833 & pa<=-0.06120980605483055 & pa>=-0.09238835722208023\n",
      "   -0.3350 if cp<=0.01298898439854384 & cp>=-0.003375707799568772 & pa<=0.06016263067722321 & pav>=0.343337655067444\n",
      "   -2.8829 if cp>=-0.009246001020073889\n",
      "--------------\n",
      "   +4.5079 if cv<=0.41497159004211426\n",
      "   -2.5357 if cp>=0.013779091089963924\n",
      "   -3.4335 if cp>=-0.002485810266807661\n",
      "   +6.9113 if cv<=-0.3942896962165833 & pa>=-0.05049029365181923\n",
      "   +4.7771 if cp<=0.01298898439854384 & cp>=-0.003375707799568772 & pa<=0.06016263067722321 & pav>=0.343337655067444\n",
      "Run episode 472 with rewards 42.0\n",
      "============ 473 ===========\n",
      "27 actions [1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +3.4231 if cp>=0.024442286789417268\n",
      "   +0.1553 if cp>=-0.002485810266807661\n",
      "   +0.3662 if cv<=-0.3942896962165833 & pa<=-0.06120980605483055 & pa>=-0.09238835722208023\n",
      "   -0.0109 if cp>=-0.009246001020073889\n",
      "   -3.7084 if cv<=0.4234041929244995 & cv>=0.2291816055774689 & pa>=-0.04833601415157315\n",
      "--------------\n",
      "   +4.2502 if cv<=0.41497159004211426\n",
      "   -5.5652 if cp>=-0.002485810266807661\n",
      "   +1.6863 if cv<=-0.3942896962165833 & pa>=-0.05049029365181923\n",
      "   +2.8539 if cp<=0.01298898439854384 & cp>=-0.003375707799568772 & pa<=0.06016263067722321 & pav>=0.343337655067444\n",
      "   +4.1238 if cp<=0.0052462389692664296 & cv<=0.4234041929244995 & cv>=0.2291816055774689 & pa>=-0.12948998510837553\n",
      "Run episode 473 with rewards 27.0\n",
      "============ 474 ===========\n",
      "47 actions [1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   -0.0000 if cp>=0.024442286789417268\n",
      "   -2.8616 if cp>=-0.002485810266807661\n",
      "   -0.0000 if cv<=-0.3942896962165833 & pa<=-0.06120980605483055 & pa>=-0.09238835722208023\n",
      "   -0.0150 if cv<=0.4234041929244995 & cv>=0.2291816055774689 & pa>=-0.04833601415157315\n",
      "   +4.0693 if cp>=0.00045164491748437316\n",
      "--------------\n",
      "   +5.8878 if cv<=0.41497159004211426\n",
      "   -4.7337 if cp>=-0.002485810266807661\n",
      "   +3.9977 if cp<=0.01298898439854384 & cp>=-0.003375707799568772 & pa<=0.06016263067722321 & pav>=0.343337655067444\n",
      "   +1.2014 if cp<=0.0052462389692664296 & cv<=0.4234041929244995 & cv>=0.2291816055774689 & pa>=-0.12948998510837553\n",
      "   -2.7665 if \n",
      "Run episode 474 with rewards 47.0\n",
      "============ 475 ===========\n",
      "23 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0]\n",
      "   +3.2409 if cp>=0.024442286789417268\n",
      "   -2.9340 if cp>=-0.002485810266807661\n",
      "   +0.8446 if cv<=0.4234041929244995 & cv>=0.2291816055774689 & pa>=-0.04833601415157315\n",
      "   +2.1880 if cp>=0.00045164491748437316\n",
      "   +3.7033 if cp>=0.011939553171396257 & cv>=0.18773728907108309 & pa<=0.03373017385601998\n",
      "--------------\n",
      "   +6.7115 if cv<=0.41497159004211426\n",
      "   -3.4671 if cp>=-0.002485810266807661\n",
      "   +4.5856 if cp<=0.01298898439854384 & cp>=-0.003375707799568772 & pa<=0.06016263067722321 & pav>=0.343337655067444\n",
      "   -3.3628 if \n",
      "   -3.4676 if cp>=0.011939553171396257 & cv>=0.18773728907108309 & pa<=0.03373017385601998\n",
      "Run episode 475 with rewards 23.0\n",
      "============ 476 ===========\n",
      "52 actions [1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1]\n",
      "   +3.3227 if cp>=0.024442286789417268\n",
      "   -1.3466 if cp>=-0.002485810266807661\n",
      "   +2.3191 if cp>=0.00045164491748437316\n",
      "   +0.0000 if cp>=0.011939553171396257 & cv>=0.18773728907108309 & pa<=0.03373017385601998\n",
      "   -3.5236 if pav>=1.525205135345459\n",
      "--------------\n",
      "   +3.6081 if cv<=0.41497159004211426\n",
      "   -4.5649 if cp>=-0.002485810266807661\n",
      "   +0.0000 if cp<=0.01298898439854384 & cp>=-0.003375707799568772 & pa<=0.06016263067722321 & pav>=0.343337655067444\n",
      "   +0.0000 if cp>=0.011939553171396257 & cv>=0.18773728907108309 & pa<=0.03373017385601998\n",
      "   +2.8663 if pav>=1.525205135345459\n",
      "Run episode 476 with rewards 52.0\n",
      "============ 477 ===========\n",
      "40 actions [1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +9.3984 if cp>=0.024442286789417268\n",
      "   +2.2837 if cp>=-0.002485810266807661\n",
      "   -2.2674 if cp>=0.00045164491748437316\n",
      "   +0.2377 if pav>=1.525205135345459\n",
      "   -3.5284 if cp<=-0.027068544179201126 & pav<=-0.47223123311996457\n",
      "--------------\n",
      "   +4.7065 if cv<=0.41497159004211426\n",
      "   -6.3289 if cp>=-0.002485810266807661\n",
      "   +0.1434 if cp<=0.01298898439854384 & cp>=-0.003375707799568772 & pa<=0.06016263067722321 & pav>=0.343337655067444\n",
      "   +0.6508 if pav>=1.525205135345459\n",
      "   +5.5666 if cp<=0.00892969742417338 & pa<=-0.0031828373670577986 & pav>=-0.1667665421962738 & pav>=0.3291012227535248\n",
      "Run episode 477 with rewards 40.0\n",
      "============ 478 ===========\n",
      "24 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0]\n",
      "   +3.7406 if cp>=0.024442286789417268\n",
      "   -0.3959 if cp>=-0.002485810266807661\n",
      "   -0.5082 if cp>=0.00045164491748437316\n",
      "   -0.8038 if cp<=-0.027068544179201126 & pav<=-0.47223123311996457\n",
      "   +3.8037 if cp>=-0.014802151545882224 & pa>=-0.09053615778684612 & pav<=-0.580714476108551 & pav>=-0.8724653482437134\n",
      "--------------\n",
      "   +5.1697 if cv<=0.41497159004211426\n",
      "   -4.8486 if cp>=-0.002485810266807661\n",
      "   -0.0000 if pav>=1.525205135345459\n",
      "   +4.0421 if cp<=0.00892969742417338 & pa<=-0.0031828373670577986 & pav>=-0.1667665421962738 & pav>=0.3291012227535248\n",
      "   -1.3996 if \n",
      "Run episode 478 with rewards 24.0\n",
      "============ 479 ===========\n",
      "21 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0]\n",
      "   +5.6815 if cp>=0.024442286789417268\n",
      "   -3.4214 if cp>=0.00045164491748437316\n",
      "   +0.0000 if cp<=-0.027068544179201126 & pav<=-0.47223123311996457\n",
      "   +5.9452 if cp>=-0.014802151545882224 & pa>=-0.09053615778684612 & pav<=-0.580714476108551 & pav>=-0.8724653482437134\n",
      "   +4.5625 if cp>=0.007366901822388175 & cv>=0.4098138093948364 & pa>=-0.10706463605165481\n",
      "--------------\n",
      "   +3.7275 if cv<=0.41497159004211426\n",
      "   -1.9642 if cp>=-0.002485810266807661\n",
      "   +1.4932 if cp<=0.00892969742417338 & pa<=-0.0031828373670577986 & pav>=-0.1667665421962738 & pav>=0.3291012227535248\n",
      "   -1.0769 if \n",
      "   -3.9647 if cv>=0.4098138093948364 & pa<=-0.07986893355846403 & pa>=-0.10706463605165481\n",
      "Run episode 479 with rewards 21.0\n",
      "============ 480 ===========\n",
      "41 actions [1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   +4.9547 if cp>=0.024442286789417268\n",
      "   -1.9310 if cp>=0.00045164491748437316\n",
      "   +2.4062 if cp>=-0.014802151545882224 & pa>=-0.09053615778684612 & pav<=-0.580714476108551 & pav>=-0.8724653482437134\n",
      "   +0.1685 if cp>=0.007366901822388175 & cv>=0.4098138093948364 & pa>=-0.10706463605165481\n",
      "   -3.8504 if pav>=0.3114900290966034\n",
      "--------------\n",
      "   +3.2223 if cv<=0.41497159004211426\n",
      "   -3.1551 if cp>=-0.002485810266807661\n",
      "   -0.0000 if cp<=0.00892969742417338 & pa<=-0.0031828373670577986 & pav>=-0.1667665421962738 & pav>=0.3291012227535248\n",
      "   -0.3153 if cv>=0.4098138093948364 & pa<=-0.07986893355846403 & pa>=-0.10706463605165481\n",
      "   +3.7410 if pav>=0.3114900290966034\n",
      "Run episode 480 with rewards 41.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 481 ===========\n",
      "57 actions [1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0]\n",
      "   +6.3425 if cp>=0.024442286789417268\n",
      "   -2.1979 if cp>=0.00045164491748437316\n",
      "   +5.5136 if cp>=-0.014802151545882224 & pa>=-0.09053615778684612 & pav<=-0.580714476108551 & pav>=-0.8724653482437134\n",
      "   -3.8219 if pav>=0.3114900290966034\n",
      "   -5.1935 if cp<=0.010710266418755054 & cv>=0.23148006200790405 & pa>=-0.028171932324767113 & pav>=-0.6160905957221985\n",
      "--------------\n",
      "   +4.8139 if cv<=0.41497159004211426\n",
      "   -5.7907 if cp>=-0.002485810266807661\n",
      "   +0.0002 if cv>=0.4098138093948364 & pa<=-0.07986893355846403 & pa>=-0.10706463605165481\n",
      "   +3.6790 if pav>=0.3114900290966034\n",
      "   +3.5124 if cp>=0.010710266418755054 & cv<=0.23148006200790405 & pa>=-0.028171932324767113\n",
      "Run episode 481 with rewards 57.0\n",
      "============ 482 ===========\n",
      "21 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   +5.9704 if cp>=0.024442286789417268\n",
      "   +2.7696 if cp>=-0.014802151545882224 & pa>=-0.09053615778684612 & pav<=-0.580714476108551 & pav>=-0.8724653482437134\n",
      "   -3.3236 if pav>=0.3114900290966034\n",
      "   +0.0000 if cp<=0.010710266418755054 & cv>=0.23148006200790405 & pa>=-0.028171932324767113 & pav>=-0.6160905957221985\n",
      "   -4.8040 if cp<=0.027937728166580213 & cp>=0.02027012072503567 & cv>=0.15404279232025148 & pa>=-0.004733150079846373\n",
      "--------------\n",
      "   +2.9866 if cv<=0.41497159004211426\n",
      "   -4.2676 if cp>=-0.002485810266807661\n",
      "   +1.7138 if pav>=0.3114900290966034\n",
      "   +3.1891 if cp>=0.010710266418755054 & cv<=0.23148006200790405 & pa>=-0.028171932324767113\n",
      "   -4.3327 if pa>=0.03088420443236828\n",
      "Run episode 482 with rewards 21.0\n",
      "============ 483 ===========\n",
      "41 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   +2.5864 if cp>=0.024442286789417268\n",
      "   +0.0000 if cp>=-0.014802151545882224 & pa>=-0.09053615778684612 & pav<=-0.580714476108551 & pav>=-0.8724653482437134\n",
      "   -2.3684 if pav>=0.3114900290966034\n",
      "   +0.0000 if cp<=0.027937728166580213 & cp>=0.02027012072503567 & cv>=0.15404279232025148 & pa>=-0.004733150079846373\n",
      "   +2.6703 if cp>=-0.011025765910744667 & pa>=-0.07097708433866501\n",
      "--------------\n",
      "   +3.2042 if cv<=0.41497159004211426\n",
      "   -4.7446 if cp>=-0.002485810266807661\n",
      "   +0.0000 if cp>=0.010710266418755054 & cv<=0.23148006200790405 & pa>=-0.028171932324767113\n",
      "   +0.0000 if pa>=0.03088420443236828\n",
      "   +2.7437 if cv<=0.5829967260360718 & cv>=0.5829967260360718\n",
      "Run episode 483 with rewards 41.0\n",
      "============ 484 ===========\n",
      "53 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   +1.7336 if cp>=0.024442286789417268\n",
      "   -1.9974 if pav>=0.3114900290966034\n",
      "   +0.0000 if cp<=0.027937728166580213 & cp>=0.02027012072503567 & cv>=0.15404279232025148 & pa>=-0.004733150079846373\n",
      "   +3.1772 if cp>=-0.011025765910744667 & pa>=-0.07097708433866501\n",
      "   -4.0080 if pa>=0.0014401157386600971 & pav<=-0.3587428331375122\n",
      "--------------\n",
      "   +3.2632 if cv<=0.41497159004211426\n",
      "   -5.1382 if cp>=-0.002485810266807661\n",
      "   +3.2881 if pa>=0.03088420443236828\n",
      "   +0.0000 if cv<=0.5829967260360718 & cv>=0.5829967260360718\n",
      "   +3.6481 if cv>=0.569101870059967 & pa>=0.0014401157386600971\n",
      "Run episode 484 with rewards 53.0\n",
      "============ 485 ===========\n",
      "45 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0]\n",
      "   +0.9529 if cp>=0.024442286789417268\n",
      "   -2.3110 if pav>=0.3114900290966034\n",
      "   +5.0403 if cp>=-0.011025765910744667 & pa>=-0.07097708433866501\n",
      "   -1.4664 if pa>=0.0014401157386600971 & pav<=-0.3587428331375122\n",
      "   +3.3450 if cv>=0.9670963883399963\n",
      "--------------\n",
      "   +2.9334 if cv<=0.41497159004211426\n",
      "   -4.9101 if cp>=-0.002485810266807661\n",
      "   +2.4123 if pa>=0.03088420443236828\n",
      "   +1.0366 if cv>=0.569101870059967 & pa>=0.0014401157386600971\n",
      "   -3.3450 if cv>=0.9670963883399963\n",
      "Run episode 485 with rewards 45.0\n",
      "============ 486 ===========\n",
      "34 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   -0.0805 if pav>=0.3114900290966034\n",
      "   +5.8010 if cp>=-0.011025765910744667 & pa>=-0.07097708433866501\n",
      "   -2.5567 if pa>=0.0014401157386600971 & pav<=-0.3587428331375122\n",
      "   +0.0068 if cv>=0.9670963883399963\n",
      "   +3.3973 if cv>=0.4370531439781189 & pa<=-0.0011482498375698887 & pav>=-0.9644701838493347\n",
      "--------------\n",
      "   +2.7415 if cv<=0.41497159004211426\n",
      "   -7.4414 if cp>=-0.002485810266807661\n",
      "   +0.0000 if pa>=0.03088420443236828\n",
      "   -0.0144 if cv>=0.9670963883399963\n",
      "   -3.3973 if cv>=0.4370531439781189 & pa<=-0.0011482498375698887 & pav>=-0.9644701838493347\n",
      "Run episode 486 with rewards 34.0\n",
      "============ 487 ===========\n",
      "30 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   +0.1877 if pav>=0.3114900290966034\n",
      "   +5.0480 if cp>=-0.011025765910744667 & pa>=-0.07097708433866501\n",
      "   -1.6917 if pa>=0.0014401157386600971 & pav<=-0.3587428331375122\n",
      "   +0.0006 if cv>=0.4370531439781189 & pa<=-0.0011482498375698887 & pav>=-0.9644701838493347\n",
      "   -3.0664 if cv>=-0.7867410063743592 & pa>=0.05214817151427281\n",
      "--------------\n",
      "   +2.9583 if cv<=0.41497159004211426\n",
      "   -5.9432 if cp>=-0.002485810266807661\n",
      "   -0.0026 if cv>=0.9670963883399963\n",
      "   -0.0028 if cv>=0.4370531439781189 & pa<=-0.0011482498375698887 & pav>=-0.9644701838493347\n",
      "  +10.1176 if cp<=0.023049185425043126 & pa>=0.05214817151427281\n",
      "Run episode 487 with rewards 30.0\n",
      "============ 488 ===========\n",
      "14 actions [0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0]\n",
      "   +1.6563 if pav>=0.3114900290966034\n",
      "   +4.2749 if cp>=-0.011025765910744667 & pa>=-0.07097708433866501\n",
      "   +0.3501 if pa>=0.0014401157386600971 & pav<=-0.3587428331375122\n",
      "   -0.0100 if cv>=-0.7867410063743592 & pa>=0.05214817151427281\n",
      "   -2.1065 if cp<=-0.01629803683608769 & cv<=-0.6502944588661193 & pa<=0.07311543673276902\n",
      "--------------\n",
      "   -0.7741 if cv<=0.41497159004211426\n",
      "   -1.9125 if cp>=-0.002485810266807661\n",
      "   -0.0291 if cv>=0.4370531439781189 & pa<=-0.0011482498375698887 & pav>=-0.9644701838493347\n",
      "   -2.2295 if cp<=0.023049185425043126 & pa>=0.05214817151427281\n",
      "   +4.4771 if cp<=-0.01629803683608769\n",
      "Run episode 488 with rewards 14.0\n",
      "============ 489 ===========\n",
      "32 actions [0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.5015 if pav>=0.3114900290966034\n",
      "   +0.4625 if cp>=-0.011025765910744667 & pa>=-0.07097708433866501\n",
      "   -0.0000 if pa>=0.0014401157386600971 & pav<=-0.3587428331375122\n",
      "   -0.2423 if cp<=-0.01629803683608769 & cv<=-0.6502944588661193 & pa<=0.07311543673276902\n",
      "   +3.6068 if cp>=-0.03756543025374412 & cv>=-0.6343786001205445\n",
      "--------------\n",
      "   +0.4210 if cv<=0.41497159004211426\n",
      "   -0.7466 if cp>=-0.002485810266807661\n",
      "   -0.9312 if cp<=0.023049185425043126 & pa>=0.05214817151427281\n",
      "   +1.2695 if cp<=-0.01629803683608769\n",
      "   +7.2671 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "Run episode 489 with rewards 32.0\n",
      "============ 490 ===========\n",
      "25 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0]\n",
      "   -2.1829 if pav>=0.3114900290966034\n",
      "   +1.0616 if cp>=-0.011025765910744667 & pa>=-0.07097708433866501\n",
      "   -0.5739 if cp<=-0.01629803683608769 & cv<=-0.6502944588661193 & pa<=0.07311543673276902\n",
      "   +6.3108 if cp>=-0.03756543025374412 & cv>=-0.6343786001205445\n",
      "   +4.5515 if cp<=-0.030008174106478686 & cp>=-0.04471365660429001 & cv<=0.23048890829086305 & pav<=0.07444641590118409\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.002485810266807661\n",
      "   -1.2108 if cp<=0.023049185425043126 & pa>=0.05214817151427281\n",
      "   +1.8782 if cp<=-0.01629803683608769\n",
      "   +2.4580 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   -4.7043 if cp<=-0.030008174106478686 & cp>=-0.04471365660429001 & pav<=0.07444641590118409 & pav>=-0.10267639309167861\n",
      "Run episode 490 with rewards 25.0\n",
      "============ 491 ===========\n",
      "31 actions [0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   -3.5115 if pav>=0.3114900290966034\n",
      "   +7.3122 if cp>=-0.011025765910744667 & pa>=-0.07097708433866501\n",
      "   +1.5532 if cp>=-0.03756543025374412 & cv>=-0.6343786001205445\n",
      "   -0.0000 if cp<=-0.030008174106478686 & cp>=-0.04471365660429001 & cv<=0.23048890829086305 & pav<=0.07444641590118409\n",
      "   -3.1061 if cp<=-0.061272853612899775 & pav<=0.28226370811462415\n",
      "--------------\n",
      "   +1.4104 if cp<=0.023049185425043126 & pa>=0.05214817151427281\n",
      "   +0.6872 if cp<=-0.01629803683608769\n",
      "   +0.6427 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   +0.0000 if cp<=-0.030008174106478686 & cp>=-0.04471365660429001 & pav<=0.07444641590118409 & pav>=-0.10267639309167861\n",
      "   -3.6967 if cp<=0.011734396778047088 & pa<=0.05169108584523203\n",
      "Run episode 491 with rewards 31.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 492 ===========\n",
      "37 actions [0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1]\n",
      "   -0.7910 if pav>=0.3114900290966034\n",
      "   +1.0248 if cp>=-0.011025765910744667 & pa>=-0.07097708433866501\n",
      "   +3.2381 if cp>=-0.03756543025374412 & cv>=-0.6343786001205445\n",
      "   -2.4880 if cp<=-0.061272853612899775 & pav<=0.28226370811462415\n",
      "   -4.8022 if cv<=-0.7599854469299316 & pa<=0.01908051408827305\n",
      "--------------\n",
      "   +4.1358 if cp<=0.023049185425043126 & pa>=0.05214817151427281\n",
      "   -0.0406 if cp<=-0.01629803683608769\n",
      "   -1.8130 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   -4.9789 if cp<=0.011734396778047088 & pa<=0.05169108584523203\n",
      "   +4.2280 if pa<=0.01908051408827305 & pa>=0.01908051408827305\n",
      "Run episode 492 with rewards 37.0\n",
      "============ 493 ===========\n",
      "45 actions [0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1]\n",
      "   +0.9264 if cp>=-0.011025765910744667 & pa>=-0.07097708433866501\n",
      "   +2.6773 if cp>=-0.03756543025374412 & cv>=-0.6343786001205445\n",
      "   -1.4209 if cp<=-0.061272853612899775 & pav<=0.28226370811462415\n",
      "   -2.6037 if cv<=-0.7599854469299316 & pa<=0.01908051408827305\n",
      "   +5.0496 if cv<=-0.4117184281349182 & pa<=0.08652647435665133 & pav<=0.6943521618843079\n",
      "--------------\n",
      "   +5.6758 if cp<=0.023049185425043126 & pa>=0.05214817151427281\n",
      "   -2.3946 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   -2.1873 if cp<=0.011734396778047088 & pa<=0.05169108584523203\n",
      "   -0.0000 if pa<=0.01908051408827305 & pa>=0.01908051408827305\n",
      "   -6.5591 if cv<=-0.4117184281349182 & pav<=0.6943521618843079\n",
      "Run episode 493 with rewards 45.0\n",
      "============ 494 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +2.6098 if cp>=-0.03756543025374412 & cv>=-0.6343786001205445\n",
      "   -0.6126 if cp<=-0.061272853612899775 & pav<=0.28226370811462415\n",
      "   -3.4248 if cv<=-0.7599854469299316 & pa<=0.01908051408827305\n",
      "   +0.0112 if cv<=-0.4117184281349182 & pa<=0.08652647435665133 & pav<=0.6943521618843079\n",
      "   +2.9710 if pa<=-0.01182293128222227\n",
      "--------------\n",
      "   +4.1766 if cp<=0.023049185425043126 & pa>=0.05214817151427281\n",
      "   -2.9766 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   -2.7010 if cp<=0.011734396778047088 & pa<=0.05169108584523203\n",
      "   -6.5217 if cv<=-0.4117184281349182 & pav<=0.6943521618843079\n",
      "   +2.7148 if cp<=0.023446995019912723\n",
      "Run episode 494 with rewards 12.0\n",
      "============ 495 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.5387 if cp>=-0.03756543025374412 & cv>=-0.6343786001205445\n",
      "   +0.0000 if cp<=-0.061272853612899775 & pav<=0.28226370811462415\n",
      "   +0.4157 if cv<=-0.7599854469299316 & pa<=0.01908051408827305\n",
      "   +1.7852 if pa<=-0.01182293128222227\n",
      "   +0.5911 if cp>=-0.030829526484012604\n",
      "--------------\n",
      "   -2.0442 if cp<=0.023049185425043126 & pa>=0.05214817151427281\n",
      "   -6.6164 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   +2.3185 if cv<=-0.4117184281349182 & pav<=0.6943521618843079\n",
      "   -7.4246 if cp<=0.023446995019912723\n",
      "   +0.4084 if cp<=-0.16351735293865202 & cv>=-0.9251467704772949\n",
      "Run episode 495 with rewards 8.0\n",
      "============ 496 ===========\n",
      "30 actions [0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1]\n",
      "   +0.0251 if cp>=-0.03756543025374412 & cv>=-0.6343786001205445\n",
      "   +0.0000 if cv<=-0.7599854469299316 & pa<=0.01908051408827305\n",
      "   +0.0000 if pa<=-0.01182293128222227\n",
      "   +0.0000 if cp>=-0.030829526484012604\n",
      "   +0.0187 if cp>=-0.03291536644101143\n",
      "--------------\n",
      "   +6.0485 if cp<=0.023049185425043126 & pa>=0.05214817151427281\n",
      "   +9.2451 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   +1.6210 if cv<=-0.4117184281349182 & pav<=0.6943521618843079\n",
      "   -0.0364 if cp<=0.023446995019912723\n",
      "   +1.0000 if cp<=-0.05456963330507278\n",
      "Run episode 496 with rewards 30.0\n",
      "============ 497 ===========\n",
      "41 actions [1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0]\n",
      "   -0.2229 if cp>=-0.03756543025374412 & cv>=-0.6343786001205445\n",
      "   -2.2676 if pa<=-0.01182293128222227\n",
      "   -0.2229 if cp>=-0.030829526484012604\n",
      "   -0.2229 if cp>=-0.03291536644101143\n",
      "   +2.1304 if pa<=0.02421671636402607\n",
      "--------------\n",
      "   +0.0000 if cp<=0.023049185425043126 & pa>=0.05214817151427281\n",
      "   +0.0000 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   +0.0000 if cv<=-0.4117184281349182 & pav<=0.6943521618843079\n",
      "   +0.0000 if cp<=-0.05456963330507278\n",
      "   +3.6753 if cp<=-0.01196023914963007 & cp>=-0.017379719763994217 & cv<=-0.03011808469891548\n",
      "Run episode 497 with rewards 41.0\n",
      "============ 498 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -16.3161 if pa<=-0.01182293128222227\n",
      "   -1.2779 if cp>=-0.030829526484012604\n",
      "   -1.2779 if cp>=-0.03291536644101143\n",
      "   +3.3637 if pa<=0.02421671636402607\n",
      "   -4.3465 if cp<=-0.0548764206469059 & pa>=0.1039608046412468\n",
      "--------------\n",
      "   -0.1172 if cp<=0.023049185425043126 & pa>=0.05214817151427281\n",
      "   +0.2125 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   +0.4608 if cv<=-0.4117184281349182 & pav<=0.6943521618843079\n",
      "   +2.7490 if cp<=-0.01196023914963007 & cp>=-0.017379719763994217 & cv<=-0.03011808469891548\n",
      "   +4.3562 if cp<=-0.0548764206469059 & pa>=0.1039608046412468\n",
      "Run episode 498 with rewards 8.0\n",
      "============ 499 ===========\n",
      "26 actions [1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   -0.1427 if pa<=-0.01182293128222227\n",
      "   -0.1427 if cp>=-0.030829526484012604\n",
      "   -0.1427 if pa<=0.02421671636402607\n",
      "   -0.0000 if cp<=-0.0548764206469059 & pa>=0.1039608046412468\n",
      "  +13.9556 if cp>=0.07797289639711381\n",
      "--------------\n",
      "   +0.0000 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   +0.0000 if cv<=-0.4117184281349182 & pav<=0.6943521618843079\n",
      "   +0.0000 if cp<=-0.01196023914963007 & cp>=-0.017379719763994217 & cv<=-0.03011808469891548\n",
      "   +0.0000 if cp<=-0.0548764206469059 & pa>=0.1039608046412468\n",
      "   +0.0000 if cp<=0.06038348004221916\n",
      "Run episode 499 with rewards 26.0\n",
      "============ 500 ===========\n",
      "24 actions [0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +0.2654 if pa<=-0.01182293128222227\n",
      "   -2.8142 if cp>=-0.030829526484012604\n",
      "   +5.3737 if pa<=0.02421671636402607\n",
      "   +2.1702 if cp>=0.07797289639711381\n",
      "   -6.2337 if cp<=0.07615478336811068 & pa<=0.0012674696044996494\n",
      "--------------\n",
      "  +18.3037 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   -0.0000 if cv<=-0.4117184281349182 & pav<=0.6943521618843079\n",
      "   -0.0000 if cp<=-0.01196023914963007 & cp>=-0.017379719763994217 & cv<=-0.03011808469891548\n",
      "  +10.9798 if cp<=-0.0548764206469059 & pa>=0.1039608046412468\n",
      "   +2.3156 if cp<=0.07615478336811068 & cv>=-0.5511630773544312 & pa<=0.0012674696044996494\n",
      "Run episode 500 with rewards 24.0\n",
      "============ 501 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -10.2681 if cp>=-0.030829526484012604\n",
      "  -11.2619 if pa<=0.02421671636402607\n",
      "   -9.3850 if cp>=0.07797289639711381\n",
      "   -7.9633 if cp<=0.07615478336811068 & pa<=0.0012674696044996494\n",
      "   -2.8650 if pa>=0.07674648761749268\n",
      "--------------\n",
      "   +2.8440 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   -0.0000 if cv<=-0.4117184281349182 & pav<=0.6943521618843079\n",
      "   -0.0000 if cp<=-0.0548764206469059 & pa>=0.1039608046412468\n",
      "   +0.5399 if cp<=0.07615478336811068 & cv>=-0.5511630773544312 & pa<=0.0012674696044996494\n",
      "   +3.8771 if pa>=0.07674648761749268\n",
      "Run episode 501 with rewards 9.0\n",
      "============ 502 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.2618 if cp>=-0.030829526484012604\n",
      "   +2.0355 if pa<=0.02421671636402607\n",
      "  +14.5583 if cp>=0.07797289639711381\n",
      "   -7.7847 if cp<=0.07615478336811068 & pa<=0.0012674696044996494\n",
      "   +1.0000 if cp<=0.05271103531122208\n",
      "--------------\n",
      "   -0.0000 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   +0.0000 if cp<=-0.0548764206469059 & pa>=0.1039608046412468\n",
      "   +0.0000 if cp<=0.07615478336811068 & cv>=-0.5511630773544312 & pa<=0.0012674696044996494\n",
      "   +0.0000 if pa>=0.07674648761749268\n",
      "   +0.0000 if cp<=0.05271103531122208\n",
      "Run episode 502 with rewards 9.0\n",
      "============ 503 ===========\n",
      "65 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +2.0630 if cp>=-0.030829526484012604\n",
      "   +1.5710 if pa<=0.02421671636402607\n",
      "   +0.0000 if cp>=0.07797289639711381\n",
      "   +0.0000 if cp<=0.07615478336811068 & pa<=0.0012674696044996494\n",
      "  -20.0000 if cp<=-0.05557908415794372\n",
      "--------------\n",
      "   +6.2287 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   +5.1801 if cp<=-0.0548764206469059 & pa>=0.1039608046412468\n",
      "   +0.0000 if cp<=0.07615478336811068 & cv>=-0.5511630773544312 & pa<=0.0012674696044996494\n",
      "   +6.2287 if pa>=0.07674648761749268\n",
      "   +1.0000 if cp<=-0.022246890142560004\n",
      "Run episode 503 with rewards 65.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 504 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   +2.9758 if cp>=-0.030829526484012604\n",
      "   -1.5593 if pa<=0.02421671636402607\n",
      "  +17.5733 if cp>=0.07797289639711381\n",
      "   -7.7647 if cp<=-0.05557908415794372\n",
      "   +5.1160 if cp<=0.15417632162570957 & pa<=0.06267490088939673 & pa>=-0.05154875069856643\n",
      "--------------\n",
      "   +6.9650 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   +0.0000 if cp<=-0.0548764206469059 & pa>=0.1039608046412468\n",
      "   +6.4716 if pa>=0.07674648761749268\n",
      "   -2.3301 if cp<=-0.022246890142560004\n",
      "   +6.3845 if cv<=-0.22216859459877014 & pa<=-0.05154875069856643 & pav<=0.4817822217941289\n",
      "Run episode 504 with rewards 10.0\n",
      "============ 505 ===========\n",
      "10 actions [0, 0, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.7838 if cp>=-0.030829526484012604\n",
      "   +0.0000 if cp>=0.07797289639711381\n",
      "   +0.0002 if cp<=-0.05557908415794372\n",
      "   +1.7341 if cp<=0.15417632162570957 & pa<=0.06267490088939673 & pa>=-0.05154875069856643\n",
      "   +0.6649 if cp>=0.01022158581763506\n",
      "--------------\n",
      "   -8.3128 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   -8.3742 if pa>=0.07674648761749268\n",
      "   -8.1006 if cp<=-0.022246890142560004\n",
      "   +0.7940 if cv<=-0.22216859459877014 & pa<=-0.05154875069856643 & pav<=0.4817822217941289\n",
      "   +1.0000 if cv<=-0.9390092968940735\n",
      "Run episode 505 with rewards 10.0\n",
      "============ 506 ===========\n",
      "47 actions [0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.9192 if cp>=-0.030829526484012604\n",
      "   -0.0000 if cp<=-0.05557908415794372\n",
      "   -2.5037 if cp<=0.15417632162570957 & pa<=0.06267490088939673 & pa>=-0.05154875069856643\n",
      "   +0.9201 if cp>=0.01022158581763506\n",
      "   +3.2137 if cp>=0.031809251755476\n",
      "--------------\n",
      "   +8.3128 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   +8.3742 if pa>=0.07674648761749268\n",
      "   +8.1006 if cp<=-0.022246890142560004\n",
      "   +1.0000 if cv<=-0.9390092968940735\n",
      "   +1.0000 if cp<=0.031809251755476 & cp>=0.02137250080704689\n",
      "Run episode 506 with rewards 47.0\n",
      "============ 507 ===========\n",
      "27 actions [0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1]\n",
      "   +3.0251 if cp>=-0.030829526484012604\n",
      "   -3.5360 if cp<=0.15417632162570957 & pa<=0.06267490088939673 & pa>=-0.05154875069856643\n",
      "   +2.5943 if cp>=0.01022158581763506\n",
      "   +6.2768 if cp>=0.031809251755476\n",
      "   -7.6534 if cp>=0.012179874069988734 & pav>=-0.6642648935317993\n",
      "--------------\n",
      "   +0.4735 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   -0.0000 if pa>=0.07674648761749268\n",
      "   +3.7069 if cp<=-0.022246890142560004\n",
      "   +2.3982 if cp<=0.031809251755476 & cp>=0.02137250080704689\n",
      "   -5.5699 if cv>=-0.18133982419967648 & cv>=0.0028693795204162904 & pav>=-0.2788690388202667\n",
      "Run episode 507 with rewards 27.0\n",
      "============ 508 ===========\n",
      "20 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.8838 if cp>=-0.030829526484012604\n",
      "   +2.2935 if cp<=0.15417632162570957 & pa<=0.06267490088939673 & pa>=-0.05154875069856643\n",
      "   +0.0000 if cp>=0.031809251755476\n",
      "   +0.0000 if cp>=0.012179874069988734 & pav>=-0.6642648935317993\n",
      "   -3.0552 if cp>=-0.027110809087753294 & pav>=0.6508710384368896\n",
      "--------------\n",
      "   +0.7907 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   +4.6455 if cp<=-0.022246890142560004\n",
      "   +0.0000 if cp<=0.031809251755476 & cp>=0.02137250080704689\n",
      "   -6.8414 if cv>=-0.18133982419967648 & cv>=0.0028693795204162904 & pav>=-0.2788690388202667\n",
      "   -1.2196 if \n",
      "Run episode 508 with rewards 20.0\n",
      "============ 509 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   +2.1454 if cp>=-0.030829526484012604\n",
      "   +0.9628 if cp<=0.15417632162570957 & pa<=0.06267490088939673 & pa>=-0.05154875069856643\n",
      "   +0.0000 if cp>=0.012179874069988734 & pav>=-0.6642648935317993\n",
      "   +0.8985 if cp>=-0.027110809087753294 & pav>=0.6508710384368896\n",
      "   -1.2176 if cp<=-0.013904586061835277 & cp>=-0.0867932379245758 & cv<=0.020514637976884846\n",
      "--------------\n",
      "   +2.4611 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   +4.7879 if cp<=-0.022246890142560004\n",
      "   -4.8776 if cv>=-0.18133982419967648 & cv>=0.0028693795204162904 & pav>=-0.2788690388202667\n",
      "   -2.2754 if \n",
      "   +2.3582 if pav>=1.4543012380599976\n",
      "Run episode 509 with rewards 10.0\n",
      "============ 510 ===========\n",
      "13 actions [0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0]\n",
      "   -0.0565 if cp>=-0.030829526484012604\n",
      "   +2.0085 if cp<=0.15417632162570957 & pa<=0.06267490088939673 & pa>=-0.05154875069856643\n",
      "   -0.8429 if cp>=-0.027110809087753294 & pav>=0.6508710384368896\n",
      "   -2.0637 if cp<=-0.013904586061835277 & cp>=-0.0867932379245758 & cv<=0.020514637976884846\n",
      "   +0.4204 if cp<=0.03373795226216316 & cp>=0.016372096538543705\n",
      "--------------\n",
      "   -8.6554 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "  -11.5025 if cp<=-0.022246890142560004\n",
      "   -1.3677 if cv>=-0.18133982419967648 & cv>=0.0028693795204162904 & pav>=-0.2788690388202667\n",
      "  -12.9368 if pav>=1.4543012380599976\n",
      "   +1.0000 if pa>=0.2048637717962265\n",
      "Run episode 510 with rewards 13.0\n",
      "============ 511 ===========\n",
      "23 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0]\n",
      "   +3.2335 if cp<=0.15417632162570957 & pa<=0.06267490088939673 & pa>=-0.05154875069856643\n",
      "   -1.9111 if cp>=-0.027110809087753294 & pav>=0.6508710384368896\n",
      "   -0.6448 if cp<=-0.013904586061835277 & cp>=-0.0867932379245758 & cv<=0.020514637976884846\n",
      "   -3.1116 if cp<=0.03373795226216316 & cp>=0.016372096538543705\n",
      "   +0.0149 if cp>=0.009048230759799488\n",
      "--------------\n",
      "   +9.1585 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "  +11.5594 if cp<=-0.022246890142560004\n",
      "   +0.7884 if cv>=-0.18133982419967648 & cv>=0.0028693795204162904 & pav>=-0.2788690388202667\n",
      "  +13.2445 if pav>=1.4543012380599976\n",
      "   +1.5598 if cp>=0.009048230759799488 & cv<=-0.5380533337593076\n",
      "Run episode 511 with rewards 23.0\n",
      "============ 512 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +3.8500 if cp<=0.15417632162570957 & pa<=0.06267490088939673 & pa>=-0.05154875069856643\n",
      "   +0.7489 if cp>=-0.027110809087753294 & pav>=0.6508710384368896\n",
      "   +0.2787 if cp<=-0.013904586061835277 & cp>=-0.0867932379245758 & cv<=0.020514637976884846\n",
      "   -1.3577 if cp<=0.03373795226216316 & cp>=0.016372096538543705\n",
      "  -19.9992 if cp>=0.016538787260651607\n",
      "--------------\n",
      "   +1.3030 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   +6.3836 if cp<=-0.022246890142560004\n",
      "   -0.0000 if pav>=1.4543012380599976\n",
      "   -0.0000 if cp>=0.009048230759799488 & cv<=-0.5380533337593076\n",
      "   -0.9821 if cp<=-0.00504495599307119 & cp<=0.016538787260651607 & cv<=1.169577670097351\n",
      "Run episode 512 with rewards 9.0\n",
      "============ 513 ===========\n",
      "30 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0]\n",
      "  -14.6295 if cp<=0.15417632162570957 & pa<=0.06267490088939673 & pa>=-0.05154875069856643\n",
      "   +0.2700 if cp>=-0.027110809087753294 & pav>=0.6508710384368896\n",
      "   +0.4894 if cp<=0.03373795226216316 & cp>=0.016372096538543705\n",
      "  +13.6878 if cp>=0.016538787260651607\n",
      "   -0.3217 if cp<=0.11799646466970444\n",
      "--------------\n",
      "   -0.0000 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   -0.0000 if cp<=-0.022246890142560004\n",
      "   -0.0000 if pav>=1.4543012380599976\n",
      "   -0.0000 if cp<=-0.00504495599307119 & cp<=0.016538787260651607 & cv<=1.169577670097351\n",
      "   +0.0000 if cp<=0.06234208792448044\n",
      "Run episode 513 with rewards 30.0\n",
      "============ 514 ===========\n",
      "13 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0]\n",
      "   -6.3239 if cp<=0.15417632162570957 & pa<=0.06267490088939673 & pa>=-0.05154875069856643\n",
      "   -0.0960 if cp<=0.03373795226216316 & cp>=0.016372096538543705\n",
      "   +5.1919 if cp>=0.016538787260651607\n",
      "   -3.0426 if cp<=0.11799646466970444\n",
      "   -8.1641 if pa>=0.20573613047599792\n",
      "--------------\n",
      "   -8.7976 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   -8.7976 if cp<=-0.022246890142560004\n",
      "   +4.8133 if pav>=1.4543012380599976\n",
      "   -8.7976 if cp<=-0.00504495599307119 & cp<=0.016538787260651607 & cv<=1.169577670097351\n",
      "   +2.1155 if cp<=0.06260557472705842 & pa>=-0.014330355823039978\n",
      "Run episode 514 with rewards 13.0\n",
      "============ 515 ===========\n",
      "35 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -6.6000 if cp<=0.15417632162570957 & pa<=0.06267490088939673 & pa>=-0.05154875069856643\n",
      "   +3.7203 if cp>=0.016538787260651607\n",
      "   -4.6839 if cp<=0.11799646466970444\n",
      "   +0.0000 if pa>=0.20573613047599792\n",
      "   +2.6330 if cv>=0.42061257362365745\n",
      "--------------\n",
      "   -0.0000 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   -0.0000 if cp<=-0.022246890142560004\n",
      "   -0.0000 if pav>=1.4543012380599976\n",
      "   +0.0073 if cp<=-0.00504495599307119 & cp<=0.016538787260651607 & cv<=1.169577670097351\n",
      "   -0.6793 if cv>=0.9633318185806274\n",
      "Run episode 515 with rewards 35.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 516 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0]\n",
      "   -0.0426 if cp<=0.15417632162570957 & pa<=0.06267490088939673 & pa>=-0.05154875069856643\n",
      "   +4.3840 if cp>=0.016538787260651607\n",
      "  -13.8846 if cp<=0.11799646466970444\n",
      "   +0.1576 if cv>=0.42061257362365745\n",
      "  +10.2589 if cp>=0.0343598447740078 & pa<=-0.05538062751293182 & pa>=-0.11794856488704682\n",
      "--------------\n",
      "   -0.0000 if cp<=-0.03756543025374412 & cv<=-0.24550054967403412\n",
      "   +1.3751 if cp<=-0.022246890142560004\n",
      "   -3.6621 if cp<=-0.00504495599307119 & cp<=0.016538787260651607 & cv<=1.169577670097351\n",
      "   -0.8088 if cv>=0.9633318185806274\n",
      "   +1.8958 if pav>=1.4159740209579468\n",
      "Run episode 516 with rewards 11.0\n",
      "============ 517 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -7.6849 if cp>=0.016538787260651607\n",
      "   -2.7663 if cp<=0.11799646466970444\n",
      "   -7.9607 if cv>=0.42061257362365745\n",
      "   -0.1682 if cp>=0.0343598447740078 & pa<=-0.05538062751293182 & pa>=-0.11794856488704682\n",
      "   +0.3010 if cp<=0.0004689665511250496\n",
      "--------------\n",
      "   -0.0000 if cp<=-0.022246890142560004\n",
      "   -0.0000 if cp<=-0.00504495599307119 & cp<=0.016538787260651607 & cv<=1.169577670097351\n",
      "   +0.9475 if cv>=0.9633318185806274\n",
      "   -0.0000 if pav>=1.4159740209579468\n",
      "   +0.5943 if cp<=0.09665267914533615 & cp>=0.05417013913393023 & cv>=0.963825523853302\n",
      "Run episode 517 with rewards 10.0\n",
      "============ 518 ===========\n",
      "55 actions [1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1]\n",
      "   +9.3897 if cp>=0.016538787260651607\n",
      "   +0.6122 if cp<=0.11799646466970444\n",
      "   +8.5464 if cv>=0.42061257362365745\n",
      "   -3.8355 if cp<=0.0004689665511250496\n",
      "   +1.0000 if cp<=0.007634516782127327 & cp>=-0.020884466916322706\n",
      "--------------\n",
      "   +1.0879 if cp<=-0.00504495599307119 & cp<=0.016538787260651607 & cv<=1.169577670097351\n",
      "   +0.0001 if cv>=0.9633318185806274\n",
      "   -0.0000 if pav>=1.4159740209579468\n",
      "   -0.0000 if cp<=0.09665267914533615 & cp>=0.05417013913393023 & cv>=0.963825523853302\n",
      "   +0.6429 if cp<=-0.03693445771932602\n",
      "Run episode 518 with rewards 55.0\n",
      "============ 519 ===========\n",
      "36 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0]\n",
      "   +6.0107 if cp>=0.016538787260651607\n",
      "  +10.5416 if cv>=0.42061257362365745\n",
      "   -6.3028 if cp<=0.0004689665511250496\n",
      "   +2.9465 if cp<=0.007634516782127327 & cp>=-0.020884466916322706\n",
      "   -0.8909 if cp>=0.008737471327185633 & cv<=0.40956060886383056\n",
      "--------------\n",
      "   +2.2061 if cp<=-0.00504495599307119 & cp<=0.016538787260651607 & cv<=1.169577670097351\n",
      "   +0.0000 if cv>=0.9633318185806274\n",
      "   +0.0000 if cp<=0.09665267914533615 & cp>=0.05417013913393023 & cv>=0.963825523853302\n",
      "   -0.1175 if cp<=-0.03693445771932602\n",
      "   +1.8428 if cp>=0.008737471327185633 & cv>=-0.17065418064594268 & pa<=0.006084751803427935 & pa>=-0.018039095774292944\n",
      "Run episode 519 with rewards 36.0\n",
      "============ 520 ===========\n",
      "35 actions [1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0]\n",
      "   +4.6680 if cp>=0.016538787260651607\n",
      "   +6.8764 if cv>=0.42061257362365745\n",
      "   -4.7713 if cp<=0.0004689665511250496\n",
      "   +1.8846 if cp<=0.007634516782127327 & cp>=-0.020884466916322706\n",
      "   -3.0626 if pav>=0.8050910234451294\n",
      "--------------\n",
      "   +1.9648 if cp<=-0.00504495599307119 & cp<=0.016538787260651607 & cv<=1.169577670097351\n",
      "   +0.0000 if cv>=0.9633318185806274\n",
      "   +0.0000 if cp<=-0.03693445771932602\n",
      "   +0.0000 if cp>=0.008737471327185633 & cv>=-0.17065418064594268 & pa<=0.006084751803427935 & pa>=-0.018039095774292944\n",
      "   +3.0626 if pav>=0.8050910234451294\n",
      "Run episode 520 with rewards 35.0\n",
      "============ 521 ===========\n",
      "45 actions [1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1]\n",
      "   +4.3053 if cp>=0.016538787260651607\n",
      "   +7.1975 if cv>=0.42061257362365745\n",
      "   -2.6024 if cp<=0.0004689665511250496\n",
      "   -0.0000 if pav>=0.8050910234451294\n",
      "   +3.6973 if cv>=0.40172467231750486 & pav>=-0.6807488918304443\n",
      "--------------\n",
      "   +0.8771 if cp<=-0.00504495599307119 & cp<=0.016538787260651607 & cv<=1.169577670097351\n",
      "   -0.0000 if cp<=-0.03693445771932602\n",
      "   -0.0000 if cp>=0.008737471327185633 & cv>=-0.17065418064594268 & pa<=0.006084751803427935 & pa>=-0.018039095774292944\n",
      "   -0.0000 if pav>=0.8050910234451294\n",
      "   +2.9731 if pav>=0.7279935479164124\n",
      "Run episode 521 with rewards 45.0\n",
      "============ 522 ===========\n",
      "26 actions [1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0]\n",
      "   +6.8790 if cp>=0.016538787260651607\n",
      "   +6.3154 if cv>=0.42061257362365745\n",
      "   -2.2290 if cp<=0.0004689665511250496\n",
      "   +0.0000 if cv>=0.40172467231750486 & pav>=-0.6807488918304443\n",
      "   -2.7180 if cp>=0.006706281239166915\n",
      "--------------\n",
      "   +0.4818 if cp<=-0.00504495599307119 & cp<=0.016538787260651607 & cv<=1.169577670097351\n",
      "   +3.3433 if cp>=0.008737471327185633 & cv>=-0.17065418064594268 & pa<=0.006084751803427935 & pa>=-0.018039095774292944\n",
      "   +1.9663 if pav>=0.8050910234451294\n",
      "   +1.6771 if pav>=0.7279935479164124\n",
      "   +4.4504 if cp<=0.0312889039516449 & cp>=-0.015848329290747643 & cv<=-0.4051395237445831 & cv<=0.36805674433708196 & pa<=-0.07716700136661529 & pa>=-0.10519040971994399\n",
      "Run episode 522 with rewards 26.0\n",
      "============ 523 ===========\n",
      "38 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +4.9017 if cp>=0.016538787260651607\n",
      "   +6.2774 if cv>=0.42061257362365745\n",
      "   -4.6526 if cp<=0.0004689665511250496\n",
      "   -4.1284 if cp>=0.006706281239166915\n",
      "   +1.9087 if \n",
      "--------------\n",
      "   +0.0000 if cp>=0.008737471327185633 & cv>=-0.17065418064594268 & pa<=0.006084751803427935 & pa>=-0.018039095774292944\n",
      "   +0.0000 if pav>=0.8050910234451294\n",
      "   +0.0000 if pav>=0.7279935479164124\n",
      "   +5.6579 if cp<=0.0312889039516449 & cp>=-0.015848329290747643 & cv<=-0.4051395237445831 & cv<=0.36805674433708196 & pa<=-0.07716700136661529 & pa>=-0.10519040971994399\n",
      "   -2.8778 if cp>=-0.005667153745889664 & cv<=0.2347601652145386 & pa>=-0.07000657916069031\n",
      "Run episode 523 with rewards 38.0\n",
      "============ 524 ===========\n",
      "42 actions [1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +4.7466 if cp>=0.016538787260651607\n",
      "   +7.2568 if cv>=0.42061257362365745\n",
      "   -4.2334 if cp<=0.0004689665511250496\n",
      "   -2.7506 if cp>=0.006706281239166915\n",
      "   +5.6541 if cp<=0.018950447812676432 & pa<=0.007640395779162648\n",
      "--------------\n",
      "   -5.0066 if cp>=0.008737471327185633 & cv>=-0.17065418064594268 & pa<=0.006084751803427935 & pa>=-0.018039095774292944\n",
      "   -1.2939 if pav>=0.8050910234451294\n",
      "   +0.0000 if cp<=0.0312889039516449 & cp>=-0.015848329290747643 & cv<=-0.4051395237445831 & cv<=0.36805674433708196 & pa<=-0.07716700136661529 & pa>=-0.10519040971994399\n",
      "   -4.6551 if cp>=-0.005667153745889664 & cv<=0.2347601652145386 & pa>=-0.07000657916069031\n",
      "   +2.9834 if cv<=0.1883446514606476 & pa>=0.007640395779162648 & pav>=-0.09695709943771359\n",
      "Run episode 524 with rewards 42.0\n",
      "============ 525 ===========\n",
      "31 actions [0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0]\n",
      "   +0.1590 if cp>=0.016538787260651607\n",
      "   +7.7509 if cv>=0.42061257362365745\n",
      "   -2.1772 if cp<=0.0004689665511250496\n",
      "   +4.1676 if cp<=0.018950447812676432 & pa<=0.007640395779162648\n",
      "   -1.9264 if cp<=0.010077395103871832 & cv>=-0.20890448987483978 & pa>=-0.0011674457928165787\n",
      "--------------\n",
      "   -0.7419 if cp>=0.008737471327185633 & cv>=-0.17065418064594268 & pa<=0.006084751803427935 & pa>=-0.018039095774292944\n",
      "   -1.9767 if pav>=0.8050910234451294\n",
      "   -4.4971 if cp>=-0.005667153745889664 & cv<=0.2347601652145386 & pa>=-0.07000657916069031\n",
      "   +1.4526 if cv<=0.1883446514606476 & pa>=0.007640395779162648 & pav>=-0.09695709943771359\n",
      "   -1.2830 if cv>=0.5720940232276917\n",
      "Run episode 525 with rewards 31.0\n",
      "============ 526 ===========\n",
      "35 actions [0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0]\n",
      "   +7.8965 if cv>=0.42061257362365745\n",
      "   -5.8940 if cp<=0.0004689665511250496\n",
      "   +0.0989 if cp<=0.018950447812676432 & pa<=0.007640395779162648\n",
      "   +0.9062 if cp<=0.010077395103871832 & cv>=-0.20890448987483978 & pa>=-0.0011674457928165787\n",
      "   +8.0635 if cp<=-0.01656123623251913 & pa<=0.05553453415632248\n",
      "--------------\n",
      "   +1.1384 if pav>=0.8050910234451294\n",
      "   -2.7674 if cp>=-0.005667153745889664 & cv<=0.2347601652145386 & pa>=-0.07000657916069031\n",
      "   +2.4793 if cv<=0.1883446514606476 & pa>=0.007640395779162648 & pav>=-0.09695709943771359\n",
      "   +0.0000 if cv>=0.5720940232276917\n",
      "   -8.4397 if cp<=-0.01656123623251913 & pa<=0.05553453415632248\n",
      "Run episode 526 with rewards 35.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 527 ===========\n",
      "32 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0]\n",
      "   +5.8201 if cv>=0.42061257362365745\n",
      "   -2.9665 if cp<=0.0004689665511250496\n",
      "   -0.5272 if cp<=0.010077395103871832 & cv>=-0.20890448987483978 & pa>=-0.0011674457928165787\n",
      "   +0.0000 if cp<=-0.01656123623251913 & pa<=0.05553453415632248\n",
      "   -5.4742 if cp>=0.023225478827953342 & cv<=0.029215022921562205 & pa<=0.034660347551107404\n",
      "--------------\n",
      "   +1.6045 if pav>=0.8050910234451294\n",
      "   -1.5949 if cp>=-0.005667153745889664 & cv<=0.2347601652145386 & pa>=-0.07000657916069031\n",
      "   +1.0786 if cv<=0.1883446514606476 & pa>=0.007640395779162648 & pav>=-0.09695709943771359\n",
      "   +0.0001 if cp<=-0.01656123623251913 & pa<=0.05553453415632248\n",
      "   +4.2433 if cp<=0.015167190693318844 & cv<=-0.18388716280460357 & pa<=0.08402228206396103\n",
      "Run episode 527 with rewards 32.0\n",
      "============ 528 ===========\n",
      "11 actions [0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1]\n",
      "   +1.8278 if cv>=0.42061257362365745\n",
      "   -0.0000 if cp<=0.0004689665511250496\n",
      "   -0.0000 if cp<=0.010077395103871832 & cv>=-0.20890448987483978 & pa>=-0.0011674457928165787\n",
      "   -7.9694 if cp>=0.023225478827953342 & cv<=0.029215022921562205 & pa<=0.034660347551107404\n",
      "   +2.1772 if cv<=0.1853512078523636\n",
      "--------------\n",
      "   -0.0000 if pav>=0.8050910234451294\n",
      "   -2.7250 if cp>=-0.005667153745889664 & cv<=0.2347601652145386 & pa>=-0.07000657916069031\n",
      "   +1.7545 if cv<=0.1883446514606476 & pa>=0.007640395779162648 & pav>=-0.09695709943771359\n",
      "   -0.0000 if cp<=0.015167190693318844 & cv<=-0.18388716280460357 & pa<=0.08402228206396103\n",
      "   +2.3442 if cp<=0.09391327500343323 & cp>=0.07674080431461335 & cv>=0.1853512078523636\n",
      "Run episode 528 with rewards 11.0\n",
      "============ 529 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cv>=0.42061257362365745\n",
      "   +4.5631 if cp<=0.0004689665511250496\n",
      "   -0.0000 if cp>=0.023225478827953342 & cv<=0.029215022921562205 & pa<=0.034660347551107404\n",
      "   +3.3367 if cv<=0.1853512078523636\n",
      "   -5.4686 if cv<=-0.6040807962417603\n",
      "--------------\n",
      "   +0.9693 if cp>=-0.005667153745889664 & cv<=0.2347601652145386 & pa>=-0.07000657916069031\n",
      "   -2.1316 if cv<=0.1883446514606476 & pa>=0.007640395779162648 & pav>=-0.09695709943771359\n",
      "   +3.7900 if cp<=0.015167190693318844 & cv<=-0.18388716280460357 & pa<=0.08402228206396103\n",
      "   -0.0000 if cp<=0.09391327500343323 & cp>=0.07674080431461335 & cv>=0.1853512078523636\n",
      "   -7.3265 if pa>=0.20376475155353546\n",
      "Run episode 529 with rewards 8.0\n",
      "============ 530 ===========\n",
      "30 actions [1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +1.9510 if cp<=0.0004689665511250496\n",
      "   +0.0000 if cp>=0.023225478827953342 & cv<=0.029215022921562205 & pa<=0.034660347551107404\n",
      "   +1.9510 if cv<=0.1853512078523636\n",
      "   +0.3194 if cv<=-0.6040807962417603\n",
      "   +0.7015 if cp>=-0.028152740374207494\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.005667153745889664 & cv<=0.2347601652145386 & pa>=-0.07000657916069031\n",
      "  +13.9530 if cv<=0.1883446514606476 & pa>=0.007640395779162648 & pav>=-0.09695709943771359\n",
      "   -7.9238 if cp<=0.015167190693318844 & cv<=-0.18388716280460357 & pa<=0.08402228206396103\n",
      "   +0.0000 if pa>=0.20376475155353546\n",
      "   -6.3922 if cp>=-0.026013841852545738\n",
      "Run episode 530 with rewards 30.0\n",
      "============ 531 ===========\n",
      "100 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +2.0793 if cp<=0.0004689665511250496\n",
      "   +0.5018 if cv<=0.1853512078523636\n",
      "   -0.1178 if cv<=-0.6040807962417603\n",
      "   +1.6946 if cp>=-0.028152740374207494\n",
      "   -3.7264 if cp<=-0.08616624921560287 & cv>=0.3126583695411682 & pa<=0.17547701597213744\n",
      "--------------\n",
      "   +8.3799 if cv<=0.1883446514606476 & pa>=0.007640395779162648 & pav>=-0.09695709943771359\n",
      "   -5.8349 if cp<=0.015167190693318844 & cv<=-0.18388716280460357 & pa<=0.08402228206396103\n",
      "   -0.0666 if pa>=0.20376475155353546\n",
      "   -1.6742 if cp>=-0.026013841852545738\n",
      "   +3.9692 if pav>=1.5314189195632935\n",
      "Run episode 531 with rewards 100.0\n",
      "best\n",
      "============ 532 ===========\n",
      "42 actions [1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1]\n",
      "   -0.9343 if cp<=0.0004689665511250496\n",
      "   +2.2729 if cv<=0.1853512078523636\n",
      "   +0.8605 if cp>=-0.028152740374207494\n",
      "   -0.0008 if cp<=-0.08616624921560287 & cv>=0.3126583695411682 & pa<=0.17547701597213744\n",
      "   +4.1985 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "--------------\n",
      "  +10.5766 if cv<=0.1883446514606476 & pa>=0.007640395779162648 & pav>=-0.09695709943771359\n",
      "   -0.0000 if cp<=0.015167190693318844 & cv<=-0.18388716280460357 & pa<=0.08402228206396103\n",
      "   -1.3625 if cp>=-0.026013841852545738\n",
      "   -0.0000 if pav>=1.5314189195632935\n",
      "   -6.8066 if cp>=0.09982170760631563 & cv<=0.1339903950691223 & pa<=0.01899844706058502\n",
      "Run episode 532 with rewards 42.0\n",
      "============ 533 ===========\n",
      "43 actions [1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1]\n",
      "   -4.0462 if cp<=0.0004689665511250496\n",
      "   -1.5661 if cv<=0.1853512078523636\n",
      "   +0.3492 if cp>=-0.028152740374207494\n",
      "   +7.4291 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "   +8.1554 if cp>=-0.027103241905570022 & cv<=0.020878265425562877\n",
      "--------------\n",
      "   +5.0222 if cv<=0.1883446514606476 & pa>=0.007640395779162648 & pav>=-0.09695709943771359\n",
      "   +2.4757 if cp<=0.015167190693318844 & cv<=-0.18388716280460357 & pa<=0.08402228206396103\n",
      "   -0.1964 if cp>=-0.026013841852545738\n",
      "   -0.0000 if cp>=0.09982170760631563 & cv<=0.1339903950691223 & pa<=0.01899844706058502\n",
      "   +6.1161 if cp<=0.04248922541737557 & cv<=0.21956417560577393 & pa<=0.044113460928201696 & pav<=0.37474566102027895\n",
      "Run episode 533 with rewards 43.0\n",
      "============ 534 ===========\n",
      "23 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1]\n",
      "   -3.4056 if cp<=0.0004689665511250496\n",
      "   +0.9764 if cv<=0.1853512078523636\n",
      "   +5.9704 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "   +5.0076 if cp>=-0.027103241905570022 & cv<=0.020878265425562877\n",
      "   +3.5479 if cp>=0.02047837153077126 & cv<=-0.20609814822673797\n",
      "--------------\n",
      "   +3.9677 if cv<=0.1883446514606476 & pa>=0.007640395779162648 & pav>=-0.09695709943771359\n",
      "   +1.8084 if cp<=0.015167190693318844 & cv<=-0.18388716280460357 & pa<=0.08402228206396103\n",
      "   +0.6999 if cp>=-0.026013841852545738\n",
      "   +4.8921 if cp<=0.04248922541737557 & cv<=0.21956417560577393 & pa<=0.044113460928201696 & pav<=0.37474566102027895\n",
      "   +4.3901 if cv<=0.17023333609104158 & cv>=-0.20609814822673797 & pa<=0.11839164495468141 & pav>=0.16081965863704692\n",
      "Run episode 534 with rewards 23.0\n",
      "============ 535 ===========\n",
      "32 actions [1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0]\n",
      "   +0.5156 if cp<=0.0004689665511250496\n",
      "   +4.6195 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "   -0.0000 if cp>=-0.027103241905570022 & cv<=0.020878265425562877\n",
      "   -0.0000 if cp>=0.02047837153077126 & cv<=-0.20609814822673797\n",
      "  +10.3326 if cp>=0.0514470674097538\n",
      "--------------\n",
      "   +0.0000 if cv<=0.1883446514606476 & pa>=0.007640395779162648 & pav>=-0.09695709943771359\n",
      "   +0.0000 if cp<=0.015167190693318844 & cv<=-0.18388716280460357 & pa<=0.08402228206396103\n",
      "   +5.0169 if cp<=0.04248922541737557 & cv<=0.21956417560577393 & pa<=0.044113460928201696 & pav<=0.37474566102027895\n",
      "   +0.0000 if cv<=0.17023333609104158 & cv>=-0.20609814822673797 & pa<=0.11839164495468141 & pav>=0.16081965863704692\n",
      "   -0.7655 if cv<=0.24723159670829772\n",
      "Run episode 535 with rewards 32.0\n",
      "============ 536 ===========\n",
      "24 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0]\n",
      "   -3.1051 if cp<=0.0004689665511250496\n",
      "   +5.4881 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "   -1.1532 if cp>=-0.027103241905570022 & cv<=0.020878265425562877\n",
      "   +2.9882 if cp>=0.0514470674097538\n",
      "   +4.6474 if pa>=0.003835946787148714\n",
      "--------------\n",
      "   -0.0000 if cv<=0.1883446514606476 & pa>=0.007640395779162648 & pav>=-0.09695709943771359\n",
      "   -0.7448 if cp<=0.04248922541737557 & cv<=0.21956417560577393 & pa<=0.044113460928201696 & pav<=0.37474566102027895\n",
      "   -0.0000 if cv<=0.17023333609104158 & cv>=-0.20609814822673797 & pa<=0.11839164495468141 & pav>=0.16081965863704692\n",
      "   +6.2441 if cv<=0.24723159670829772\n",
      "   -4.7197 if cp<=0.015202299505472184 & cp>=-0.0014008165337145316 & cv>=0.013719696085900073\n",
      "Run episode 536 with rewards 24.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 537 ===========\n",
      "43 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1]\n",
      "   -0.0000 if cp<=0.0004689665511250496\n",
      "   +7.9179 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "  -11.5973 if cp>=0.0514470674097538\n",
      "   -0.0000 if pa>=0.003835946787148714\n",
      "   +1.0889 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "--------------\n",
      "   +2.7039 if cp<=0.04248922541737557 & cv<=0.21956417560577393 & pa<=0.044113460928201696 & pav<=0.37474566102027895\n",
      "   +0.0000 if cv<=0.17023333609104158 & cv>=-0.20609814822673797 & pa<=0.11839164495468141 & pav>=0.16081965863704692\n",
      "   +2.7039 if cv<=0.24723159670829772\n",
      "   -0.5714 if cp<=0.015202299505472184 & cp>=-0.0014008165337145316 & cv>=0.013719696085900073\n",
      "   -3.9738 if cv>=-0.031203919276595115\n",
      "Run episode 537 with rewards 43.0\n",
      "============ 538 ===========\n",
      "57 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1]\n",
      "   +7.5588 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "  +12.9985 if cp>=0.0514470674097538\n",
      "   -2.1933 if pa>=0.003835946787148714\n",
      "   +3.0255 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   -2.5048 if cp<=0.04152171462774277 & cv<=0.012428898550570012 & pa<=0.0007444730028510103\n",
      "--------------\n",
      "   +2.9155 if cp<=0.04248922541737557 & cv<=0.21956417560577393 & pa<=0.044113460928201696 & pav<=0.37474566102027895\n",
      "   -0.3639 if cv<=0.24723159670829772\n",
      "   -0.3211 if cp<=0.015202299505472184 & cp>=-0.0014008165337145316 & cv>=0.013719696085900073\n",
      "   -1.0710 if cv>=-0.031203919276595115\n",
      "   +4.1987 if cv<=0.012428898550570012\n",
      "Run episode 538 with rewards 57.0\n",
      "============ 539 ===========\n",
      "27 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +6.6122 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "   -0.0000 if cp>=0.0514470674097538\n",
      "   +8.3358 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   -0.1983 if cp<=0.04152171462774277 & cv<=0.012428898550570012 & pa<=0.0007444730028510103\n",
      "   -4.3022 if cp<=0.010149947181344033 & cv<=0.024221719801425935 & pa>=-0.021161284297704697\n",
      "--------------\n",
      "   +1.5586 if cp<=0.04248922541737557 & cv<=0.21956417560577393 & pa<=0.044113460928201696 & pav<=0.37474566102027895\n",
      "   +2.5396 if cv<=0.24723159670829772\n",
      "   +0.8966 if cv>=-0.031203919276595115\n",
      "   +1.6430 if cv<=0.012428898550570012\n",
      "   -3.9848 if cv>=0.020977913215756417 & pav<=0.03450910858809952\n",
      "Run episode 539 with rewards 27.0\n",
      "============ 540 ===========\n",
      "25 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0]\n",
      "   +3.9746 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "   +6.7154 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   +0.6466 if cp<=0.04152171462774277 & cv<=0.012428898550570012 & pa<=0.0007444730028510103\n",
      "   -0.0000 if cp<=0.010149947181344033 & cv<=0.024221719801425935 & pa>=-0.021161284297704697\n",
      "   -5.0829 if cv>=-0.006612250488251441\n",
      "--------------\n",
      "   +1.7021 if cp<=0.04248922541737557 & cv<=0.21956417560577393 & pa<=0.044113460928201696 & pav<=0.37474566102027895\n",
      "   +1.7021 if cv<=0.24723159670829772\n",
      "   +1.7058 if cv<=0.012428898550570012\n",
      "   -0.0037 if cv>=0.020977913215756417 & pav<=0.03450910858809952\n",
      "   -0.3541 if cp>=-0.0013144951779395337\n",
      "Run episode 540 with rewards 25.0\n",
      "============ 541 ===========\n",
      "22 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.2970 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "   +5.0734 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   -0.0000 if cp<=0.04152171462774277 & cv<=0.012428898550570012 & pa<=0.0007444730028510103\n",
      "   -1.9796 if cv>=-0.006612250488251441\n",
      "   -4.0588 if cv>=0.19031234085559845 & pa<=-0.08564410656690598 & pav>=-0.5283585786819458\n",
      "--------------\n",
      "   +0.1993 if cp<=0.04248922541737557 & cv<=0.21956417560577393 & pa<=0.044113460928201696 & pav<=0.37474566102027895\n",
      "   +7.5471 if cv<=0.24723159670829772\n",
      "   +0.1185 if cv<=0.012428898550570012\n",
      "   -1.5704 if cp>=-0.0013144951779395337\n",
      "   -5.6603 if cp<=0.09743509739637375 & cp>=0.07319603264331818 & cv<=0.19031234085559845 & pa>=-0.08564410656690598\n",
      "Run episode 541 with rewards 22.0\n",
      "============ 542 ===========\n",
      "40 actions [1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.3683 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "   +0.9961 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   +0.3890 if cv>=-0.006612250488251441\n",
      "   +0.0000 if cv>=0.19031234085559845 & pa<=-0.08564410656690598 & pav>=-0.5283585786819458\n",
      "   +1.7924 if cv>=0.18344755470752716\n",
      "--------------\n",
      "   +2.4588 if cp<=0.04248922541737557 & cv<=0.21956417560577393 & pa<=0.044113460928201696 & pav<=0.37474566102027895\n",
      "   +2.1295 if cv<=0.24723159670829772\n",
      "   -0.9910 if cp>=-0.0013144951779395337\n",
      "   -0.0000 if cp<=0.09743509739637375 & cp>=0.07319603264331818 & cv<=0.19031234085559845 & pa>=-0.08564410656690598\n",
      "   +4.4314 if cp>=0.03722931370139122 & cv<=0.18344755470752716\n",
      "Run episode 542 with rewards 40.0\n",
      "============ 543 ===========\n",
      "17 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -1.8057 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "   +0.8281 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   -0.7033 if cv>=-0.006612250488251441\n",
      "   +4.1873 if cv>=0.18344755470752716\n",
      "   -5.0858 if cp<=0.05371867716312409 & cv>=0.06344528198242189 & pav>=-0.27223171591758727\n",
      "--------------\n",
      "   +2.5851 if cp<=0.04248922541737557 & cv<=0.21956417560577393 & pa<=0.044113460928201696 & pav<=0.37474566102027895\n",
      "   +3.2117 if cv<=0.24723159670829772\n",
      "   -0.7047 if cp>=-0.0013144951779395337\n",
      "   +5.2160 if cp>=0.03722931370139122 & cv<=0.18344755470752716\n",
      "   -2.6751 if cp>=0.05371867716312409 & cv<=0.24446063935756684\n",
      "Run episode 543 with rewards 17.0\n",
      "============ 544 ===========\n",
      "24 actions [1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0]\n",
      "   -0.2724 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "   +0.6552 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   -0.2724 if cv>=0.18344755470752716\n",
      "   +0.0000 if cp<=0.05371867716312409 & cv>=0.06344528198242189 & pav>=-0.27223171591758727\n",
      "   +4.1209 if cv>=0.22646544873714447 & pav<=-0.4365691304206848\n",
      "--------------\n",
      "   +1.4297 if cp<=0.04248922541737557 & cv<=0.21956417560577393 & pa<=0.044113460928201696 & pav<=0.37474566102027895\n",
      "   +1.3423 if cv<=0.24723159670829772\n",
      "   -0.0000 if cp>=0.03722931370139122 & cv<=0.18344755470752716\n",
      "   -0.0000 if cp>=0.05371867716312409 & cv<=0.24446063935756684\n",
      "   +4.2634 if cv>=0.049531131982803345 & pav>=-0.4365691304206848\n",
      "Run episode 544 with rewards 24.0\n",
      "============ 545 ===========\n",
      "22 actions [1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1]\n",
      "   +1.7941 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "   +3.5728 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   -1.0887 if cv>=0.18344755470752716\n",
      "   +1.7771 if cv>=0.22646544873714447 & pav<=-0.4365691304206848\n",
      "   -1.1691 if pav>=0.039883263409137726\n",
      "--------------\n",
      "   +1.2239 if cp<=0.04248922541737557 & cv<=0.21956417560577393 & pa<=0.044113460928201696 & pav<=0.37474566102027895\n",
      "   +2.9302 if cv<=0.24723159670829772\n",
      "   -1.7020 if cp>=0.03722931370139122 & cv<=0.18344755470752716\n",
      "   +2.4993 if cv>=0.049531131982803345 & pav>=-0.4365691304206848\n",
      "   -2.2338 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "Run episode 545 with rewards 22.0\n",
      "============ 546 ===========\n",
      "27 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0]\n",
      "   -0.0152 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "   +2.2685 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   +2.1095 if cv>=0.22646544873714447 & pav<=-0.4365691304206848\n",
      "   +0.0000 if pav>=0.039883263409137726\n",
      "   -2.6274 if cp>=0.03658856973052025 & cv<=0.033622947067488015 & pav>=-0.4059382438659667\n",
      "--------------\n",
      "   +3.0575 if cv<=0.24723159670829772\n",
      "   -1.7807 if cp>=0.03722931370139122 & cv<=0.18344755470752716\n",
      "   +4.3255 if cv>=0.049531131982803345 & pav>=-0.4365691304206848\n",
      "   -1.9465 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   +3.1877 if cp>=0.03658856973052025 & cv<=0.033622947067488015 & pav>=-0.4059382438659667\n",
      "Run episode 546 with rewards 27.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 547 ===========\n",
      "19 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.0349 if cp<=0.03955579027533531 & cv>=0.1471000373363495 & pav<=-0.16999360918998718\n",
      "   +3.6250 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   +1.7024 if cv>=0.22646544873714447 & pav<=-0.4365691304206848\n",
      "   -0.0501 if cp>=0.03658856973052025 & cv<=0.033622947067488015 & pav>=-0.4059382438659667\n",
      "   -3.9235 if cp<=0.09107083082199097 & cv<=0.2734469056129458 & pav<=-0.29603985548019407\n",
      "--------------\n",
      "   +3.3477 if cv<=0.24723159670829772\n",
      "   +2.1821 if cv>=0.049531131982803345 & pav>=-0.4365691304206848\n",
      "   +1.4078 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   +0.6806 if cp>=0.03658856973052025 & cv<=0.033622947067488015 & pav>=-0.4059382438659667\n",
      "   -4.8983 if cp>=0.09107083082199097 & cv<=0.2734469056129458\n",
      "Run episode 547 with rewards 19.0\n",
      "============ 548 ===========\n",
      "23 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0]\n",
      "   +1.6414 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   +2.4274 if cv>=0.22646544873714447 & pav<=-0.4365691304206848\n",
      "   +0.0000 if cp>=0.03658856973052025 & cv<=0.033622947067488015 & pav>=-0.4059382438659667\n",
      "   -0.8215 if cp<=0.09107083082199097 & cv<=0.2734469056129458 & pav<=-0.29603985548019407\n",
      "   -0.0063 if \n",
      "--------------\n",
      "   +2.5894 if cv<=0.24723159670829772\n",
      "   +1.2025 if cv>=0.049531131982803345 & pav>=-0.4365691304206848\n",
      "   +0.5934 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   +0.0000 if cp>=0.09107083082199097 & cv<=0.2734469056129458\n",
      "   +1.1302 if pa>=0.00038720472366549075\n",
      "Run episode 548 with rewards 23.0\n",
      "============ 549 ===========\n",
      "31 actions [1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +3.4375 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   +2.3006 if cv>=0.22646544873714447 & pav<=-0.4365691304206848\n",
      "   +0.4881 if cp<=0.09107083082199097 & cv<=0.2734469056129458 & pav<=-0.29603985548019407\n",
      "   -1.2205 if \n",
      "   +1.0789 if cv<=0.18412997722625732\n",
      "--------------\n",
      "   +2.2441 if cv<=0.24723159670829772\n",
      "   +0.7661 if cv>=0.049531131982803345 & pav>=-0.4365691304206848\n",
      "   -1.3160 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   +0.7373 if pa>=0.00038720472366549075\n",
      "   +2.3543 if cp<=0.06548167094588281 & pav>=-0.2731593430042267\n",
      "Run episode 549 with rewards 31.0\n",
      "============ 550 ===========\n",
      "27 actions [1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1]\n",
      "   +4.4199 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   +0.5663 if cv>=0.22646544873714447 & pav<=-0.4365691304206848\n",
      "   +1.0897 if \n",
      "   +1.8705 if cv<=0.18412997722625732\n",
      "   -3.0358 if cv<=0.21047437191009521\n",
      "--------------\n",
      "   -0.1835 if cv<=0.24723159670829772\n",
      "   +2.6659 if cv>=0.049531131982803345 & pav>=-0.4365691304206848\n",
      "   +0.2905 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   +4.5607 if cp<=0.06548167094588281 & pav>=-0.2731593430042267\n",
      "   -3.1415 if cv<=0.2058197259902954 & cv>=0.2058197259902954\n",
      "Run episode 550 with rewards 27.0\n",
      "============ 551 ===========\n",
      "30 actions [1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1]\n",
      "   +7.2296 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   -0.8003 if \n",
      "   -0.9682 if cv<=0.18412997722625732\n",
      "   -0.9682 if cv<=0.21047437191009521\n",
      "   -2.7169 if cv<=0.2408610224723816 & pav<=-0.4076853215694427\n",
      "--------------\n",
      "   +1.2016 if cv>=0.049531131982803345 & pav>=-0.4365691304206848\n",
      "   +2.0078 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   +1.6829 if cp<=0.06548167094588281 & pav>=-0.2731593430042267\n",
      "   +0.0000 if cv<=0.2058197259902954 & cv>=0.2058197259902954\n",
      "   +2.6540 if pav>=-0.2959510624408722\n",
      "Run episode 551 with rewards 30.0\n",
      "============ 552 ===========\n",
      "33 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0]\n",
      "   +5.6469 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   -0.7502 if cv<=0.18412997722625732\n",
      "   -0.7502 if cv<=0.21047437191009521\n",
      "   +6.3557 if cv<=0.2408610224723816 & pav<=-0.4076853215694427\n",
      "   +2.1857 if cp>=-0.008740498125553128 & cv<=0.24459224045276642 & pav>=-0.5427351474761962\n",
      "--------------\n",
      "   +0.6896 if cv>=0.049531131982803345 & pav>=-0.4365691304206848\n",
      "   +1.9928 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   +1.8123 if cp<=0.06548167094588281 & pav>=-0.2731593430042267\n",
      "   +1.8123 if pav>=-0.2959510624408722\n",
      "   -1.1948 if cp>=-0.008740498125553128 & cv<=0.24459224045276642 & pav>=-0.5427351474761962\n",
      "Run episode 552 with rewards 33.0\n",
      "============ 553 ===========\n",
      "31 actions [1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +5.8835 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   -2.2577 if cv<=0.21047437191009521\n",
      "   -0.6244 if cv<=0.2408610224723816 & pav<=-0.4076853215694427\n",
      "   +1.0748 if cp>=-0.008740498125553128 & cv<=0.24459224045276642 & pav>=-0.5427351474761962\n",
      "   +5.3509 if cp>=0.032033082097768784\n",
      "--------------\n",
      "   +2.6443 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   +1.4975 if cp<=0.06548167094588281 & pav>=-0.2731593430042267\n",
      "   +2.2863 if pav>=-0.2959510624408722\n",
      "   +0.6341 if cp>=-0.008740498125553128 & cv<=0.24459224045276642 & pav>=-0.5427351474761962\n",
      "   -5.4492 if cp>=0.032033082097768784\n",
      "Run episode 553 with rewards 31.0\n",
      "============ 554 ===========\n",
      "48 actions [1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +4.7681 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   -0.6852 if cv<=0.21047437191009521\n",
      "   -0.8065 if cp>=-0.008740498125553128 & cv<=0.24459224045276642 & pav>=-0.5427351474761962\n",
      "   +2.9458 if cp>=0.032033082097768784\n",
      "   +3.1527 if cp>=0.04363182932138443 & cv>=0.13485614955425262\n",
      "--------------\n",
      "   +3.6358 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   +1.5590 if cp<=0.06548167094588281 & pav>=-0.2731593430042267\n",
      "   +1.5590 if pav>=-0.2959510624408722\n",
      "   -2.2356 if cp>=0.032033082097768784\n",
      "   -3.2970 if cp>=0.04363182932138443 & cv>=0.13485614955425262\n",
      "Run episode 554 with rewards 48.0\n",
      "============ 555 ===========\n",
      "47 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0]\n",
      "   +3.5808 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   -1.5897 if cp>=-0.008740498125553128 & cv<=0.24459224045276642 & pav>=-0.5427351474761962\n",
      "   +4.6499 if cp>=0.032033082097768784\n",
      "   +2.3564 if cp>=0.04363182932138443 & cv>=0.13485614955425262\n",
      "  +10.6120 if pa>=0.19458255171775818\n",
      "--------------\n",
      "   +6.3399 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   +3.0078 if cp<=0.06548167094588281 & pav>=-0.2731593430042267\n",
      "   -4.2592 if cp>=0.032033082097768784\n",
      "   -3.7434 if cp>=0.04363182932138443 & cv>=0.13485614955425262\n",
      "  -10.5200 if pa>=0.19458255171775818\n",
      "Run episode 555 with rewards 47.0\n",
      "origin 58.257985024960036 new 59.69722488227554 not updated\n",
      "============ 556 ===========\n",
      "37 actions [1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0]\n",
      "   +5.3824 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   +5.4387 if cp>=0.032033082097768784\n",
      "   -0.0000 if cp>=0.04363182932138443 & cv>=0.13485614955425262\n",
      "   -0.0000 if pa>=0.19458255171775818\n",
      "   -2.4872 if pa>=-0.1174993798136711 & pav>=-0.37325292229652396\n",
      "--------------\n",
      "   +6.3399 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   +3.0078 if cp<=0.06548167094588281 & pav>=-0.2731593430042267\n",
      "   -4.2592 if cp>=0.032033082097768784\n",
      "   -3.7434 if cp>=0.04363182932138443 & cv>=0.13485614955425262\n",
      "  -10.5200 if pa>=0.19458255171775818\n",
      "Run episode 556 with rewards 37.0\n",
      "============ 557 ===========\n",
      "59 actions [1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +2.3131 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   +6.7916 if cp>=0.032033082097768784\n",
      "   +0.0000 if pa>=0.19458255171775818\n",
      "   -2.1335 if pa>=-0.1174993798136711 & pav>=-0.37325292229652396\n",
      "   +3.5776 if cv>=-0.041355805844068526 & pav<=-0.36174283027648924\n",
      "--------------\n",
      "   +4.9049 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   -5.1075 if cp>=0.032033082097768784\n",
      "   +0.0000 if cp>=0.04363182932138443 & cv>=0.13485614955425262\n",
      "   +0.0000 if pa>=0.19458255171775818\n",
      "   +2.9107 if pav>=-0.2408460021018982\n",
      "Run episode 557 with rewards 59.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 558 ===========\n",
      "58 actions [1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.4144 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   +7.1109 if cp>=0.032033082097768784\n",
      "   -1.1896 if pa>=-0.1174993798136711 & pav>=-0.37325292229652396\n",
      "   +3.1402 if cv>=-0.041355805844068526 & pav<=-0.36174283027648924\n",
      "   -1.3004 if cv<=0.20719160437583925 & pa<=0.06922223716974263\n",
      "--------------\n",
      "   +3.0821 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   -4.6351 if cp>=0.032033082097768784\n",
      "   -0.0298 if pa>=0.19458255171775818\n",
      "   +1.4482 if pav>=-0.2408460021018982\n",
      "   +1.8445 if cv<=0.20719160437583925\n",
      "Run episode 558 with rewards 58.0\n",
      "============ 559 ===========\n",
      "30 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +2.7461 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   +5.5184 if cp>=0.032033082097768784\n",
      "   +2.7461 if cv>=-0.041355805844068526 & pav<=-0.36174283027648924\n",
      "   -1.7633 if cv<=0.20719160437583925 & pa<=0.06922223716974263\n",
      "   +6.6750 if cp<=0.02802856378257275 & cv>=0.2126500815153122 & pa<=-0.005887368880212307\n",
      "--------------\n",
      "   +2.7289 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   -4.1026 if cp>=0.032033082097768784\n",
      "   +1.9342 if pav>=-0.2408460021018982\n",
      "   +1.3494 if cv<=0.20719160437583925\n",
      "   -7.4047 if cp<=0.02802856378257275 & cv>=0.2126500815153122 & pa<=-0.005887368880212307\n",
      "Run episode 559 with rewards 30.0\n",
      "============ 560 ===========\n",
      "31 actions [1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1]\n",
      "   +3.6283 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   +0.0000 if cp>=0.032033082097768784\n",
      "   +1.1528 if cv>=-0.041355805844068526 & pav<=-0.36174283027648924\n",
      "   +0.6787 if cp<=0.02802856378257275 & cv>=0.2126500815153122 & pa<=-0.005887368880212307\n",
      "   -2.3720 if pa>=-0.1094664305448532 & pav>=-0.27426750659942617\n",
      "--------------\n",
      "   -0.1412 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   +0.0000 if cp>=0.032033082097768784\n",
      "   +1.6893 if pav>=-0.2408460021018982\n",
      "   -0.1421 if cp<=0.02802856378257275 & cv>=0.2126500815153122 & pa<=-0.005887368880212307\n",
      "   +2.2601 if pav>=-0.27426750659942617\n",
      "Run episode 560 with rewards 31.0\n",
      "============ 561 ===========\n",
      "33 actions [1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0]\n",
      "   +2.6701 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   +0.3274 if cv>=-0.041355805844068526 & pav<=-0.36174283027648924\n",
      "   +1.1129 if cp<=0.02802856378257275 & cv>=0.2126500815153122 & pa<=-0.005887368880212307\n",
      "   -4.1000 if pa>=-0.1094664305448532 & pav>=-0.27426750659942617\n",
      "   +1.6413 if pa>=-0.10488967597484589\n",
      "--------------\n",
      "   -1.0986 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   +0.4520 if pav>=-0.2408460021018982\n",
      "   -1.0649 if cp<=0.02802856378257275 & cv>=0.2126500815153122 & pa<=-0.005887368880212307\n",
      "   +3.6456 if pav>=-0.27426750659942617\n",
      "   +0.8184 if pav>=-0.26558232307434076\n",
      "Run episode 561 with rewards 33.0\n",
      "============ 562 ===========\n",
      "59 actions [0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   +3.1253 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   +0.1024 if cp<=0.02802856378257275 & cv>=0.2126500815153122 & pa<=-0.005887368880212307\n",
      "   -3.6810 if pa>=-0.1094664305448532 & pav>=-0.27426750659942617\n",
      "   +2.2581 if pa>=-0.10488967597484589\n",
      "   +2.4137 if cp>=0.011136362329125404\n",
      "--------------\n",
      "   -1.8304 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   -0.1883 if cp<=0.02802856378257275 & cv>=0.2126500815153122 & pa<=-0.005887368880212307\n",
      "   +3.4867 if pav>=-0.27426750659942617\n",
      "   +0.9800 if pav>=-0.26558232307434076\n",
      "   -2.4137 if cp>=0.011136362329125404\n",
      "Run episode 562 with rewards 59.0\n",
      "============ 563 ===========\n",
      "36 actions [1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0]\n",
      "   +1.3711 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   -0.8284 if pa>=-0.1094664305448532 & pav>=-0.27426750659942617\n",
      "   +0.5427 if pa>=-0.10488967597484589\n",
      "   +0.5427 if cp>=0.011136362329125404\n",
      "   +1.7646 if pa<=0.03225466534495354 & pav<=0.4350323677062989\n",
      "--------------\n",
      "   -1.1306 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   -0.7303 if pav>=-0.27426750659942617\n",
      "   +2.4731 if pav>=-0.26558232307434076\n",
      "   -0.7792 if cp>=0.011136362329125404\n",
      "   +1.5632 if cv<=0.04004283994436264\n",
      "Run episode 563 with rewards 36.0\n",
      "============ 564 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +4.2915 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   -1.3578 if pa>=-0.1094664305448532 & pav>=-0.27426750659942617\n",
      "   +5.1043 if pa>=-0.10488967597484589\n",
      "   -1.7238 if pa<=0.03225466534495354 & pav<=0.4350323677062989\n",
      "   +4.0111 if cp>=-0.019218306988477707\n",
      "--------------\n",
      "   -2.4779 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   +1.6497 if pav>=-0.26558232307434076\n",
      "   -0.0000 if cp>=0.011136362329125404\n",
      "   +1.1625 if cv<=0.04004283994436264\n",
      "   -4.0506 if cp>=-0.019218306988477707\n",
      "Run episode 564 with rewards 8.0\n",
      "============ 565 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "  +16.2342 if pa>=-0.10488967597484589\n",
      "   -0.0000 if pa<=0.03225466534495354 & pav<=0.4350323677062989\n",
      "   +0.0000 if cp>=-0.019218306988477707\n",
      "   +2.7063 if pa>=0.17200110852718353\n",
      "--------------\n",
      "   +1.5089 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   -5.3558 if pav>=-0.26558232307434076\n",
      "   -5.6524 if cv<=0.04004283994436264\n",
      "   +3.4412 if cp>=-0.019218306988477707\n",
      "   +1.0000 if cp>=0.005575518868863587\n",
      "Run episode 565 with rewards 9.0\n",
      "============ 566 ===========\n",
      "15 actions [0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1]\n",
      "   +0.0000 if cv>=-0.02000867314636707 & pav<=-0.3105943083763122\n",
      "   +0.0583 if pa>=-0.10488967597484589\n",
      "   +0.0588 if cp>=-0.019218306988477707\n",
      "   -0.0003 if pa>=0.17200110852718353\n",
      "   +0.0607 if cp>=0.02774189785122872\n",
      "--------------\n",
      "   -0.0000 if cv>=0.06695899069309234 & pav>=-0.3681217074394225\n",
      "   -0.0000 if pav>=-0.26558232307434076\n",
      "   -0.0000 if cv<=0.04004283994436264\n",
      "   -0.0000 if cp>=-0.019218306988477707\n",
      "   +0.0000 if cp>=0.004842675593681636\n",
      "Run episode 566 with rewards 15.0\n",
      "============ 567 ===========\n",
      "14 actions [0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0]\n",
      "   +0.2783 if pa>=-0.10488967597484589\n",
      "   -1.4661 if cp>=-0.019218306988477707\n",
      "  +11.1409 if pa>=0.17200110852718353\n",
      "   -0.0033 if cp>=0.02774189785122872\n",
      "   +4.5802 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "--------------\n",
      "   -0.0197 if pav>=-0.26558232307434076\n",
      "   +0.3719 if cv<=0.04004283994436264\n",
      "   +1.1306 if cp>=-0.019218306988477707\n",
      "   -1.3952 if cp>=0.004842675593681636\n",
      "   -4.0903 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "Run episode 567 with rewards 14.0\n",
      "============ 568 ===========\n",
      "30 actions [0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   -0.6605 if pa>=-0.10488967597484589\n",
      "   -0.1238 if cp>=-0.019218306988477707\n",
      "  -10.1859 if pa>=0.17200110852718353\n",
      "   +1.9699 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "   +2.8501 if cp<=-0.010940019413828847 & cp>=-0.03653421625494956 & cv>=-0.5594245553016662\n",
      "--------------\n",
      "   +0.4159 if cv<=0.04004283994436264\n",
      "   +0.5998 if cp>=-0.019218306988477707\n",
      "   +0.0000 if cp>=0.004842675593681636\n",
      "   -1.6176 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "   -2.2463 if cp<=-0.010940019413828847 & cp>=-0.03653421625494956 & cv>=-0.5594245553016662\n",
      "Run episode 568 with rewards 30.0\n",
      "============ 569 ===========\n",
      "68 actions [0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -1.4383 if pa>=-0.10488967597484589\n",
      "  +10.5959 if pa>=0.17200110852718353\n",
      "   +5.2410 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "   +4.5382 if cp<=-0.010940019413828847 & cp>=-0.03653421625494956 & cv>=-0.5594245553016662\n",
      "   +3.9317 if cp<=-0.041837364435195916 & cv>=0.22540774047374726\n",
      "--------------\n",
      "   +1.1249 if cv<=0.04004283994436264\n",
      "   +3.0412 if cp>=-0.019218306988477707\n",
      "  -11.8132 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "  -10.6967 if cp<=-0.010940019413828847 & cp>=-0.03653421625494956 & cv>=-0.5594245553016662\n",
      "   -3.5390 if cp<=-0.041837364435195916 & cv>=0.22540774047374726\n",
      "Run episode 569 with rewards 68.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 570 ===========\n",
      "85 actions [0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1]\n",
      "  -12.5455 if pa>=0.17200110852718353\n",
      "   +0.1158 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "   -0.0190 if cp<=-0.010940019413828847 & cp>=-0.03653421625494956 & cv>=-0.5594245553016662\n",
      "   +2.0633 if cp<=-0.041837364435195916 & cv>=0.22540774047374726\n",
      "   -4.3337 if cp<=-0.039739470928907394 & pa<=0.05035664439201355 & pav>=0.0354054257273674\n",
      "--------------\n",
      "   +1.9098 if cp>=-0.019218306988477707\n",
      "   -3.0936 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "   -2.7134 if cp<=-0.010940019413828847 & cp>=-0.03653421625494956 & cv>=-0.5594245553016662\n",
      "   -2.7967 if cp<=-0.041837364435195916 & cv>=0.22540774047374726\n",
      "   -5.1797 if cp>=-0.039739470928907394 & pav<=-0.21197470128536225\n",
      "Run episode 570 with rewards 85.0\n",
      "============ 571 ===========\n",
      "27 actions [0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +13.1614 if pa>=0.17200110852718353\n",
      "   -1.4727 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "   +2.4197 if cp<=-0.041837364435195916 & cv>=0.22540774047374726\n",
      "   -3.8004 if cp<=-0.039739470928907394 & pa<=0.05035664439201355 & pav>=0.0354054257273674\n",
      "   +3.8549 if cp>=-0.0036632190458476543\n",
      "--------------\n",
      "   +0.7318 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "   -5.7358 if cp<=-0.010940019413828847 & cp>=-0.03653421625494956 & cv>=-0.5594245553016662\n",
      "   -3.0953 if cp<=-0.041837364435195916 & cv>=0.22540774047374726\n",
      "   -0.6547 if cp>=-0.039739470928907394 & pav<=-0.21197470128536225\n",
      "   -4.3211 if cp>=-0.0036632190458476543\n",
      "Run episode 571 with rewards 27.0\n",
      "============ 572 ===========\n",
      "25 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "  -13.7281 if pa>=0.17200110852718353\n",
      "   +0.6765 if cp<=-0.041837364435195916 & cv>=0.22540774047374726\n",
      "   -2.8260 if cp<=-0.039739470928907394 & pa<=0.05035664439201355 & pav>=0.0354054257273674\n",
      "   +0.9934 if cp>=-0.0036632190458476543\n",
      "   -3.6285 if cp<=-0.05380092412233352 & cv<=0.18991560339927674 & cv>=-0.5926045179367065\n",
      "--------------\n",
      "   -1.3094 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "   -0.0000 if cp<=-0.010940019413828847 & cp>=-0.03653421625494956 & cv>=-0.5594245553016662\n",
      "   -1.2528 if cp<=-0.041837364435195916 & cv>=0.22540774047374726\n",
      "   -1.3094 if cp>=-0.0036632190458476543\n",
      "   +4.0418 if cp<=-0.05380092412233352 & cv<=0.18991560339927674 & cv>=-0.5926045179367065\n",
      "Run episode 572 with rewards 25.0\n",
      "============ 573 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +0.4194 if pa>=0.17200110852718353\n",
      "   +0.0381 if cp<=-0.039739470928907394 & pa<=0.05035664439201355 & pav>=0.0354054257273674\n",
      "  +11.2962 if cp>=-0.0036632190458476543\n",
      "   -0.4237 if cp<=-0.05380092412233352 & cv<=0.18991560339927674 & cv>=-0.5926045179367065\n",
      "   -4.5630 if cp<=-0.033916291594505286\n",
      "--------------\n",
      "   -1.3538 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "   +0.0002 if cp<=-0.041837364435195916 & cv>=0.22540774047374726\n",
      "   -2.6785 if cp>=-0.0036632190458476543\n",
      "   +0.8922 if cp<=-0.05380092412233352 & cv<=0.18991560339927674 & cv>=-0.5926045179367065\n",
      "   +3.2587 if cv<=-0.4335327625274657 & pa>=0.08852021694183351 & pav>=1.0507852554321295\n",
      "Run episode 573 with rewards 10.0\n",
      "============ 574 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0]\n",
      "  +10.7923 if pa>=0.17200110852718353\n",
      "   +2.5685 if cp>=-0.0036632190458476543\n",
      "   +0.0963 if cp<=-0.05380092412233352 & cv<=0.18991560339927674 & cv>=-0.5926045179367065\n",
      "  +20.5980 if cp<=-0.033916291594505286\n",
      "   +1.0000 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "--------------\n",
      "   -3.8292 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "   -1.2105 if cp>=-0.0036632190458476543\n",
      "   +1.9775 if cp<=-0.05380092412233352 & cv<=0.18991560339927674 & cv>=-0.5926045179367065\n",
      "  -20.5966 if cv<=-0.4335327625274657 & pa>=0.08852021694183351 & pav>=1.0507852554321295\n",
      "   +3.4735 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "Run episode 574 with rewards 11.0\n",
      "============ 575 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 0]\n",
      "   -0.0000 if pa>=0.17200110852718353\n",
      "   +1.5406 if cp>=-0.0036632190458476543\n",
      "   -0.0000 if cp<=-0.033916291594505286\n",
      "   +0.0482 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   +0.0783 if cp>=0.042953673750162125\n",
      "--------------\n",
      "   -0.7020 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "   -0.0000 if cp<=-0.05380092412233352 & cv<=0.18991560339927674 & cv>=-0.5926045179367065\n",
      "   +0.0000 if cv<=-0.4335327625274657 & pa>=0.08852021694183351 & pav>=1.0507852554321295\n",
      "   -1.4039 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   -1.1839 if pa<=0.003502445761114359\n",
      "Run episode 575 with rewards 10.0\n",
      "============ 576 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.5713 if cp>=-0.0036632190458476543\n",
      "  +11.4746 if cp<=-0.033916291594505286\n",
      "   +0.8353 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   +0.0000 if cp>=0.042953673750162125\n",
      "   -0.0001 if pa>=0.20864398777484894\n",
      "--------------\n",
      "   -1.7964 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "   -6.2539 if cv<=-0.4335327625274657 & pa>=0.08852021694183351 & pav>=1.0507852554321295\n",
      "   -1.3429 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   +0.0000 if pa<=0.003502445761114359\n",
      "   +7.7265 if pa>=0.20864398777484894\n",
      "Run episode 576 with rewards 10.0\n",
      "============ 577 ===========\n",
      "13 actions [0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1]\n",
      "   -0.0001 if cp>=-0.0036632190458476543\n",
      "   +0.1190 if cp<=-0.033916291594505286\n",
      "   +1.9139 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   -0.0000 if pa>=0.20864398777484894\n",
      "  -13.8601 if cp<=-0.07418556362390519 & cp>=-0.11392632126808167\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.022162145376205422 & cv>=-0.5426541447639466\n",
      "   +0.0004 if cv<=-0.4335327625274657 & pa>=0.08852021694183351 & pav>=1.0507852554321295\n",
      "   -1.8581 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   -0.0000 if pa>=0.20864398777484894\n",
      "   -0.9504 if cp>=-0.03223344050347805\n",
      "Run episode 577 with rewards 13.0\n",
      "============ 578 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.2139 if cp>=-0.0036632190458476543\n",
      "  +15.7398 if cp<=-0.033916291594505286\n",
      "   +0.5002 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "  +14.6104 if cp<=-0.07418556362390519 & cp>=-0.11392632126808167\n",
      "   -1.5513 if cp>=0.03996407240629196\n",
      "--------------\n",
      "  -17.7715 if cv<=-0.4335327625274657 & pa>=0.08852021694183351 & pav>=1.0507852554321295\n",
      "   -0.8718 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   -0.0000 if pa>=0.20864398777484894\n",
      "   -1.6252 if cp>=-0.03223344050347805\n",
      "   +2.5373 if cp>=0.03996407240629196\n",
      "Run episode 578 with rewards 9.0\n",
      "============ 579 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   -0.0000 if cp<=-0.033916291594505286\n",
      "   +0.0791 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   -0.0000 if cp<=-0.07418556362390519 & cp>=-0.11392632126808167\n",
      "   -0.0000 if cp>=0.03996407240629196\n",
      "   +1.6431 if \n",
      "--------------\n",
      "  +21.2681 if cv<=-0.4335327625274657 & pa>=0.08852021694183351 & pav>=1.0507852554321295\n",
      "   -0.1946 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   -2.6023 if cp>=-0.03223344050347805\n",
      "   -0.0000 if cp>=0.03996407240629196\n",
      "   +0.0021 if pa>=0.1921793818473816\n",
      "Run episode 579 with rewards 10.0\n",
      "============ 580 ===========\n",
      "27 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0]\n",
      "   -9.7835 if cp<=-0.033916291594505286\n",
      "   -4.3727 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   +0.0000 if cp<=-0.07418556362390519 & cp>=-0.11392632126808167\n",
      "   -1.1168 if \n",
      "   -5.9139 if cp<=-0.013012574333697555 & cp>=-0.05174998044967651\n",
      "--------------\n",
      "  -14.1970 if cv<=-0.4335327625274657 & pa>=0.08852021694183351 & pav>=1.0507852554321295\n",
      "   +0.7442 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   -4.7080 if cp>=-0.03223344050347805\n",
      "   +0.0011 if pa>=0.1921793818473816\n",
      "   +1.0000 if cp>=-0.05174998044967651\n",
      "Run episode 580 with rewards 27.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 581 ===========\n",
      "14 actions [0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +9.6863 if cp<=-0.033916291594505286\n",
      "   -7.4325 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   +1.5285 if \n",
      "   -2.1372 if cp<=-0.013012574333697555 & cp>=-0.05174998044967651\n",
      "   +1.0000 if cp>=-0.00372941382229328 & pa>=0.05506619811058046\n",
      "--------------\n",
      "  +15.5941 if cv<=-0.4335327625274657 & pa>=0.08852021694183351 & pav>=1.0507852554321295\n",
      "   +1.8229 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   -1.2802 if cp>=-0.03223344050347805\n",
      "   -4.6707 if cp>=-0.05174998044967651\n",
      "   +1.2298 if \n",
      "Run episode 581 with rewards 14.0\n",
      "============ 582 ===========\n",
      "71 actions [0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +1.0391 if cp<=-0.033916291594505286\n",
      "   -2.1127 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   -2.9323 if \n",
      "   +0.6431 if cp<=-0.013012574333697555 & cp>=-0.05174998044967651\n",
      "   +3.2559 if cp>=-0.04988920390605926 & cv>=-0.542587673664093\n",
      "--------------\n",
      "  -11.0829 if cv<=-0.4335327625274657 & pa>=0.08852021694183351 & pav>=1.0507852554321295\n",
      "   +1.0949 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   -0.0069 if cp>=-0.03223344050347805\n",
      "   -2.6583 if cp>=-0.05174998044967651\n",
      "   -0.1254 if pa>=0.2072620987892151\n",
      "Run episode 582 with rewards 71.0\n",
      "============ 583 ===========\n",
      "10 actions [0, 1, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.6959 if cp<=-0.033916291594505286\n",
      "   -0.5080 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   -3.2905 if \n",
      "   +3.0565 if cp>=-0.04988920390605926 & cv>=-0.542587673664093\n",
      "   +5.7831 if pa>=0.06379622966051102\n",
      "--------------\n",
      "   +0.0000 if cv<=-0.4335327625274657 & pa>=0.08852021694183351 & pav>=1.0507852554321295\n",
      "   -0.2065 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   -2.1024 if cp>=-0.05174998044967651\n",
      "   +0.0000 if pa>=0.2072620987892151\n",
      "   -5.1936 if pa>=0.06379622966051102\n",
      "Run episode 583 with rewards 10.0\n",
      "============ 584 ===========\n",
      "20 actions [1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -4.0506 if cp<=-0.033916291594505286\n",
      "   -2.3543 if \n",
      "   +0.7008 if cp>=-0.04988920390605926 & cv>=-0.542587673664093\n",
      "  -15.4418 if pa>=0.06379622966051102\n",
      "   +0.9084 if cp>=-0.011331777088344097\n",
      "--------------\n",
      "  +13.3407 if cv<=-0.4335327625274657 & pa>=0.08852021694183351 & pav>=1.0507852554321295\n",
      "   -3.2567 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   +0.5482 if cp>=-0.05174998044967651\n",
      "  +17.1883 if pa>=0.06379622966051102\n",
      "   +1.0000 if cp>=-0.011331777088344097\n",
      "Run episode 584 with rewards 20.0\n",
      "============ 585 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.3418 if cp<=-0.033916291594505286\n",
      "   +0.2153 if \n",
      "   -0.0000 if pa>=0.06379622966051102\n",
      "   -1.8338 if cp>=-0.011331777088344097\n",
      "   -2.4673 if pav>=0.2577446699142456\n",
      "--------------\n",
      "   +0.0000 if cv<=-0.4335327625274657 & pa>=0.08852021694183351 & pav>=1.0507852554321295\n",
      "   -4.1366 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   +0.0000 if pa>=0.06379622966051102\n",
      "   +3.2860 if cp>=-0.011331777088344097\n",
      "   +2.4780 if pav>=0.2577446699142456\n",
      "Run episode 585 with rewards 10.0\n",
      "============ 586 ===========\n",
      "56 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.0484 if cp<=-0.033916291594505286\n",
      "  +11.4219 if \n",
      "   +9.9455 if cp>=-0.011331777088344097\n",
      "   -2.2506 if pav>=0.2577446699142456\n",
      "  -19.7263 if cp<=0.0767821028828621\n",
      "--------------\n",
      "   -0.0023 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   -0.0000 if pa>=0.06379622966051102\n",
      "  -13.5292 if cp>=-0.011331777088344097\n",
      "   -0.0014 if pav>=0.2577446699142456\n",
      "   -6.9567 if cp>=0.0767821028828621\n",
      "Run episode 586 with rewards 56.0\n",
      "============ 587 ===========\n",
      "10 actions [1, 1, 1, 1, 0, 0, 1, 1, 0, 0]\n",
      "   -1.0880 if cp<=-0.033916291594505286\n",
      "   -2.8845 if \n",
      "   +0.4090 if cp>=-0.011331777088344097\n",
      "   -2.8845 if cp<=0.0767821028828621\n",
      "   -0.0855 if pav>=1.7523624897003174\n",
      "--------------\n",
      "   -0.3934 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   -4.1798 if cp>=-0.011331777088344097\n",
      "   -1.9696 if pav>=0.2577446699142456\n",
      "   -0.0000 if cp>=0.0767821028828621\n",
      "   -0.5237 if cp>=0.036732133477926254\n",
      "Run episode 587 with rewards 10.0\n",
      "============ 588 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.4865 if cp<=-0.033916291594505286\n",
      "  -14.6048 if \n",
      "  -15.7118 if cp>=-0.011331777088344097\n",
      "  -10.3037 if cp<=0.0767821028828621\n",
      "   +1.0000 if cp<=0.0550732895731926\n",
      "--------------\n",
      "   +0.3288 if cp<=0.0020757289603352564 & cp>=-0.03833828717470169\n",
      "   +7.7670 if cp>=-0.011331777088344097\n",
      "   +1.6465 if pav>=0.2577446699142456\n",
      "   +4.8959 if cp>=0.036732133477926254\n",
      "   +1.0000 if cp>=0.07222969830036163\n",
      "Run episode 588 with rewards 8.0\n",
      "============ 589 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +14.6048 if \n",
      "  +15.7118 if cp>=-0.011331777088344097\n",
      "  +10.3037 if cp<=0.0767821028828621\n",
      "   +1.0000 if cp<=0.0550732895731926\n",
      "   +1.0000 if cp>=0.11354677379131317\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.011331777088344097\n",
      "   -0.0000 if pav>=0.2577446699142456\n",
      "   -0.0000 if cp>=0.036732133477926254\n",
      "   -0.0000 if cp>=0.07222969830036163\n",
      "   +0.0000 if cp>=0.11354677379131317\n",
      "Run episode 589 with rewards 10.0\n",
      "origin -3.848782191514869e-06 new -3.848782191514866e-06 not updated\n",
      "============ 590 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +1.4862 if \n",
      "   -0.0000 if cp>=-0.011331777088344097\n",
      "   +1.4862 if cp<=0.0767821028828621\n",
      "   -0.0000 if cp>=0.11354677379131317\n",
      "  -21.5334 if cp<=-0.04881117790937423\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.011331777088344097\n",
      "   -0.0000 if pav>=0.2577446699142456\n",
      "   -0.0000 if cp>=0.036732133477926254\n",
      "   -0.0000 if cp>=0.07222969830036163\n",
      "   +0.0000 if cp>=0.11354677379131317\n",
      "Run episode 590 with rewards 9.0\n",
      "============ 591 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 1, 0, 0, 0]\n",
      "   +2.1882 if \n",
      "   +0.0813 if cp>=-0.011331777088344097\n",
      "   +2.1882 if cp<=0.0767821028828621\n",
      "  +21.4442 if cp<=-0.04881117790937423\n",
      "   +1.0000 if cp>=-0.028749344870448112\n",
      "--------------\n",
      "  -14.1166 if cp>=-0.011331777088344097\n",
      "   +8.7283 if pav>=0.2577446699142456\n",
      "   -0.0000 if cp>=0.036732133477926254\n",
      "   -0.0000 if cp>=0.07222969830036163\n",
      "   +8.0364 if \n",
      "Run episode 591 with rewards 10.0\n",
      "============ 592 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   +0.0536 if \n",
      "   +0.0536 if cp<=0.0767821028828621\n",
      "  -18.6476 if cp<=-0.04881117790937423\n",
      "  +15.1763 if cp>=-0.028749344870448112\n",
      "   +1.0000 if cp>=0.00921128168702126\n",
      "--------------\n",
      "   +0.0739 if cp>=-0.011331777088344097\n",
      "   -4.1346 if pav>=0.2577446699142456\n",
      "   +0.0000 if cp>=0.036732133477926254\n",
      "   -5.2627 if \n",
      "   -0.8395 if cp<=-0.018578514643013477 & cp>=-0.057321013510227205\n",
      "Run episode 592 with rewards 9.0\n",
      "============ 593 ===========\n",
      "22 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0536 if \n",
      "  +18.6476 if cp<=-0.04881117790937423\n",
      "  +15.1763 if cp>=-0.028749344870448112\n",
      "   +1.0000 if cp>=0.00921128168702126\n",
      "   +1.0000 if pa>=0.18600794672966003\n",
      "--------------\n",
      "   -0.0140 if cp>=-0.011331777088344097\n",
      "   +3.9737 if pav>=0.2577446699142456\n",
      "   +3.9736 if \n",
      "   +3.9884 if cp<=-0.018578514643013477 & cp>=-0.057321013510227205\n",
      "   -0.0000 if pav>=1.8144909143447876\n",
      "Run episode 593 with rewards 22.0\n",
      "============ 594 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "  -13.8002 if cp<=-0.04881117790937423\n",
      "  +16.9784 if cp>=-0.028749344870448112\n",
      "   +6.6738 if cp>=0.00921128168702126\n",
      "   -0.6204 if pa>=0.18600794672966003\n",
      "   +1.0000 if cp<=-0.09129744172096252\n",
      "--------------\n",
      "   -0.0003 if cp>=-0.011331777088344097\n",
      "   +0.0912 if pav>=0.2577446699142456\n",
      "   +2.2608 if \n",
      "   +2.2611 if cp<=-0.018578514643013477 & cp>=-0.057321013510227205\n",
      "   -0.0008 if cv>=0.8129658699035645\n",
      "Run episode 594 with rewards 10.0\n",
      "============ 595 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +18.1933 if cp<=-0.04881117790937423\n",
      "   +6.6015 if cp>=-0.028749344870448112\n",
      "   +2.5537 if cp>=0.00921128168702126\n",
      "   +0.3826 if cp<=-0.09129744172096252\n",
      "   +1.0000 if cp<=-0.06961396634578705\n",
      "--------------\n",
      "   -0.9325 if pav>=0.2577446699142456\n",
      "   -0.9325 if \n",
      "   -0.9324 if cp<=-0.018578514643013477 & cp>=-0.057321013510227205\n",
      "   +0.0000 if cv>=0.8129658699035645\n",
      "   -0.9323 if pav>=1.5699787139892578\n",
      "Run episode 595 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 596 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "  -14.0414 if cp<=-0.04881117790937423\n",
      "   +9.5516 if cp>=-0.028749344870448112\n",
      "   -1.2667 if cp>=0.00921128168702126\n",
      "   -5.3961 if cp<=-0.06961396634578705\n",
      "   +0.8399 if cp<=-0.10919667482376098\n",
      "--------------\n",
      "   -0.8646 if pav>=0.2577446699142456\n",
      "   -0.8849 if \n",
      "   -0.8646 if cp<=-0.018578514643013477 & cp>=-0.057321013510227205\n",
      "   +0.0000 if pav>=1.5699787139892578\n",
      "   -0.2393 if cp<=-0.03702923282980918 & cp>=-0.06685886830091477\n",
      "Run episode 596 with rewards 11.0\n",
      "============ 597 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +14.0414 if cp<=-0.04881117790937423\n",
      "   +9.5516 if cp>=-0.028749344870448112\n",
      "   +1.2667 if cp>=0.00921128168702126\n",
      "   +5.3961 if cp<=-0.06961396634578705\n",
      "   +1.0000 if pa>=0.20194284617900848\n",
      "--------------\n",
      "   -0.0089 if pav>=0.2577446699142456\n",
      "   -0.0191 if \n",
      "   +0.0002 if cp<=-0.018578514643013477 & cp>=-0.057321013510227205\n",
      "   -0.0000 if cp<=-0.03702923282980918 & cp>=-0.06685886830091477\n",
      "   -0.0191 if pa<=0.011036650277674198\n",
      "Run episode 597 with rewards 9.0\n",
      "============ 598 ===========\n",
      "12 actions [1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0]\n",
      "  -13.4233 if cp<=-0.04881117790937423\n",
      "   -2.2916 if cp>=-0.028749344870448112\n",
      "   +5.6942 if cp>=0.00921128168702126\n",
      "   -7.0946 if cp<=-0.06961396634578705\n",
      "   +1.0000 if pa>=0.16529636085033417\n",
      "--------------\n",
      "   +8.1908 if pav>=0.2577446699142456\n",
      "   +8.5095 if \n",
      "  +15.4566 if cp<=-0.018578514643013477 & cp>=-0.057321013510227205\n",
      "   -7.1311 if pa<=0.011036650277674198\n",
      "   +0.1011 if cp>=0.017941806837916383\n",
      "Run episode 598 with rewards 12.0\n",
      "============ 599 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp<=-0.04881117790937423\n",
      "   +3.9173 if cp>=-0.028749344870448112\n",
      "   +5.5866 if cp>=0.00921128168702126\n",
      "   +0.0000 if cp<=-0.06961396634578705\n",
      "   -1.7262 if cv>=0.7858353853225708\n",
      "--------------\n",
      "   +7.0931 if pav>=0.2577446699142456\n",
      "  +13.4650 if \n",
      "  +13.3851 if cp<=-0.018578514643013477 & cp>=-0.057321013510227205\n",
      "  +12.2713 if pa<=0.011036650277674198\n",
      "   +1.0000 if cp>=0.06663096696138383\n",
      "Run episode 599 with rewards 10.0\n",
      "============ 600 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=-0.04881117790937423\n",
      "   -0.0001 if cp>=-0.028749344870448112\n",
      "   +0.0000 if cp>=0.00921128168702126\n",
      "   +0.0000 if cv>=0.7858353853225708\n",
      "   -0.0001 if cp<=-0.0029577041044831272\n",
      "--------------\n",
      "   -3.3449 if pav>=0.2577446699142456\n",
      "   -6.2208 if \n",
      "   -6.3119 if cp<=-0.018578514643013477 & cp>=-0.057321013510227205\n",
      "   -6.9572 if pa<=0.011036650277674198\n",
      "   +1.3946 if cp<=0.08626990467309953\n",
      "Run episode 600 with rewards 10.0\n",
      "============ 601 ===========\n",
      "247 actions [0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0]\n",
      "   +0.0002 if cp>=-0.028749344870448112\n",
      "   -0.0000 if cp>=0.00921128168702126\n",
      "   -0.0000 if cv>=0.7858353853225708\n",
      "   -0.0135 if cp<=-0.0029577041044831272\n",
      "   -0.0105 if cp<=-0.08050460070371628\n",
      "--------------\n",
      "  +11.0443 if pav>=0.2577446699142456\n",
      "   +7.4143 if \n",
      "   +4.3190 if cp<=-0.018578514643013477 & cp>=-0.057321013510227205\n",
      "  -17.4435 if pa<=0.011036650277674198\n",
      "   -0.8711 if cp>=-0.014207053184509273\n",
      "Run episode 601 with rewards 247.0\n",
      "best\n",
      "origin 3035.6630961132555 new 103137.17834671549 not updated\n",
      "============ 602 ===========\n",
      "269 actions [0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0]\n",
      "   +0.9031 if cp>=-0.028749344870448112\n",
      "   -0.5590 if cp>=0.00921128168702126\n",
      "   +1.3876 if cp<=-0.0029577041044831272\n",
      "   -0.7552 if cp<=-0.08050460070371628\n",
      "   -3.7708 if pav>=1.5328729152679443\n",
      "--------------\n",
      "  +11.0443 if pav>=0.2577446699142456\n",
      "   +7.4143 if \n",
      "   +4.3190 if cp<=-0.018578514643013477 & cp>=-0.057321013510227205\n",
      "  -17.4435 if pa<=0.011036650277674198\n",
      "   -0.8711 if cp>=-0.014207053184509273\n",
      "Run episode 602 with rewards 269.0\n",
      "best\n",
      "============ 603 ===========\n",
      "223 actions [0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   -2.5881 if cp>=-0.028749344870448112\n",
      "   -0.0940 if cp<=-0.0029577041044831272\n",
      "   +1.2143 if cp<=-0.08050460070371628\n",
      "   -0.0002 if pav>=1.5328729152679443\n",
      "   -5.4173 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "--------------\n",
      "   +8.1653 if pav>=0.2577446699142456\n",
      "   +5.3391 if \n",
      "   +3.8424 if cp<=-0.018578514643013477 & cp>=-0.057321013510227205\n",
      "  -12.8391 if pa<=0.011036650277674198\n",
      "   +2.4693 if cp>=-0.11598589867353437 & pa<=-0.0016309547238051757 & pa>=-0.05938097015023232 & pav>=0.2316213786602021\n",
      "Run episode 603 with rewards 223.0\n",
      "============ 604 ===========\n",
      "140 actions [0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   -0.0001 if cp>=-0.028749344870448112\n",
      "   +2.4671 if cp<=-0.0029577041044831272\n",
      "   -1.1004 if cp<=-0.08050460070371628\n",
      "   -6.8476 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -4.6007 if cv>=-0.418967068195343 & pa>=0.0066844535060227 & pav>=0.2437113732099534\n",
      "--------------\n",
      "   +7.1016 if pav>=0.2577446699142456\n",
      "   +7.2722 if \n",
      "   +2.3293 if cp<=-0.018578514643013477 & cp>=-0.057321013510227205\n",
      "  -13.8966 if pa<=0.011036650277674198\n",
      "   +4.6528 if cp>=-0.12154064178466796 & pa<=-0.0563332751393318 & pav>=0.2437113732099534\n",
      "Run episode 604 with rewards 140.0\n",
      "============ 605 ===========\n",
      "175 actions [0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +5.1542 if cp<=-0.0029577041044831272\n",
      "   +0.9112 if cp<=-0.08050460070371628\n",
      "   -7.3815 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -0.1051 if cv>=-0.418967068195343 & pa>=0.0066844535060227 & pav>=0.2437113732099534\n",
      "   -2.5903 if cp<=0.0019565606024116314\n",
      "--------------\n",
      "   +6.0129 if pav>=0.2577446699142456\n",
      "   +7.6396 if \n",
      "  -13.4834 if pa<=0.011036650277674198\n",
      "   +5.1310 if cp>=-0.12154064178466796 & pa<=-0.0563332751393318 & pav>=0.2437113732099534\n",
      "   +6.4580 if cp<=0.0019565606024116314 & cp>=-0.07492737025022506 & cv<=-0.520794677734375 & pa<=-0.02263965867459774\n",
      "Run episode 605 with rewards 175.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 606 ===========\n",
      "452 actions [0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +4.8669 if cp<=-0.0029577041044831272\n",
      "   -4.7793 if cp<=-0.08050460070371628\n",
      "   -9.9810 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -2.9385 if cp<=0.0019565606024116314\n",
      "   +4.5109 if cp<=-0.05403863117098805\n",
      "--------------\n",
      "   +6.9600 if pav>=0.2577446699142456\n",
      "   +6.3257 if \n",
      "  -12.2189 if pa<=0.011036650277674198\n",
      "   +5.1359 if cp<=0.0019565606024116314 & cp>=-0.07492737025022506 & cv<=-0.520794677734375 & pa<=-0.02263965867459774\n",
      "   +5.3993 if cp>=-0.20653745532035828 & pa<=-0.02592739388346672 & pa<=-0.053775882720947264 & pav>=0.24917209744453445\n",
      "Run episode 606 with rewards 452.0\n",
      "best\n",
      "============ 607 ===========\n",
      "151 actions [0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.9184 if cp<=-0.0029577041044831272\n",
      "   -3.7388 if cp<=-0.08050460070371628\n",
      "   -9.0058 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   +3.8094 if cp<=-0.05403863117098805\n",
      "   -2.2105 if cp<=-0.012420541420578947\n",
      "--------------\n",
      "   +8.6953 if pav>=0.2577446699142456\n",
      "   +6.3086 if \n",
      "  -13.8903 if pa<=0.011036650277674198\n",
      "   +5.4438 if cp>=-0.20653745532035828 & pa<=-0.02592739388346672 & pa<=-0.053775882720947264 & pav>=0.24917209744453445\n",
      "   -1.2302 if cp>=-0.012420541420578947 & cv<=-0.3174127876758575 & pa<=0.0061044441536069055 & pa>=-0.039529354125261304 & pav<=0.49739250540733343\n",
      "Run episode 607 with rewards 151.0\n",
      "============ 608 ===========\n",
      "155 actions [0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   +2.4508 if cp<=-0.0029577041044831272\n",
      "   -1.3629 if cp<=-0.08050460070371628\n",
      "   -7.5330 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   +1.0332 if cp<=-0.05403863117098805\n",
      "   +2.6168 if cp<=-0.13908900320529932 & pa<=0.010749897919595252 & pa>=-0.06748585402965546 & pav>=0.26811635494232183\n",
      "--------------\n",
      "   +4.0963 if pav>=0.2577446699142456\n",
      "   +6.9006 if \n",
      "  -11.3198 if pa<=0.011036650277674198\n",
      "   +7.0183 if cp>=-0.20653745532035828 & pa<=-0.02592739388346672 & pa<=-0.053775882720947264 & pav>=0.24917209744453445\n",
      "   +2.8139 if cp<=-0.07306573539972305 & cp>=-0.13908900320529932 & cv<=-0.38189953565597534 & pa<=0.010749897919595252 & pa>=-0.026697134599089622 & pav<=0.5790603756904602\n",
      "Run episode 608 with rewards 155.0\n",
      "============ 609 ===========\n",
      "241 actions [0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -1.7427 if cp<=-0.0029577041044831272\n",
      "   -2.6229 if cp<=-0.08050460070371628\n",
      "   -8.8895 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   +4.2873 if cp<=-0.13908900320529932 & pa<=0.010749897919595252 & pa>=-0.06748585402965546 & pav>=0.26811635494232183\n",
      "   +3.8408 if \n",
      "--------------\n",
      "   +4.2189 if pav>=0.2577446699142456\n",
      "   +8.3321 if \n",
      "  -10.8875 if pa<=0.011036650277674198\n",
      "   +5.6157 if cp>=-0.20653745532035828 & pa<=-0.02592739388346672 & pa<=-0.053775882720947264 & pav>=0.24917209744453445\n",
      "   -6.0597 if cp>=-0.04622268751263618 & cv<=-0.23819604516029358 & pa<=-0.029148938506841658\n",
      "Run episode 609 with rewards 241.0\n",
      "origin 3190.968686574325 new 3246.092494846054 not updated\n",
      "============ 610 ===========\n",
      "41 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   -2.0220 if cp<=-0.08050460070371628\n",
      "   -6.3796 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   +3.0269 if cp<=-0.13908900320529932 & pa<=0.010749897919595252 & pa>=-0.06748585402965546 & pav>=0.26811635494232183\n",
      "   +1.6212 if \n",
      "   +3.3046 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "--------------\n",
      "   +4.2189 if pav>=0.2577446699142456\n",
      "   +8.3321 if \n",
      "  -10.8875 if pa<=0.011036650277674198\n",
      "   +5.6157 if cp>=-0.20653745532035828 & pa<=-0.02592739388346672 & pa<=-0.053775882720947264 & pav>=0.24917209744453445\n",
      "   -6.0597 if cp>=-0.04622268751263618 & cv<=-0.23819604516029358 & pa<=-0.029148938506841658\n",
      "Run episode 610 with rewards 41.0\n",
      "origin 21.221545361521002 new 27.601355708836852 not updated\n",
      "============ 611 ===========\n",
      "136 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.0220 if cp<=-0.08050460070371628\n",
      "   -6.3796 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   +3.0269 if cp<=-0.13908900320529932 & pa<=0.010749897919595252 & pa>=-0.06748585402965546 & pav>=0.26811635494232183\n",
      "   +1.6212 if \n",
      "   +3.3046 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "--------------\n",
      "   +4.1336 if \n",
      "   -6.5182 if pa<=0.011036650277674198\n",
      "   -0.0162 if cp>=-0.20653745532035828 & pa<=-0.02592739388346672 & pa<=-0.053775882720947264 & pav>=0.24917209744453445\n",
      "   -0.8050 if cp>=-0.04622268751263618 & cv<=-0.23819604516029358 & pa<=-0.029148938506841658\n",
      "   +4.0836 if pav>=1.5938622951507568\n",
      "Run episode 611 with rewards 136.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 612 ===========\n",
      "145 actions [0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0641 if cp<=-0.08050460070371628\n",
      "   -9.4373 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   +0.2139 if cp<=-0.13908900320529932 & pa<=0.010749897919595252 & pa>=-0.06748585402965546 & pav>=0.26811635494232183\n",
      "   -2.5970 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "   +2.4999 if cp>=-0.34773147106170654 & pa<=0.015125785022974023 & pav<=0.9842319488525391\n",
      "--------------\n",
      "   +9.5074 if \n",
      "  -10.4283 if pa<=0.011036650277674198\n",
      "   -0.7043 if cp>=-0.04622268751263618 & cv<=-0.23819604516029358 & pa<=-0.029148938506841658\n",
      "   +9.1221 if pav>=1.5938622951507568\n",
      "   -3.3952 if cp<=-0.06501882523298264\n",
      "Run episode 612 with rewards 145.0\n",
      "============ 613 ===========\n",
      "153 actions [0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "  -11.1085 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   +0.1459 if cp<=-0.13908900320529932 & pa<=0.010749897919595252 & pa>=-0.06748585402965546 & pav>=0.26811635494232183\n",
      "   -3.0727 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "   +3.9989 if cp>=-0.34773147106170654 & pa<=0.015125785022974023 & pav<=0.9842319488525391\n",
      "   -4.1334 if cp>=0.013323076441884043 & cv<=-0.5264392495155334 & pa<=-0.025479671731591224 & pav>=0.5752061486244202\n",
      "--------------\n",
      "   +6.8652 if \n",
      "   -6.1408 if pa<=0.011036650277674198\n",
      "   +5.3151 if pav>=1.5938622951507568\n",
      "   -3.7312 if cp<=-0.06501882523298264\n",
      "   -4.6917 if pa<=0.006895773485302927 & pav<=0.5752061486244202\n",
      "Run episode 613 with rewards 153.0\n",
      "origin 255.2197404471041 new 389.5090384441992 not updated\n",
      "============ 614 ===========\n",
      "335 actions [1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  -12.3789 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -3.6027 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "   +4.5561 if cp>=-0.34773147106170654 & pa<=0.015125785022974023 & pav<=0.9842319488525391\n",
      "   +0.0000 if cp>=0.013323076441884043 & cv<=-0.5264392495155334 & pa<=-0.025479671731591224 & pav>=0.5752061486244202\n",
      "   -4.0378 if cp<=-0.018750508129596707 & cp>=-0.05391428917646408 & pa<=-0.03618420511484146\n",
      "--------------\n",
      "   +6.8652 if \n",
      "   -6.1408 if pa<=0.011036650277674198\n",
      "   +5.3151 if pav>=1.5938622951507568\n",
      "   -3.7312 if cp<=-0.06501882523298264\n",
      "   -4.6917 if pa<=0.006895773485302927 & pav<=0.5752061486244202\n",
      "Run episode 614 with rewards 335.0\n",
      "origin 1146.1622877106306 new 1608.5664537344953 not updated\n",
      "============ 615 ===========\n",
      "211 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "  -14.3945 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -3.8071 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "   +4.7379 if cp>=-0.34773147106170654 & pa<=0.015125785022974023 & pav<=0.9842319488525391\n",
      "   -2.4416 if cp<=-0.018750508129596707 & cp>=-0.05391428917646408 & pa<=-0.03618420511484146\n",
      "   -5.9474 if cp<=-0.01972345411777486 & cp>=-0.17122833132743845 & cv<=-0.199380362033844 & cv>=-0.5796834707260132 & pa<=-0.06028790920972825 & pav>=0.25968048572540287\n",
      "--------------\n",
      "   +6.8652 if \n",
      "   -6.1408 if pa<=0.011036650277674198\n",
      "   +5.3151 if pav>=1.5938622951507568\n",
      "   -3.7312 if cp<=-0.06501882523298264\n",
      "   -4.6917 if pa<=0.006895773485302927 & pav<=0.5752061486244202\n",
      "Run episode 615 with rewards 211.0\n",
      "============ 616 ===========\n",
      "55 actions [0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "  -12.0922 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -3.9348 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "   +3.6361 if cp>=-0.34773147106170654 & pa<=0.015125785022974023 & pav<=0.9842319488525391\n",
      "   -5.6888 if cp<=-0.01972345411777486 & cp>=-0.17122833132743845 & cv<=-0.199380362033844 & cv>=-0.5796834707260132 & pa<=-0.06028790920972825 & pav>=0.25968048572540287\n",
      "   +6.4981 if cp<=-0.09334824234247208 & cp<=-0.1463204175233841 & cp>=-0.1463204175233841 & cv<=0.04618395492434503 & cv>=-0.33552390336990356\n",
      "--------------\n",
      "   +2.8174 if \n",
      "   -5.4526 if pa<=0.011036650277674198\n",
      "   +0.9805 if pav>=1.5938622951507568\n",
      "   -5.1097 if pa<=0.006895773485302927 & pav<=0.5752061486244202\n",
      "   +1.5779 if pa<=0.014621011912822751\n",
      "Run episode 616 with rewards 55.0\n",
      "============ 617 ===========\n",
      "289 actions [0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   -8.7218 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -0.2217 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "   +0.0000 if cp<=-0.01972345411777486 & cp>=-0.17122833132743845 & cv<=-0.199380362033844 & cv>=-0.5796834707260132 & pa<=-0.06028790920972825 & pav>=0.25968048572540287\n",
      "   +0.0000 if cp<=-0.09334824234247208 & cp<=-0.1463204175233841 & cp>=-0.1463204175233841 & cv<=0.04618395492434503 & cv>=-0.33552390336990356\n",
      "   -4.0121 if cp>=-0.03998597860336304 & cv<=-0.59386066198349 & pa<=-0.03407704457640647\n",
      "--------------\n",
      "   +2.4228 if \n",
      "   +1.5682 if pa<=0.011036650277674198\n",
      "   -4.9150 if pa<=0.006895773485302927 & pav<=0.5752061486244202\n",
      "   +1.5707 if pa<=0.014621011912822751\n",
      "   -5.5797 if pa<=0.00662959311157465\n",
      "Run episode 617 with rewards 289.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 618 ===========\n",
      "182 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -9.4326 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -0.2467 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "   +0.0000 if cp<=-0.09334824234247208 & cp<=-0.1463204175233841 & cp>=-0.1463204175233841 & cv<=0.04618395492434503 & cv>=-0.33552390336990356\n",
      "   -4.5859 if cp>=-0.03998597860336304 & cv<=-0.59386066198349 & pa<=-0.03407704457640647\n",
      "   -2.3913 if cp<=0.04635245129466057 & cp>=-1.2734074354171754 & pa<=-0.032383657246828075 & pav>=0.6297808408737183\n",
      "--------------\n",
      "   +2.9611 if \n",
      "   -3.9065 if pa<=0.006895773485302927 & pav<=0.5752061486244202\n",
      "   +5.0436 if pa<=0.014621011912822751\n",
      "   -7.0555 if pa<=0.00662959311157465\n",
      "   -1.5976 if pa<=0.029334025457501415 & pav<=0.6297808408737183\n",
      "Run episode 618 with rewards 182.0\n",
      "============ 619 ===========\n",
      "417 actions [0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0]\n",
      "   -9.3735 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   +2.7320 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "   -0.0000 if cp>=-0.03998597860336304 & cv<=-0.59386066198349 & pa<=-0.03407704457640647\n",
      "   -5.8778 if cp<=0.04635245129466057 & cp>=-1.2734074354171754 & pa<=-0.032383657246828075 & pav>=0.6297808408737183\n",
      "   -5.0227 if cp<=-0.02619173526763916 & cp>=-0.2101022720336914 & cv<=0.030156206339597712 & cv>=-0.5122064769268031 & pa>=0.007871035486459744\n",
      "--------------\n",
      "   +2.0006 if \n",
      "   -2.9527 if pa<=0.006895773485302927 & pav<=0.5752061486244202\n",
      "   +3.6423 if pa<=0.014621011912822751\n",
      "   -6.3851 if pa<=0.00662959311157465\n",
      "   -2.6396 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "Run episode 619 with rewards 417.0\n",
      "============ 620 ===========\n",
      "89 actions [0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "  -10.0555 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   +4.0379 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "   -7.0302 if cp<=0.04635245129466057 & cp>=-1.2734074354171754 & pa<=-0.032383657246828075 & pav>=0.6297808408737183\n",
      "   -5.5171 if cp<=-0.02619173526763916 & cp>=-0.2101022720336914 & cv<=0.030156206339597712 & cv>=-0.5122064769268031 & pa>=0.007871035486459744\n",
      "   +0.5961 if cp>=-0.7835829854011536 & pa<=0.036352673172950746\n",
      "--------------\n",
      "   -3.2146 if pa<=0.006895773485302927 & pav<=0.5752061486244202\n",
      "   +1.7692 if pa<=0.014621011912822751\n",
      "   -5.0880 if pa<=0.00662959311157465\n",
      "   -3.3888 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   +2.0051 if \n",
      "Run episode 620 with rewards 89.0\n",
      "============ 621 ===========\n",
      "75 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   -5.7968 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   +2.7092 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "   +0.0000 if cp<=0.04635245129466057 & cp>=-1.2734074354171754 & pa<=-0.032383657246828075 & pav>=0.6297808408737183\n",
      "   +0.0000 if cp<=-0.02619173526763916 & cp>=-0.2101022720336914 & cv<=0.030156206339597712 & cv>=-0.5122064769268031 & pa>=0.007871035486459744\n",
      "   +1.7643 if cp<=0.0496792197227478 & cv>=0.0012940536485984934 & pav<=-0.04089766442775719 & pav>=-0.42539845705032336\n",
      "--------------\n",
      "   -3.5496 if pa<=0.006895773485302927 & pav<=0.5752061486244202\n",
      "   -7.7566 if pa<=0.00662959311157465\n",
      "  -10.3127 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   +4.9619 if \n",
      "   +1.1279 if pa<=0.02981069013476372 & pa<=0.03790879994630815 & pav<=0.3472855806350708\n",
      "Run episode 621 with rewards 75.0\n",
      "============ 622 ===========\n",
      "498 actions [0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0]\n",
      "   -4.1721 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -0.0000 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "   -0.0000 if cp<=0.04635245129466057 & cp>=-1.2734074354171754 & pa<=-0.032383657246828075 & pav>=0.6297808408737183\n",
      "   +0.9051 if cp<=0.0496792197227478 & cv>=0.0012940536485984934 & pav<=-0.04089766442775719 & pav>=-0.42539845705032336\n",
      "   -2.6151 if pav>=0.8499523997306824\n",
      "--------------\n",
      "   -8.0570 if pa<=0.006895773485302927 & pav<=0.5752061486244202\n",
      "   -6.4523 if pa<=0.00662959311157465\n",
      "   -9.5233 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   +5.1435 if \n",
      "   +1.1519 if cp>=-0.00408112602308392 & cv>=-0.056063193082809444 & pav>=0.3578081905841828\n",
      "Run episode 622 with rewards 498.0\n",
      "best\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 623 ===========\n",
      "62 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1]\n",
      "   -3.6474 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   +2.4762 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "   -0.0515 if cp<=0.0496792197227478 & cv>=0.0012940536485984934 & pav<=-0.04089766442775719 & pav>=-0.42539845705032336\n",
      "   -6.6018 if pav>=0.8499523997306824\n",
      "   +4.4029 if cp<=-0.770960783958435 & pa<=0.00657081371173263 & pav>=0.6109533190727234\n",
      "--------------\n",
      "  -10.6323 if pa<=0.006895773485302927 & pav<=0.5752061486244202\n",
      "   -9.1009 if pa<=0.00662959311157465\n",
      "  -12.7228 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   +7.2901 if \n",
      "   +1.9021 if cp<=-0.048161176592111506 & cp>=-0.770960783958435 & cv<=-0.6487268328666681 & pa<=0.00657081371173263 & pa>=-0.04226885214447975 & pav>=0.6109533190727234\n",
      "Run episode 623 with rewards 62.0\n",
      "============ 624 ===========\n",
      "44 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +2.9127 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   +0.0009 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "   -5.8551 if pav>=0.8499523997306824\n",
      "   +0.0015 if cp<=-0.770960783958435 & pa<=0.00657081371173263 & pav>=0.6109533190727234\n",
      "   +6.0000 if pa>=0.20383130013942719\n",
      "--------------\n",
      "   -1.8680 if pa<=0.006895773485302927 & pav<=0.5752061486244202\n",
      "  -10.3072 if pa<=0.00662959311157465\n",
      "  -11.7034 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   +4.2047 if \n",
      "  -11.0719 if pa>=0.20383130013942719\n",
      "Run episode 624 with rewards 44.0\n",
      "============ 625 ===========\n",
      "57 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   -0.7014 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -0.2981 if pav>=0.8499523997306824\n",
      "   +0.0000 if cp<=-0.770960783958435 & pa<=0.00657081371173263 & pav>=0.6109533190727234\n",
      "   +0.0000 if pa>=0.20383130013942719\n",
      "   -1.6824 if cp<=-0.013827382028102863 & pa<=0.06338748931884766 & pav<=0.5860528826713561\n",
      "--------------\n",
      "   -9.8290 if pa<=0.00662959311157465\n",
      "   -8.7075 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   +4.7434 if \n",
      "   +0.0000 if pa>=0.20383130013942719\n",
      "   -0.1976 if cp>=-0.03788607940077782 & cv<=-0.0033851120155304684\n",
      "Run episode 625 with rewards 57.0\n",
      "============ 626 ===========\n",
      "70 actions [1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   -0.4706 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -0.1439 if pav>=0.8499523997306824\n",
      "   +0.0000 if pa>=0.20383130013942719\n",
      "   +0.0000 if cp<=-0.013827382028102863 & pa<=0.06338748931884766 & pav<=0.5860528826713561\n",
      "   -5.6057 if cv>=0.024318878352642403 & pav>=0.3492515861988068\n",
      "--------------\n",
      "   -9.4687 if pa<=0.00662959311157465\n",
      "   -6.8230 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   +7.2553 if \n",
      "   -2.0086 if cp>=-0.03788607940077782 & cv<=-0.0033851120155304684\n",
      "   -4.3334 if cv>=0.024318878352642403 & pav<=0.3492515861988068\n",
      "Run episode 626 with rewards 70.0\n",
      "============ 627 ===========\n",
      "73 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +0.1497 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -0.2119 if pav>=0.8499523997306824\n",
      "   +0.5472 if cp<=-0.013827382028102863 & pa<=0.06338748931884766 & pav<=0.5860528826713561\n",
      "   +0.0000 if cv>=0.024318878352642403 & pav>=0.3492515861988068\n",
      "   -2.2066 if cv<=0.17740824520587922 & pa<=0.04423547908663751 & pav<=0.006225889548659363\n",
      "--------------\n",
      "   -8.0853 if pa<=0.00662959311157465\n",
      "   -6.7697 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   +7.9059 if \n",
      "   -4.0492 if cv>=0.024318878352642403 & pav<=0.3492515861988068\n",
      "   -3.4586 if cv<=-0.010098529793322084\n",
      "Run episode 627 with rewards 73.0\n",
      "============ 628 ===========\n",
      "72 actions [0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -1.1039 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   +1.3843 if pav>=0.8499523997306824\n",
      "   +1.4891 if cp<=-0.013827382028102863 & pa<=0.06338748931884766 & pav<=0.5860528826713561\n",
      "   +0.3590 if cv<=0.17740824520587922 & pa<=0.04423547908663751 & pav<=0.006225889548659363\n",
      "   -3.5545 if pa<=-0.13668815791606903 & pav>=0.30789158344268797\n",
      "--------------\n",
      "   -8.9072 if pa<=0.00662959311157465\n",
      "   -7.5207 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   +9.1329 if \n",
      "   -5.6246 if cv>=0.024318878352642403 & pav<=0.3492515861988068\n",
      "   -4.4991 if cp<=0.2478560864925385 & cv<=0.015359239093959332 & cv<=0.6932383298873904 & pa<=0.0019516031257808238 & pa>=-0.13668815791606903\n",
      "Run episode 628 with rewards 72.0\n",
      "============ 629 ===========\n",
      "52 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   +0.8046 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   +0.7774 if pav>=0.8499523997306824\n",
      "   +0.2033 if cp<=-0.013827382028102863 & pa<=0.06338748931884766 & pav<=0.5860528826713561\n",
      "   -0.0000 if pa<=-0.13668815791606903 & pav>=0.30789158344268797\n",
      "   +4.0173 if cp<=-0.07877655029296875 & pa>=0.13056663274765018\n",
      "--------------\n",
      "  -10.5079 if pa<=0.00662959311157465\n",
      "   -9.0595 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   +6.1278 if \n",
      "   -1.0048 if cv>=0.024318878352642403 & pav<=0.3492515861988068\n",
      "   +4.9642 if cp>=-0.07877655029296875 & cv>=-0.04437122568488121 & pav>=0.4342654585838321\n",
      "Run episode 629 with rewards 52.0\n",
      "============ 630 ===========\n",
      "37 actions [1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.2191 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -0.2302 if pav>=0.8499523997306824\n",
      "   +0.9165 if cp<=-0.013827382028102863 & pa<=0.06338748931884766 & pav<=0.5860528826713561\n",
      "   -0.0000 if cp<=-0.07877655029296875 & pa>=0.13056663274765018\n",
      "   +2.1953 if cp<=-0.07024876624345779 & cv>=-0.014933994039893145 & pav<=0.4189684629440309\n",
      "--------------\n",
      "   -7.5287 if pa<=0.00662959311157465\n",
      "   -8.6094 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   +4.4496 if \n",
      "   +5.8397 if cp>=-0.07877655029296875 & cv>=-0.04437122568488121 & pav>=0.4342654585838321\n",
      "   +1.4321 if pav>=1.124075174331665\n",
      "Run episode 630 with rewards 37.0\n",
      "============ 631 ===========\n",
      "39 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.0777 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -0.0600 if pav>=0.8499523997306824\n",
      "   -0.2688 if cp<=-0.013827382028102863 & pa<=0.06338748931884766 & pav<=0.5860528826713561\n",
      "   +0.9164 if cp<=-0.07024876624345779 & cv>=-0.014933994039893145 & pav<=0.4189684629440309\n",
      "   +2.5698 if pa<=0.00648821070790291\n",
      "--------------\n",
      "   -7.8620 if pa<=0.00662959311157465\n",
      "   -5.9251 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   +4.0045 if \n",
      "   +0.0000 if cp>=-0.07877655029296875 & cv>=-0.04437122568488121 & pav>=0.4342654585838321\n",
      "   +1.2791 if cv<=-0.06471060365438461 & pa>=0.00648821070790291\n",
      "Run episode 631 with rewards 39.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 632 ===========\n",
      "53 actions [1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -0.0181 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -1.0931 if cp<=-0.013827382028102863 & pa<=0.06338748931884766 & pav<=0.5860528826713561\n",
      "   -0.1655 if cp<=-0.07024876624345779 & cv>=-0.014933994039893145 & pav<=0.4189684629440309\n",
      "   +1.8958 if pa<=0.00648821070790291\n",
      "   +2.5918 if cp<=-0.047867994755506516 & cv>=0.14265448749065468 & pav<=0.13959051966667177\n",
      "--------------\n",
      "   -5.5805 if pa<=0.00662959311157465\n",
      "   -6.8637 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   +3.5089 if \n",
      "   +0.9380 if cv<=-0.06471060365438461 & pa>=0.00648821070790291\n",
      "   +1.3042 if cp<=-0.007756106927990896 & cv<=0.00026519537786953457\n",
      "Run episode 632 with rewards 53.0\n",
      "============ 633 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1]\n",
      "   -0.2059 if cp<=-0.013827382028102863 & pa<=0.06338748931884766 & pav<=0.5860528826713561\n",
      "   -0.0000 if cp<=-0.07024876624345779 & cv>=-0.014933994039893145 & pav<=0.4189684629440309\n",
      "   -0.1223 if pa<=0.00648821070790291\n",
      "   +2.3637 if cp<=-0.047867994755506516 & cv>=0.14265448749065468 & pav<=0.13959051966667177\n",
      "   +3.0916 if cp<=-0.028577221930027003 & cp>=-0.041630998998880384 & pav>=0.5395895242691041\n",
      "--------------\n",
      "   -4.0324 if pa<=0.00662959311157465\n",
      "   -4.8760 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   -0.5867 if \n",
      "   +4.8098 if cp<=-0.007756106927990896 & cv<=0.00026519537786953457\n",
      "   +1.1642 if cp>=-0.017168862372636793 & cv<=0.14485360980033876 & cv>=-0.039283321052789685 & pa<=0.035199709981679914\n",
      "Run episode 633 with rewards 12.0\n",
      "============ 634 ===========\n",
      "23 actions [0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cp<=-0.013827382028102863 & pa<=0.06338748931884766 & pav<=0.5860528826713561\n",
      "   +0.5921 if pa<=0.00648821070790291\n",
      "   -0.0000 if cp<=-0.047867994755506516 & cv>=0.14265448749065468 & pav<=0.13959051966667177\n",
      "   +0.1109 if cp<=-0.028577221930027003 & cp>=-0.041630998998880384 & pav>=0.5395895242691041\n",
      "   +0.8565 if cp>=-0.0034538058098405374 & cv<=-0.7321171641349792\n",
      "--------------\n",
      "  -10.3426 if pa<=0.00662959311157465\n",
      "   -7.6957 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "  -16.0270 if cp<=-0.007756106927990896 & cv<=0.00026519537786953457\n",
      "   -1.7142 if cp>=-0.017168862372636793 & cv<=0.14485360980033876 & cv>=-0.039283321052789685 & pa<=0.035199709981679914\n",
      "   +0.0597 if cp<=-0.04760992750525474\n",
      "Run episode 634 with rewards 23.0\n",
      "============ 635 ===========\n",
      "15 actions [1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7528 if pa<=0.00648821070790291\n",
      "   -0.0000 if cp<=-0.047867994755506516 & cv>=0.14265448749065468 & pav<=0.13959051966667177\n",
      "   -0.1410 if cp<=-0.028577221930027003 & cp>=-0.041630998998880384 & pav>=0.5395895242691041\n",
      "  -23.4975 if cp>=-0.0034538058098405374 & cv<=-0.7321171641349792\n",
      "   -2.2024 if cv<=-0.005211336724460123 & cv<=-0.010101334936916825 & pa<=0.04053586199879646 & pa<=0.04822327196598054\n",
      "--------------\n",
      "   +8.1122 if pa<=0.00662959311157465\n",
      "   -3.4886 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "  +17.8730 if cp<=-0.007756106927990896 & cv<=0.00026519537786953457\n",
      "   -5.2234 if cp>=-0.017168862372636793 & cv<=0.14485360980033876 & cv>=-0.039283321052789685 & pa<=0.035199709981679914\n",
      "   +2.8609 if cv<=-0.010101334936916825 & pa<=0.04053586199879646\n",
      "Run episode 635 with rewards 15.0\n",
      "============ 636 ===========\n",
      "11 actions [0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0263 if pa<=0.00648821070790291\n",
      "   -0.0000 if cp<=-0.028577221930027003 & cp>=-0.041630998998880384 & pav>=0.5395895242691041\n",
      "   -0.0000 if cp>=-0.0034538058098405374 & cv<=-0.7321171641349792\n",
      "   -3.7017 if cv<=-0.005211336724460123 & cv<=-0.010101334936916825 & pa<=0.04053586199879646 & pa<=0.04822327196598054\n",
      "   +2.5452 if cp<=-0.004786870721727609 & cv<=0.16690974831581115 & cv>=0.1271973758935929\n",
      "--------------\n",
      "  -31.0135 if pa<=0.00662959311157465\n",
      "   +2.8300 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   -4.6398 if cp<=-0.007756106927990896 & cv<=0.00026519537786953457\n",
      "   -0.1307 if cp>=-0.017168862372636793 & cv<=0.14485360980033876 & cv>=-0.039283321052789685 & pa<=0.035199709981679914\n",
      "   +1.0000 if cp>=0.03654637560248377\n",
      "Run episode 636 with rewards 11.0\n",
      "============ 637 ===========\n",
      "41 actions [1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +0.0000 if pa<=0.00648821070790291\n",
      "   +0.0000 if cp>=-0.0034538058098405374 & cv<=-0.7321171641349792\n",
      "   -2.0496 if cv<=-0.005211336724460123 & cv<=-0.010101334936916825 & pa<=0.04053586199879646 & pa<=0.04822327196598054\n",
      "   +0.0000 if cp<=-0.004786870721727609 & cv<=0.16690974831581115 & cv>=0.1271973758935929\n",
      "   -2.0496 if cv>=-0.6111044883728025\n",
      "--------------\n",
      "   -2.6734 if pa<=0.00662959311157465\n",
      "   +1.5618 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "  +19.4684 if cp<=-0.007756106927990896 & cv<=0.00026519537786953457\n",
      "   +0.5519 if cp>=0.03654637560248377\n",
      "   +1.0000 if cp<=-0.12429545074701309\n",
      "Run episode 637 with rewards 41.0\n",
      "============ 638 ===========\n",
      "69 actions [0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0]\n",
      "   +2.7422 if pa<=0.00648821070790291\n",
      "   -8.4353 if cv<=-0.005211336724460123 & cv<=-0.010101334936916825 & pa<=0.04053586199879646 & pa<=0.04822327196598054\n",
      "   +0.0000 if cp<=-0.004786870721727609 & cv<=0.16690974831581115 & cv>=0.1271973758935929\n",
      "   +2.4216 if cv>=-0.6111044883728025\n",
      "   -4.9146 if pa>=0.016030343249440193\n",
      "--------------\n",
      "   -3.3153 if pa<=0.00662959311157465\n",
      "   +0.0000 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   +0.0000 if cp<=-0.007756106927990896 & cv<=0.00026519537786953457\n",
      "   +0.0000 if cp<=-0.12429545074701309\n",
      "   -4.3761 if cp>=0.031040426343679428 & cv>=-0.045058395713567734 & pa>=-0.011637414805591101 & pav>=-0.039536844938993385\n",
      "Run episode 638 with rewards 69.0\n",
      "============ 639 ===========\n",
      "100 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0]\n",
      "   +0.3991 if pa<=0.00648821070790291\n",
      "   -4.5976 if cv<=-0.005211336724460123 & cv<=-0.010101334936916825 & pa<=0.04053586199879646 & pa<=0.04822327196598054\n",
      "   +1.6978 if cv>=-0.6111044883728025\n",
      "   -6.6055 if pa>=0.016030343249440193\n",
      "   -2.1109 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "--------------\n",
      "   -5.6812 if pa<=0.00662959311157465\n",
      "   +1.7825 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   -0.0885 if cp<=-0.007756106927990896 & cv<=0.00026519537786953457\n",
      "   +0.0000 if cp>=0.031040426343679428 & cv>=-0.045058395713567734 & pa>=-0.011637414805591101 & pav>=-0.039536844938993385\n",
      "   +2.1617 if pa<=-0.03234592527151106\n",
      "Run episode 639 with rewards 100.0\n",
      "============ 640 ===========\n",
      "101 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0]\n",
      "   -3.9724 if cv<=-0.005211336724460123 & cv<=-0.010101334936916825 & pa<=0.04053586199879646 & pa<=0.04822327196598054\n",
      "   +2.1936 if cv>=-0.6111044883728025\n",
      "   -9.9181 if pa>=0.016030343249440193\n",
      "   -8.2228 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "   +2.1384 if cv>=-0.7453900218009949\n",
      "--------------\n",
      "   -7.9478 if pa<=0.00662959311157465\n",
      "   +0.6803 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   -1.5585 if cp<=-0.007756106927990896 & cv<=0.00026519537786953457\n",
      "   +4.0719 if pa<=-0.03234592527151106\n",
      "   +1.7573 if cv<=-0.7453900218009949 & pa<=-0.008999437838792793\n",
      "Run episode 640 with rewards 101.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 641 ===========\n",
      "119 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0]\n",
      "   -3.1835 if cv<=-0.005211336724460123 & cv<=-0.010101334936916825 & pa<=0.04053586199879646 & pa<=0.04822327196598054\n",
      "   +3.6852 if cv>=-0.6111044883728025\n",
      "  -10.0028 if pa>=0.016030343249440193\n",
      "   -5.4794 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "   -5.0677 if cp<=-0.00864351913332938 & cp>=-0.32613515853881836 & pa<=-0.09256293624639506 & pa<=0.014065826311707497 & pav>=0.07876881957054159\n",
      "--------------\n",
      "   -6.2420 if pa<=0.00662959311157465\n",
      "   -1.9974 if cp<=-0.007756106927990896 & cv<=0.00026519537786953457\n",
      "   -0.4523 if pa<=-0.03234592527151106\n",
      "   +4.0591 if cv<=-0.7453900218009949 & pa<=-0.008999437838792793\n",
      "   +5.2069 if cp<=-0.00864351913332938 & cp>=-0.32613515853881836 & pa<=-0.09256293624639506 & pa<=0.014065826311707497 & pav>=0.07876881957054159\n",
      "Run episode 641 with rewards 119.0\n",
      "origin 448.40072932656057 new 539.5819342681862 not updated\n",
      "============ 642 ===========\n",
      "97 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -3.1835 if cv<=-0.005211336724460123 & cv<=-0.010101334936916825 & pa<=0.04053586199879646 & pa<=0.04822327196598054\n",
      "   +3.6852 if cv>=-0.6111044883728025\n",
      "  -10.0028 if pa>=0.016030343249440193\n",
      "   -5.4794 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "   -5.0677 if cp<=-0.00864351913332938 & cp>=-0.32613515853881836 & pa<=-0.09256293624639506 & pa<=0.014065826311707497 & pav>=0.07876881957054159\n",
      "--------------\n",
      "   -7.8816 if pa<=0.00662959311157465\n",
      "   -1.8309 if cp<=-0.007756106927990896 & cv<=0.00026519537786953457\n",
      "   +5.1960 if cv<=-0.7453900218009949 & pa<=-0.008999437838792793\n",
      "   +5.2165 if cp<=-0.00864351913332938 & cp>=-0.32613515853881836 & pa<=-0.09256293624639506 & pa<=0.014065826311707497 & pav>=0.07876881957054159\n",
      "   +4.6691 if cv<=-0.9175455212593079 & pa<=-0.09731827974319457\n",
      "Run episode 642 with rewards 97.0\n",
      "============ 643 ===========\n",
      "31 actions [1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0]\n",
      "   +2.2165 if cv>=-0.6111044883728025\n",
      "   -5.5237 if pa>=0.016030343249440193\n",
      "   -5.0601 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "   +1.3816 if cp<=-0.00864351913332938 & cp>=-0.32613515853881836 & pa<=-0.09256293624639506 & pa<=0.014065826311707497 & pav>=0.07876881957054159\n",
      "   -4.2372 if \n",
      "--------------\n",
      "   -5.8074 if pa<=0.00662959311157465\n",
      "   +2.3905 if cv<=-0.7453900218009949 & pa<=-0.008999437838792793\n",
      "   -2.1569 if cp<=-0.00864351913332938 & cp>=-0.32613515853881836 & pa<=-0.09256293624639506 & pa<=0.014065826311707497 & pav>=0.07876881957054159\n",
      "   +0.0000 if cv<=-0.9175455212593079 & pa<=-0.09731827974319457\n",
      "   +4.7467 if cp>=0.03660010471940044 & cv<=-0.6026479601860046\n",
      "Run episode 643 with rewards 31.0\n",
      "============ 644 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.2593 if cv>=-0.6111044883728025\n",
      "   -0.6728 if pa>=0.016030343249440193\n",
      "  +11.5466 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "   -3.7872 if \n",
      "   +5.4400 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "--------------\n",
      "   -5.2309 if pa<=0.00662959311157465\n",
      "   -0.0000 if cv<=-0.7453900218009949 & pa<=-0.008999437838792793\n",
      "   -0.0000 if cp<=-0.00864351913332938 & cp>=-0.32613515853881836 & pa<=-0.09256293624639506 & pa<=0.014065826311707497 & pav>=0.07876881957054159\n",
      "   -0.0000 if cp>=0.03660010471940044 & cv<=-0.6026479601860046\n",
      "   +8.6906 if cp>=0.017428113147616473\n",
      "Run episode 644 with rewards 11.0\n",
      "============ 645 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +11.9564 if cv>=-0.6111044883728025\n",
      "   +9.9783 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +12.4126 if \n",
      "   +4.7012 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   +1.0000 if cp<=0.07633116841316226\n",
      "--------------\n",
      "   -0.1857 if pa<=0.00662959311157465\n",
      "   -0.0000 if cv<=-0.7453900218009949 & pa<=-0.008999437838792793\n",
      "   -0.0000 if cp>=0.03660010471940044 & cv<=-0.6026479601860046\n",
      "   -0.1787 if cp>=0.017428113147616473\n",
      "   -0.1369 if cp>=0.12854450941085815\n",
      "Run episode 645 with rewards 9.0\n",
      "============ 646 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -10.5992 if cv>=-0.6111044883728025\n",
      "  -10.3124 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -17.2882 if \n",
      "   -4.8585 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   +0.2170 if cp<=-0.06338228285312653\n",
      "--------------\n",
      "   -0.0000 if pa<=0.00662959311157465\n",
      "   +0.0000 if cp>=0.03660010471940044 & cv<=-0.6026479601860046\n",
      "   +0.0000 if cp>=0.017428113147616473\n",
      "   +0.0000 if cp>=0.12854450941085815\n",
      "   +0.0001 if cp<=-0.030480357259511946\n",
      "Run episode 646 with rewards 8.0\n",
      "============ 647 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +10.5992 if cv>=-0.6111044883728025\n",
      "  +10.3124 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +17.2882 if \n",
      "   +4.8585 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   +1.0000 if cp<=0.07192226946353913\n",
      "--------------\n",
      "   -0.0000 if pa<=0.00662959311157465\n",
      "   -0.0000 if cp>=0.017428113147616473\n",
      "   -0.0000 if cp>=0.12854450941085815\n",
      "   -0.0000 if cp<=-0.030480357259511946\n",
      "   +0.0000 if cp<=0.07192226946353913\n",
      "Run episode 647 with rewards 9.0\n",
      "origin 1.8725445716274803e-05 new 1.872544582558412e-05 not updated\n",
      "============ 648 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -10.5838 if cv>=-0.6111044883728025\n",
      "  -15.6475 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -40.2829 if \n",
      "   -7.3721 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   +1.0000 if cp<=-0.03970168754458427\n",
      "--------------\n",
      "   -0.0000 if pa<=0.00662959311157465\n",
      "   -0.0000 if cp>=0.017428113147616473\n",
      "   -0.0000 if cp>=0.12854450941085815\n",
      "   -0.0000 if cp<=-0.030480357259511946\n",
      "   +0.0000 if cp<=0.07192226946353913\n",
      "Run episode 648 with rewards 9.0\n",
      "============ 649 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +10.5838 if cv>=-0.6111044883728025\n",
      "  +15.6475 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +40.2829 if \n",
      "   +7.3721 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   +1.0000 if cp<=0.077937950193882\n",
      "--------------\n",
      "   +0.0000 if pa<=0.00662959311157465\n",
      "   +0.0000 if cp>=0.017428113147616473\n",
      "   +0.0000 if cp>=0.12854450941085815\n",
      "   +0.0000 if cp<=-0.030480357259511946\n",
      "   +0.0000 if \n",
      "Run episode 649 with rewards 9.0\n",
      "============ 650 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.5478 if cv>=-0.6111044883728025\n",
      "   -3.2878 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -15.9577 if \n",
      "   -1.5490 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   +0.1982 if cp<=-0.0512218214571476\n",
      "--------------\n",
      "   -0.0000 if pa<=0.00662959311157465\n",
      "   -0.0000 if cp>=0.017428113147616473\n",
      "   +0.0000 if cp<=-0.030480357259511946\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.005637743696570405\n",
      "Run episode 650 with rewards 8.0\n",
      "============ 651 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.5478 if cv>=-0.6111044883728025\n",
      "   +3.2878 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +15.9577 if \n",
      "   +1.5490 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   +1.0000 if cp<=-0.007844104617834073\n",
      "--------------\n",
      "   -0.0000 if pa<=0.00662959311157465\n",
      "   -0.0000 if cp>=0.017428113147616473\n",
      "   +0.0000 if cp<=-0.030480357259511946\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=-0.007844104617834073 & cp>=-0.025504299253225324\n",
      "Run episode 651 with rewards 8.0\n",
      "============ 652 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.0539 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -15.4905 if \n",
      "   -1.4388 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   -1.7710 if cp<=-0.007844104617834073\n",
      "   +0.5101 if cp<=-0.04908317402005195\n",
      "--------------\n",
      "   +0.0000 if pa<=0.00662959311157465\n",
      "   +0.0000 if cp>=0.017428113147616473\n",
      "   +0.0000 if cp<=-0.030480357259511946\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.010372513812035314\n",
      "Run episode 652 with rewards 9.0\n",
      "============ 653 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.0539 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +15.4905 if \n",
      "   +1.4388 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   +1.7710 if cp<=-0.007844104617834073\n",
      "   +1.0000 if cp>=-0.03412737846374511\n",
      "--------------\n",
      "   -0.0000 if pa<=0.00662959311157465\n",
      "   +0.0000 if cp<=-0.030480357259511946\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.010372513812035314\n",
      "   +0.0000 if cp<=-0.011436926387250412 & cp>=-0.03412737846374511\n",
      "Run episode 653 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 654 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.0303 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -15.3763 if \n",
      "   -1.4275 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   -1.7627 if cp<=-0.007844104617834073\n",
      "   +1.0000 if cp>=-0.09004759639501572\n",
      "--------------\n",
      "   -0.0000 if pa<=0.00662959311157465\n",
      "   +0.0000 if cp<=-0.030480357259511946\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp>=-0.010372513812035314\n",
      "   +0.0000 if cp>=-0.024810425564646715\n",
      "Run episode 654 with rewards 8.0\n",
      "============ 655 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.0267 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +15.3967 if \n",
      "   +1.4270 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   +1.7622 if cp<=-0.007844104617834073\n",
      "   +1.0000 if cp>=0.07773212790489198\n",
      "--------------\n",
      "   -0.0001 if pa<=0.00662959311157465\n",
      "   +0.0000 if cp<=-0.030480357259511946\n",
      "   -0.0001 if \n",
      "   -0.0001 if cp>=-0.010372513812035314\n",
      "   +0.0000 if cp<=0.060616294294595724\n",
      "Run episode 655 with rewards 10.0\n",
      "============ 656 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.9375 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -15.4822 if \n",
      "   -1.0991 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   -2.4495 if cp<=-0.007844104617834073\n",
      "   +0.5303 if cp<=-0.08981096893548965\n",
      "--------------\n",
      "   -0.0000 if pa<=0.00662959311157465\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp>=-0.010372513812035314\n",
      "   +0.0000 if cp<=0.060616294294595724\n",
      "   +0.0000 if cp>=-0.08981096893548965\n",
      "Run episode 656 with rewards 8.0\n",
      "============ 657 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.9375 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +15.4822 if \n",
      "   +1.0991 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   +2.4495 if cp<=-0.007844104617834073\n",
      "   +1.0000 if cp>=0.057862651348114025\n",
      "--------------\n",
      "   -0.0000 if pa<=0.00662959311157465\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.010372513812035314\n",
      "   -0.0000 if cp<=0.060616294294595724\n",
      "   +0.0000 if cp<=0.018835944123566154\n",
      "Run episode 657 with rewards 9.0\n",
      "============ 658 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.8075 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -14.7957 if \n",
      "   -1.0505 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   -2.3442 if cp<=-0.007844104617834073\n",
      "   +1.0000 if cp<=-0.07117798775434495\n",
      "--------------\n",
      "   +0.0000 if pa<=0.00662959311157465\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.010372513812035314\n",
      "   -0.0000 if cp<=0.060616294294595724\n",
      "   +0.0000 if cp>=-0.07117798775434495\n",
      "Run episode 658 with rewards 8.0\n",
      "============ 659 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.7891 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +15.2345 if \n",
      "   +1.0900 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   +2.3288 if cp<=-0.007844104617834073\n",
      "   +1.0000 if cp>=0.004144913423806431\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.010372513812035314\n",
      "   -0.0000 if cp<=0.060616294294595724\n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   +0.0000 if cp<=0.004144913423806431\n",
      "Run episode 659 with rewards 10.0\n",
      "============ 660 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.6917 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -14.8115 if \n",
      "   -0.9899 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   -2.4185 if cp<=-0.007844104617834073\n",
      "   +0.9262 if cp<=-0.003484937734901901 & cp>=-0.07113339155912399\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp>=-0.010372513812035314\n",
      "   +0.0000 if cp<=0.060616294294595724\n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   +0.0000 if cp>=-0.07113339155912399\n",
      "Run episode 660 with rewards 9.0\n",
      "============ 661 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.6549 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +15.8102 if \n",
      "   +0.9764 if cp<=0.017428113147616473 & pa<=0.006336313672363768\n",
      "   +2.3854 if cp<=-0.007844104617834073\n",
      "   +1.0000 if cp>=0.08377283215522767\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.010372513812035314\n",
      "   +0.0000 if cp<=0.060616294294595724\n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   +0.0000 if cp<=0.08377283215522767\n",
      "Run episode 661 with rewards 10.0\n",
      "============ 662 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.5795 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -15.3630 if \n",
      "   -2.3196 if cp<=-0.007844104617834073\n",
      "   -0.9716 if cp>=0.08377283215522767\n",
      "   +1.0000 if cp>=-0.06365211308002472\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.010372513812035314\n",
      "   +0.0000 if cp<=0.060616294294595724\n",
      "   +0.0000 if cp>=-0.07117798775434495\n",
      "   +0.0000 if cp<=-0.017022042348980904 & cp>=-0.10573242902755738\n",
      "Run episode 662 with rewards 10.0\n",
      "============ 663 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.5751 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +15.4894 if \n",
      "   +2.2690 if cp<=-0.007844104617834073\n",
      "   +1.1508 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.04367383867502213\n",
      "--------------\n",
      "   -0.0001 if \n",
      "   -0.0000 if cp<=0.060616294294595724\n",
      "   -0.0001 if cp>=-0.07117798775434495\n",
      "   +0.0000 if cp<=-0.017022042348980904 & cp>=-0.10573242902755738\n",
      "   -0.0001 if cp>=-0.03637436702847481\n",
      "Run episode 663 with rewards 11.0\n",
      "============ 664 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.5369 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -15.2640 if \n",
      "   -2.2393 if cp<=-0.007844104617834073\n",
      "   -1.1332 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=-0.01465491484850645 & cp>=-0.11687687039375305\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.060616294294595724\n",
      "   +0.0000 if cp>=-0.07117798775434495\n",
      "   -0.0000 if cp>=-0.03637436702847481\n",
      "   +0.0000 if cp>=-0.06720294058322906\n",
      "Run episode 664 with rewards 10.0\n",
      "============ 665 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.5326 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +15.3892 if \n",
      "   +2.1819 if cp<=-0.007844104617834073\n",
      "   +1.2825 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.07009950876235962\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.060616294294595724\n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   -0.0000 if cp>=-0.03637436702847481\n",
      "   +0.0000 if cp<=0.07009950876235962\n",
      "Run episode 665 with rewards 10.0\n",
      "============ 666 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.4534 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -14.9092 if \n",
      "   -2.1179 if cp<=-0.007844104617834073\n",
      "   -1.2398 if cp>=-0.06365211308002472\n",
      "   +1.0000 if pa>=0.20588329434394836\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.060616294294595724\n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   -0.0000 if cp>=-0.03637436702847481\n",
      "   +0.0000 if cp>=-0.04272129759192467\n",
      "Run episode 666 with rewards 9.0\n",
      "============ 667 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.4515 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +14.9661 if \n",
      "   +2.1162 if cp<=-0.007844104617834073\n",
      "   +1.3074 if cp>=-0.06365211308002472\n",
      "   +0.9955 if cp<=0.0739745154976845\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.060616294294595724\n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   -0.0000 if cp>=-0.03637436702847481\n",
      "   +0.0000 if cp>=0.10640954971313478\n",
      "Run episode 667 with rewards 10.0\n",
      "============ 668 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -6.6156 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -40.3956 if \n",
      "   -5.7254 if cp<=-0.007844104617834073\n",
      "   -3.5216 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=-0.10015702098608018\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.060616294294595724\n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   -0.0000 if cp>=-0.03637436702847481\n",
      "   +0.0000 if cp>=-0.05778614431619644\n",
      "Run episode 668 with rewards 10.0\n",
      "============ 669 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +6.6156 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +40.3956 if \n",
      "   +5.7254 if cp<=-0.007844104617834073\n",
      "   +3.5216 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.05615329146385194\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.060616294294595724\n",
      "   +0.0000 if cp>=-0.07117798775434495\n",
      "   +0.0000 if cp>=-0.03637436702847481\n",
      "   +0.0000 if \n",
      "Run episode 669 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 670 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.3130 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -14.3505 if \n",
      "   -2.3528 if cp<=-0.007844104617834073\n",
      "   -1.1905 if cp>=-0.06365211308002472\n",
      "   +0.8863 if pa>=0.17266440391540527\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   -0.0000 if cp>=-0.03637436702847481\n",
      "   -0.0000 if cp>=0.00035197040560888167\n",
      "   +0.0000 if cp<=-0.013600229844450947\n",
      "Run episode 670 with rewards 10.0\n",
      "============ 671 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.2936 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +14.9775 if \n",
      "   +2.1029 if cp<=-0.007844104617834073\n",
      "   +1.9281 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.04592779576778412\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   -0.0000 if cp>=-0.03637436702847481\n",
      "   -0.0000 if cp>=0.00035197040560888167\n",
      "   +0.0000 if pa>=0.040123894810676575\n",
      "Run episode 671 with rewards 9.0\n",
      "============ 672 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.1944 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -14.7009 if \n",
      "   -2.4211 if cp<=-0.007844104617834073\n",
      "   -2.0435 if cp>=-0.06365211308002472\n",
      "   +0.4883 if cp<=0.02864958308637143\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   -0.0000 if cp>=-0.03637436702847481\n",
      "   -0.0000 if cp>=0.00035197040560888167\n",
      "   +0.0000 if cp>=0.006715804990381005\n",
      "Run episode 672 with rewards 8.0\n",
      "============ 673 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.1944 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +14.7009 if \n",
      "   +2.4211 if cp<=-0.007844104617834073\n",
      "   +2.0435 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.031554428488016144\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   -0.0000 if cp>=-0.03637436702847481\n",
      "   -0.0000 if cp>=0.00035197040560888167\n",
      "   +0.0000 if cp<=0.008528157696127891\n",
      "Run episode 673 with rewards 8.0\n",
      "============ 674 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.1266 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -14.4443 if \n",
      "   -2.5437 if cp<=-0.007844104617834073\n",
      "   -1.9744 if cp>=-0.06365211308002472\n",
      "   +0.8458 if cp<=-0.07977243810892105\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07117798775434495\n",
      "   -0.0000 if cp>=-0.03637436702847481\n",
      "   -0.0000 if cp>=0.00035197040560888167\n",
      "   +0.0000 if cp<=-0.056435027718544\n",
      "Run episode 674 with rewards 10.0\n",
      "============ 675 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.1231 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +14.5721 if \n",
      "   +2.4884 if cp<=-0.007844104617834073\n",
      "   +2.1225 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.070343217253685 & cp>=-0.0016671827528625715\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   -0.0000 if cp>=-0.03637436702847481\n",
      "   -0.0000 if cp<=-0.056435027718544\n",
      "   +0.0000 if cp<=-0.0016671827528625715\n",
      "Run episode 675 with rewards 9.0\n",
      "============ 676 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -5.6776 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -38.9747 if \n",
      "   -6.6647 if cp<=-0.007844104617834073\n",
      "   -5.6735 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.017612652108073237 & cp>=-0.049527280032634735\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07117798775434495\n",
      "   -0.0000 if cp>=-0.03637436702847481\n",
      "   +0.0000 if cp<=-0.0016671827528625715\n",
      "   +0.0000 if cp<=-0.049527280032634735\n",
      "Run episode 676 with rewards 9.0\n",
      "============ 677 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +5.6776 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +38.9747 if \n",
      "   +6.6647 if cp<=-0.007844104617834073\n",
      "   +5.6735 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.062251289933919915\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07117798775434495\n",
      "   +0.0000 if cp>=-0.03637436702847481\n",
      "   +0.0000 if cp<=-0.0016671827528625715\n",
      "   +0.0000 if \n",
      "Run episode 677 with rewards 9.0\n",
      "============ 678 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.0665 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -14.2872 if \n",
      "   -2.5537 if cp<=-0.007844104617834073\n",
      "   -2.1206 if cp>=-0.06365211308002472\n",
      "   +0.8677 if cp<=0.013620760291814806\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   +0.0000 if cp<=-0.0016671827528625715\n",
      "   +0.0000 if cp<=0.013620760291814806 & cp>=-0.018025181442499157\n",
      "   +0.0000 if cv>=0.027066685259342194\n",
      "Run episode 678 with rewards 9.0\n",
      "============ 679 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.0618 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +14.3139 if \n",
      "   +2.5451 if cp<=-0.007844104617834073\n",
      "   +2.1517 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.05494043529033662\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   +0.0000 if cp<=-0.0016671827528625715\n",
      "   -0.0000 if cp<=0.013620760291814806 & cp>=-0.018025181442499157\n",
      "   +0.0000 if cp>=0.05494043529033662\n",
      "Run episode 679 with rewards 10.0\n",
      "============ 680 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -5.4679 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -37.9745 if \n",
      "   -6.7642 if cp<=-0.007844104617834073\n",
      "   -5.7041 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.01869256775826216 & cp>=-0.05016182661056518\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   +0.0000 if cp<=-0.0016671827528625715\n",
      "   +0.0000 if cp<=0.013620760291814806 & cp>=-0.018025181442499157\n",
      "   +0.0000 if cp>=0.03767474740743637\n",
      "Run episode 680 with rewards 10.0\n",
      "============ 681 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +5.4679 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +37.9745 if \n",
      "   +6.7642 if cp<=-0.007844104617834073\n",
      "   +5.7041 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.047544591873884205\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07117798775434495\n",
      "   +0.0000 if cp<=-0.0016671827528625715\n",
      "   +0.0000 if cp<=0.013620760291814806 & cp>=-0.018025181442499157\n",
      "   +0.0000 if \n",
      "Run episode 681 with rewards 9.0\n",
      "============ 682 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.9829 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.7711 if \n",
      "   -2.4530 if cp<=-0.007844104617834073\n",
      "   -2.0685 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.003971821116283537 & cp>=-0.06049487739801407\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   +0.0000 if cp<=-0.0016671827528625715\n",
      "   -0.0000 if cp<=0.003971821116283537 & cp>=-0.06049487739801407\n",
      "   +0.0000 if cp>=0.006269838660955429\n",
      "Run episode 682 with rewards 9.0\n",
      "============ 683 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.9778 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.9612 if \n",
      "   +2.4466 if cp<=-0.007844104617834073\n",
      "   +2.2890 if cp>=-0.06365211308002472\n",
      "   +0.9938 if cp<=0.07677439004182816\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.07117798775434495\n",
      "   -0.0000 if cp<=-0.0016671827528625715\n",
      "   -0.0000 if cp<=0.003971821116283537 & cp>=-0.06049487739801407\n",
      "   +0.0000 if cp<=0.07677439004182816\n",
      "Run episode 683 with rewards 10.0\n",
      "============ 684 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -5.1813 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -36.6110 if \n",
      "   -6.4424 if cp<=-0.007844104617834073\n",
      "   -5.9960 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.12954743206501007\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07117798775434495\n",
      "   +0.0000 if cp<=-0.0016671827528625715\n",
      "   +0.0000 if cp<=0.07677439004182816\n",
      "   +0.0000 if cp<=-0.12954743206501007\n",
      "Run episode 684 with rewards 9.0\n",
      "============ 685 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +5.1813 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +36.6110 if \n",
      "   +6.4424 if cp<=-0.007844104617834073\n",
      "   +5.9960 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.0822411745786667\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07117798775434495\n",
      "   +0.0000 if cp<=-0.0016671827528625715\n",
      "   +0.0000 if cp<=0.07677439004182816\n",
      "   +0.0000 if \n",
      "Run episode 685 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 686 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.8602 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.8487 if \n",
      "   -3.0174 if cp<=-0.007844104617834073\n",
      "   -1.9244 if cp>=-0.06365211308002472\n",
      "   +0.8206 if cp<=-0.06349826753139495 & cp>=-0.1188211441040039\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.0016671827528625715\n",
      "   +0.0000 if cp<=0.07677439004182816\n",
      "   -0.0000 if cp>=-0.06349826753139495\n",
      "   +0.0000 if cp>=-0.06349826753139495\n",
      "Run episode 686 with rewards 9.0\n",
      "============ 687 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.8565 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.9968 if \n",
      "   +3.0212 if cp<=-0.007844104617834073\n",
      "   +2.0967 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=0.01746193505823613\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=-0.0016671827528625715\n",
      "   -0.0000 if cp<=0.07677439004182816\n",
      "   -0.0000 if cp>=0.01746193505823613\n",
      "   +0.0000 if cp>=0.01746193505823613\n",
      "Run episode 687 with rewards 10.0\n",
      "============ 688 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -4.8811 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -36.8186 if \n",
      "   -7.9611 if cp<=-0.007844104617834073\n",
      "   -5.5114 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.06288471445441246\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.07677439004182816\n",
      "   -0.0000 if cp>=0.01746193505823613\n",
      "   -0.0000 if cp>=-0.06288471445441246\n",
      "   +0.0000 if cp<=-0.021910711005330086 & cp>=-0.10221149325370789\n",
      "Run episode 688 with rewards 10.0\n",
      "============ 689 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +4.8811 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +36.8186 if \n",
      "   +7.9611 if cp<=-0.007844104617834073\n",
      "   +5.5114 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.07054825276136399\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.07677439004182816\n",
      "   +0.0000 if cp>=-0.06288471445441246\n",
      "   +0.0000 if cp<=-0.021910711005330086 & cp>=-0.10221149325370789\n",
      "   +0.0000 if \n",
      "Run episode 689 with rewards 9.0\n",
      "============ 690 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.8110 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.6610 if \n",
      "   -2.9539 if cp<=-0.007844104617834073\n",
      "   -2.0449 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.010118599608540536 & cp>=-0.05296573340892791\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.07677439004182816\n",
      "   -0.0000 if cp>=-0.06288471445441246\n",
      "   +0.0000 if cp<=-0.021715353615581988\n",
      "   +0.0000 if cp<=-0.021715353615581988\n",
      "Run episode 690 with rewards 10.0\n",
      "============ 691 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.7961 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +14.2887 if \n",
      "   +2.6674 if cp<=-0.007844104617834073\n",
      "   +2.7686 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.06133758276700974 & cp>=-0.008895294927060603\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.06288471445441246\n",
      "   +0.0000 if cp<=-0.021715353615581988\n",
      "   -0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp>=0.06133758276700974\n",
      "Run episode 691 with rewards 10.0\n",
      "============ 692 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -4.7744 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -37.9996 if \n",
      "   -7.1076 if cp<=-0.007844104617834073\n",
      "   -7.3587 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.06970473974943162\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp>=-0.06288471445441246\n",
      "   +0.0000 if cp<=-0.021715353615581988\n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp<=-0.06970473974943162 & cp>=-0.10933515727519989\n",
      "Run episode 692 with rewards 8.0\n",
      "============ 693 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +4.7744 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +37.9996 if \n",
      "   +7.1076 if cp<=-0.007844104617834073\n",
      "   +7.3587 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.03849200010299684\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.06288471445441246\n",
      "   +0.0000 if cp<=-0.021715353615581988\n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if \n",
      "Run episode 693 with rewards 9.0\n",
      "============ 694 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.7309 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.7762 if \n",
      "   -2.5767 if cp<=-0.007844104617834073\n",
      "   -2.6678 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.0019528655684553098 & cp>=-0.06129813492298126\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.021715353615581988\n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp<=0.0019528655684553098\n",
      "   +0.0000 if cp<=-0.06129813492298126\n",
      "Run episode 694 with rewards 8.0\n",
      "============ 695 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.7309 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.7762 if \n",
      "   +2.5767 if cp<=-0.007844104617834073\n",
      "   +2.6678 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.07340844571590424\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=-0.021715353615581988\n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp<=0.0019528655684553098\n",
      "   +0.0000 if cp>=0.04829738736152651\n",
      "Run episode 695 with rewards 10.0\n",
      "============ 696 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -4.5146 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -35.9669 if \n",
      "   -6.7547 if cp<=-0.007844104617834073\n",
      "   -6.9569 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.13287438452243805\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.021715353615581988\n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp>=0.04829738736152651\n",
      "   +0.0000 if cp>=-0.06465886831283568\n",
      "Run episode 696 with rewards 10.0\n",
      "============ 697 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +4.5146 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +35.9669 if \n",
      "   +6.7547 if cp<=-0.007844104617834073\n",
      "   +6.9569 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.08703156262636186\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.021715353615581988\n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp>=-0.06465886831283568\n",
      "   +0.0000 if \n",
      "Run episode 697 with rewards 10.0\n",
      "============ 698 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.7027 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -14.0335 if \n",
      "   -3.2286 if cp<=-0.007844104617834073\n",
      "   -2.5649 if cp>=-0.06365211308002472\n",
      "   +0.3606 if cp<=0.015584276616573335\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.021715353615581988\n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp<=-0.07298066914081573\n",
      "   +0.0000 if cp>=-0.030949779227375983\n",
      "Run episode 698 with rewards 9.0\n",
      "============ 699 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.7027 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +14.0335 if \n",
      "   +3.2286 if cp<=-0.007844104617834073\n",
      "   +2.5649 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.036041123420000085\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=-0.021715353615581988\n",
      "   -0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp<=-0.07298066914081573\n",
      "   +0.0000 if cp>=0.003713018819689762\n",
      "Run episode 699 with rewards 8.0\n",
      "============ 700 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -4.4982 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -37.0770 if \n",
      "   -8.5354 if cp<=-0.007844104617834073\n",
      "   -6.7746 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.003240821138024332\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.021715353615581988\n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   -0.0000 if cp>=0.003713018819689762\n",
      "   +0.0000 if pa>=0.1683027744293213\n",
      "Run episode 700 with rewards 10.0\n",
      "============ 701 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +4.4982 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +37.0770 if \n",
      "   +8.5354 if cp<=-0.007844104617834073\n",
      "   +6.7746 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.05764594674110413\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.021715353615581988\n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp>=0.003713018819689762\n",
      "   +0.0000 if \n",
      "Run episode 701 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 702 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.5705 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.7187 if \n",
      "   -3.7538 if cp<=-0.007844104617834073\n",
      "   -2.0846 if cp>=-0.06365211308002472\n",
      "   +0.6087 if cp<=-0.06008024364709853 & cp>=-0.11093827933073044\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.021715353615581988\n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   -0.0000 if cp>=-0.06008024364709853\n",
      "   +0.0000 if cp>=-0.06008024364709853\n",
      "Run episode 702 with rewards 10.0\n",
      "============ 703 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.5655 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.9532 if \n",
      "   +3.7417 if cp<=-0.007844104617834073\n",
      "   +2.3564 if cp>=-0.06365211308002472\n",
      "   +0.9878 if cp<=0.09245821386575699\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=-0.021715353615581988\n",
      "   -0.0000 if cp<=0.019965627603232866\n",
      "   -0.0000 if cp>=0.09245821386575699\n",
      "   +0.0000 if cp<=0.06285466998815536\n",
      "Run episode 703 with rewards 10.0\n",
      "============ 704 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -4.1350 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -36.8557 if \n",
      "   -9.8914 if cp<=-0.007844104617834073\n",
      "   -6.2172 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.022068499028682714 & cp>=-0.045529690384864804\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   -0.0000 if cp>=0.09245821386575699\n",
      "   +0.0000 if cp<=0.06285466998815536\n",
      "   +0.0000 if cp<=0.03705778121948242\n",
      "Run episode 704 with rewards 10.0\n",
      "============ 705 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +4.1350 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +36.8557 if \n",
      "   +9.8914 if cp<=-0.007844104617834073\n",
      "   +6.2172 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.05173196345567704\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp<=0.06285466998815536\n",
      "   +0.0000 if cp<=0.03705778121948242\n",
      "   +0.0000 if \n",
      "Run episode 705 with rewards 9.0\n",
      "============ 706 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.4941 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.3172 if \n",
      "   -3.5741 if cp<=-0.007844104617834073\n",
      "   -2.2465 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.09436772614717484\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp<=0.06285466998815536\n",
      "   -0.0000 if cp>=-0.0428617313504219\n",
      "   +0.0000 if cp>=-0.0428617313504219\n",
      "Run episode 706 with rewards 10.0\n",
      "============ 707 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.4866 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.6905 if \n",
      "   +3.5561 if cp<=-0.007844104617834073\n",
      "   +2.6755 if cp>=-0.06365211308002472\n",
      "   +0.9774 if cp<=0.06802526563405992\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp<=0.06285466998815536\n",
      "   -0.0000 if cp>=0.11010435521602631\n",
      "   -0.0001 if cp>=0.03844120502471924\n",
      "Run episode 707 with rewards 9.0\n",
      "============ 708 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.8919 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -35.8466 if \n",
      "   -9.3207 if cp<=-0.007844104617834073\n",
      "   -6.9992 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=-0.038615706562995906 & cp>=-0.06984694600105286\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.019965627603232866\n",
      "   -0.0000 if cp>=0.11010435521602631\n",
      "   -0.0000 if cp>=0.03844120502471924\n",
      "   +0.0000 if cp>=-0.06984694600105286\n",
      "Run episode 708 with rewards 8.0\n",
      "============ 709 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.8919 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +35.8466 if \n",
      "   +9.3207 if cp<=-0.007844104617834073\n",
      "   +6.9992 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=0.006151513382792484\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp>=0.03844120502471924\n",
      "   +0.0000 if cp>=-0.06984694600105286\n",
      "   +0.0000 if \n",
      "Run episode 709 with rewards 10.0\n",
      "============ 710 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.3916 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.6562 if \n",
      "   -3.7623 if cp<=-0.007844104617834073\n",
      "   -2.6557 if cp>=-0.06365211308002472\n",
      "   +0.7053 if cp<=0.011814308352768425\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp>=-0.06984694600105286\n",
      "   +0.0000 if cp<=0.011814308352768425 & cp>=-0.015444579161703584\n",
      "   +0.0000 if cp>=0.02651888281106949\n",
      "Run episode 710 with rewards 8.0\n",
      "============ 711 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.3916 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.6562 if \n",
      "   +3.7623 if cp<=-0.007844104617834073\n",
      "   +2.6557 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=0.005969508737325685\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.019965627603232866\n",
      "   -0.0000 if cp>=-0.06984694600105286\n",
      "   -0.0000 if cp<=0.011814308352768425 & cp>=-0.015444579161703584\n",
      "   +0.0000 if cp>=-0.019380273297429085\n",
      "Run episode 711 with rewards 9.0\n",
      "origin 2.0087891166152783e-05 new 2.008789308208332e-05 not updated\n",
      "============ 712 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.6442 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -35.7669 if \n",
      "   -9.8644 if cp<=-0.007844104617834073\n",
      "   -6.9484 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=-0.0216476447880268\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.019965627603232866\n",
      "   -0.0000 if cp>=-0.06984694600105286\n",
      "   -0.0000 if cp<=0.011814308352768425 & cp>=-0.015444579161703584\n",
      "   +0.0000 if cp>=-0.019380273297429085\n",
      "Run episode 712 with rewards 10.0\n",
      "============ 713 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.6442 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +35.7669 if \n",
      "   +9.8644 if cp<=-0.007844104617834073\n",
      "   +6.9484 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.04779356569051743\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp>=-0.06984694600105286\n",
      "   +0.0000 if cp<=0.011814308352768425 & cp>=-0.015444579161703584\n",
      "   +0.0000 if \n",
      "Run episode 713 with rewards 10.0\n",
      "============ 714 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.3757 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.5024 if \n",
      "   -3.7239 if cp<=-0.007844104617834073\n",
      "   -2.6231 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.01750730276107788 & cp>=-0.06148935407400131\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.019965627603232866\n",
      "   -0.0000 if cp>=-0.06984694600105286\n",
      "   +0.0000 if cp<=0.0037705741357058325\n",
      "   +0.0000 if cp<=0.01750730276107788\n",
      "Run episode 714 with rewards 10.0\n",
      "============ 715 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.3742 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.5832 if \n",
      "   +3.7199 if cp<=-0.007844104617834073\n",
      "   +2.7157 if cp>=-0.06365211308002472\n",
      "   +0.9877 if cp<=0.055647230148315435\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp>=-0.06984694600105286\n",
      "   +0.0000 if cp<=0.0037705741357058325\n",
      "   +0.0000 if cp<=0.09684418886899948 & cp>=0.02696361988782883\n",
      "Run episode 715 with rewards 9.0\n",
      "============ 716 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.5894 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -35.4812 if \n",
      "   -9.7269 if cp<=-0.007844104617834073\n",
      "   -7.0864 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.007924350257962943 & cp>=-0.061009619385004044\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.019965627603232866\n",
      "   -0.0000 if cp>=-0.06984694600105286\n",
      "   +0.0000 if cp<=0.09684418886899948 & cp>=0.02696361988782883\n",
      "   +0.0000 if cp>=-0.02786743268370628\n",
      "Run episode 716 with rewards 10.0\n",
      "============ 717 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.5894 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +35.4812 if \n",
      "   +9.7269 if cp<=-0.007844104617834073\n",
      "   +7.0864 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.050792048871517184\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp>=-0.06984694600105286\n",
      "   +0.0000 if cp>=-0.02786743268370628\n",
      "   +0.0000 if \n",
      "Run episode 717 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 718 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.3757 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.6954 if \n",
      "   -3.8703 if cp<=-0.007844104617834073\n",
      "   -2.7027 if cp>=-0.06365211308002472\n",
      "   +0.8684 if cp<=-0.04263468086719513\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.019965627603232866\n",
      "   -0.0000 if cp>=-0.06984694600105286\n",
      "   +0.0000 if cp<=-0.08236064314842224\n",
      "   +0.0000 if cp<=-0.08236064314842224\n",
      "Run episode 718 with rewards 11.0\n",
      "============ 719 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.3729 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.8414 if \n",
      "   +3.7762 if cp<=-0.007844104617834073\n",
      "   +2.8704 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.06953626126050949\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.019965627603232866\n",
      "   -0.0000 if cp>=-0.06984694600105286\n",
      "   -0.0000 if cp<=0.06953626126050949\n",
      "   +0.0000 if cp>=0.13661570847034454\n",
      "Run episode 719 with rewards 10.0\n",
      "============ 720 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.6232 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -36.5417 if \n",
      "   -9.9789 if cp<=-0.007844104617834073\n",
      "   -7.5746 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.140504851937294\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   -0.0000 if cp>=-0.06984694600105286\n",
      "   +0.0000 if cp<=0.06953626126050949\n",
      "   +0.0000 if cp>=-0.09831868261098861\n",
      "Run episode 720 with rewards 9.0\n",
      "============ 721 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.6232 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +36.5417 if \n",
      "   +9.9789 if cp<=-0.007844104617834073\n",
      "   +7.5746 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.05441632792353631\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp>=-0.06984694600105286\n",
      "   +0.0000 if cp<=0.06953626126050949\n",
      "   +0.0000 if \n",
      "Run episode 721 with rewards 10.0\n",
      "============ 722 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.3058 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.1694 if \n",
      "   -3.5963 if cp<=-0.007844104617834073\n",
      "   -2.7298 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.06057514399290084\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp<=0.06953626126050949\n",
      "   -0.0000 if cp>=-0.033793761581182476\n",
      "   +0.0000 if cp>=-0.033793761581182476\n",
      "Run episode 722 with rewards 11.0\n",
      "============ 723 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.3010 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.4311 if \n",
      "   +3.5831 if cp<=-0.007844104617834073\n",
      "   +3.0301 if cp>=-0.06365211308002472\n",
      "   +0.9508 if cp<=0.06590571254491809\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp<=0.06953626126050949\n",
      "   -0.0000 if cp<=0.11796251684427261\n",
      "   -0.0000 if cp>=0.008584692142903805\n",
      "Run episode 723 with rewards 9.0\n",
      "============ 724 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.3826 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -34.9283 if \n",
      "   -9.3244 if cp<=-0.007844104617834073\n",
      "   -7.8779 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.02568284124135972\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp<=0.06953626126050949\n",
      "   -0.0000 if cp>=0.008584692142903805\n",
      "   +0.0000 if cp<=0.03860109373927117 & cp>=0.02568284124135972\n",
      "Run episode 724 with rewards 8.0\n",
      "============ 725 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.3826 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +34.9283 if \n",
      "   +9.3244 if cp<=-0.007844104617834073\n",
      "   +7.8779 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=0.01431173160672189\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp<=0.06953626126050949\n",
      "   +0.0000 if cp>=0.008584692142903805\n",
      "   +0.0000 if \n",
      "Run episode 725 with rewards 9.0\n",
      "============ 726 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2887 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.3071 if \n",
      "   -3.5525 if cp<=-0.007844104617834073\n",
      "   -3.0013 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.018144354224205017\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   -0.0000 if cp>=0.008584692142903805\n",
      "   +0.0000 if pa>=0.1739991456270218\n",
      "   +0.0000 if cp<=-0.016635843366384503\n",
      "Run episode 726 with rewards 11.0\n",
      "============ 727 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.2886 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.3135 if \n",
      "   +3.5521 if cp<=-0.007844104617834073\n",
      "   +3.0088 if cp>=-0.06365211308002472\n",
      "   +0.9972 if cp<=0.0920209586620331\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.019965627603232866\n",
      "   -0.0000 if cp>=0.008584692142903805\n",
      "   -0.0000 if pa>=0.1739991456270218\n",
      "   +0.0000 if cp<=0.0920209586620331\n",
      "Run episode 727 with rewards 9.0\n",
      "============ 728 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.3347 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -34.4563 if \n",
      "   -9.2020 if cp<=-0.007844104617834073\n",
      "   -7.7815 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.01689049080014229\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.019965627603232866\n",
      "   -0.0000 if cp>=0.008584692142903805\n",
      "   -0.0000 if cp<=0.0920209586620331\n",
      "   +0.0000 if cp>=-0.016842950135469433\n",
      "Run episode 728 with rewards 10.0\n",
      "============ 729 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.3347 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +34.4563 if \n",
      "   +9.2020 if cp<=-0.007844104617834073\n",
      "   +7.7815 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.06154335215687753\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.019965627603232866\n",
      "   +0.0000 if cp>=0.008584692142903805\n",
      "   +0.0000 if cp<=0.0920209586620331\n",
      "   +0.0000 if \n",
      "Run episode 729 with rewards 9.0\n",
      "============ 730 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2747 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.1710 if \n",
      "   -3.5175 if cp<=-0.007844104617834073\n",
      "   -2.9745 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.006760153826326133 & cp>=-0.060577566921710964\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=0.008584692142903805\n",
      "   -0.0000 if cp<=0.0920209586620331\n",
      "   -0.0000 if cp<=0.006760153826326133 & cp>=-0.060577566921710964\n",
      "   +0.0000 if cp<=0.006760153826326133 & cp>=-0.060577566921710964\n",
      "Run episode 730 with rewards 9.0\n",
      "============ 731 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.2738 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.2201 if \n",
      "   +3.5071 if cp<=-0.007844104617834073\n",
      "   +3.0311 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.03516058772802354\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=0.008584692142903805\n",
      "   -0.0000 if cp<=0.0920209586620331\n",
      "   +0.0000 if cp<=-0.019991318881511688\n",
      "   +0.0000 if cp<=-0.019991318881511688\n",
      "Run episode 731 with rewards 10.0\n",
      "============ 732 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.2841 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -34.1142 if \n",
      "   -9.0716 if cp<=-0.007844104617834073\n",
      "   -7.8133 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.09216814637184143\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.008584692142903805\n",
      "   +0.0000 if cp<=0.0920209586620331\n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp<=-0.049819710105657576 & cp>=-0.1321140021085739\n",
      "Run episode 732 with rewards 10.0\n",
      "============ 733 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.2841 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +34.1142 if \n",
      "   +9.0716 if cp<=-0.007844104617834073\n",
      "   +7.8133 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.04252564311027528\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.0920209586620331\n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp<=-0.049819710105657576 & cp>=-0.1321140021085739\n",
      "   +0.0000 if \n",
      "Run episode 733 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 734 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2373 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -12.8712 if \n",
      "   -3.4364 if cp<=-0.007844104617834073\n",
      "   -2.9375 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.06344078332185746\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.0920209586620331\n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   -0.0000 if cp>=-0.06344078332185746\n",
      "   +0.0000 if cp<=-0.019214102998375893 & cp>=-0.104292032122612\n",
      "Run episode 734 with rewards 9.0\n",
      "============ 735 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.2341 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.0418 if \n",
      "   +3.4276 if cp<=-0.007844104617834073\n",
      "   +3.1336 if cp>=-0.06365211308002472\n",
      "   +0.9929 if cp<=0.052711820602417005\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.0920209586620331\n",
      "   -0.0000 if cp>=-0.09216814637184143\n",
      "   -0.0000 if cp>=-0.06344078332185746\n",
      "   +0.0000 if cp>=0.12362590432167053\n",
      "Run episode 735 with rewards 9.0\n",
      "============ 736 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.1606 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -33.4325 if \n",
      "   -8.8101 if cp<=-0.007844104617834073\n",
      "   -8.0240 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=-0.055102209746837605 & cp>=-0.110066619515419\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.0920209586620331\n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   -0.0000 if cp>=-0.06344078332185746\n",
      "   +0.0000 if cp<=-0.04287654012441635 & cp>=-0.110066619515419\n",
      "Run episode 736 with rewards 9.0\n",
      "============ 737 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.1606 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +33.4325 if \n",
      "   +8.8101 if cp<=-0.007844104617834073\n",
      "   +8.0240 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=0.01601195568218828\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.0920209586620331\n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp>=-0.06344078332185746\n",
      "   +0.0000 if \n",
      "Run episode 737 with rewards 9.0\n",
      "============ 738 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1914 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.1042 if \n",
      "   -3.8816 if cp<=-0.007844104617834073\n",
      "   -3.2907 if cp>=-0.06365211308002472\n",
      "   +0.2960 if cp<=0.029060390219092378\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.0920209586620331\n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   -0.0000 if cp>=0.029060390219092378\n",
      "   +0.0000 if cp>=0.029060390219092378\n",
      "Run episode 738 with rewards 9.0\n",
      "============ 739 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.1914 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.1042 if \n",
      "   +3.8816 if cp<=-0.007844104617834073\n",
      "   +3.2907 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.06228518933057786\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.09216814637184143\n",
      "   -0.0000 if cp>=0.029060390219092378\n",
      "   +0.0000 if cp<=0.026414962857961653\n",
      "   +0.0000 if cp<=0.026414962857961653\n",
      "Run episode 739 with rewards 9.0\n",
      "============ 740 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.0767 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -33.8573 if \n",
      "  -10.0413 if cp<=-0.007844104617834073\n",
      "   -8.4975 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=-0.08596898168325424\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp>=0.029060390219092378\n",
      "   +0.0000 if cp<=-0.052777832746505736\n",
      "   +0.0000 if pa>=0.20511656999588013\n",
      "Run episode 740 with rewards 8.0\n",
      "============ 741 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.0767 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +33.8573 if \n",
      "  +10.0413 if cp<=-0.007844104617834073\n",
      "   +8.4975 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.04776645675301552\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp<=-0.052777832746505736\n",
      "   +0.0000 if pa>=0.20511656999588013\n",
      "   +0.0000 if \n",
      "Run episode 741 with rewards 9.0\n",
      "============ 742 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1870 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.0621 if \n",
      "   -3.8739 if cp<=-0.007844104617834073\n",
      "   -3.2783 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.015364259481430055\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp<=-0.052777832746505736\n",
      "   +0.0000 if cp<=0.015364259481430055 & cp>=-0.047369583696126934\n",
      "   +0.0000 if cp<=0.004754845332354315\n",
      "Run episode 742 with rewards 10.0\n",
      "============ 743 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.1870 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.0621 if \n",
      "   +3.8739 if cp<=-0.007844104617834073\n",
      "   +3.2783 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.06079309731721878\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.09216814637184143\n",
      "   -0.0000 if cp<=-0.052777832746505736\n",
      "   +0.0000 if cp<=0.015364259481430055 & cp>=-0.047369583696126934\n",
      "   +0.0000 if cp<=0.06079309731721878\n",
      "Run episode 743 with rewards 9.0\n",
      "============ 744 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.0599 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -33.6930 if \n",
      "  -10.0070 if cp<=-0.007844104617834073\n",
      "   -8.4506 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.09827734231948852\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   -0.0000 if cp<=0.015364259481430055 & cp>=-0.047369583696126934\n",
      "   +0.0000 if cp<=0.06079309731721878\n",
      "   +0.0000 if cp<=-0.03342854306101799\n",
      "Run episode 744 with rewards 10.0\n",
      "============ 745 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.0599 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +33.6930 if \n",
      "  +10.0070 if cp<=-0.007844104617834073\n",
      "   +8.4506 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.06971534043550492\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp<=0.015364259481430055 & cp>=-0.047369583696126934\n",
      "   +0.0000 if cp<=0.06079309731721878\n",
      "   +0.0000 if \n",
      "Run episode 745 with rewards 10.0\n",
      "============ 746 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1980 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.1916 if \n",
      "   -3.9180 if cp<=-0.007844104617834073\n",
      "   -3.3086 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.030507361143827443\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.09216814637184143\n",
      "   -0.0000 if cp<=0.06079309731721878\n",
      "   +0.0000 if cp<=0.0026476385071873684\n",
      "   +0.0000 if cp<=0.0026476385071873684\n",
      "Run episode 746 with rewards 10.0\n",
      "============ 747 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.1980 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.1916 if \n",
      "   +3.9180 if cp<=-0.007844104617834073\n",
      "   +3.3086 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.07089857310056687\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp<=0.06079309731721878\n",
      "   +0.0000 if cp<=0.0026476385071873684\n",
      "   -0.0000 if cp>=0.024317192286252974\n",
      "   +0.0000 if cp<=0.1129424124956131 & cp>=0.024317192286252974\n",
      "Run episode 747 with rewards 10.0\n",
      "============ 748 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.1052 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -34.2135 if \n",
      "  -10.1767 if cp<=-0.007844104617834073\n",
      "   -8.5749 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.08271209001541138\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp<=0.06079309731721878\n",
      "   -0.0000 if cp>=0.024317192286252974\n",
      "   -0.0000 if cp<=0.1129424124956131 & cp>=0.024317192286252974\n",
      "   +0.0000 if cp>=-0.12340719103813172\n",
      "Run episode 748 with rewards 10.0\n",
      "============ 749 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.1052 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +34.2135 if \n",
      "  +10.1767 if cp<=-0.007844104617834073\n",
      "   +8.5749 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.053749793767929085\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp<=0.06079309731721878\n",
      "   +0.0000 if cp>=0.024317192286252974\n",
      "   +0.0000 if cp>=-0.12340719103813172\n",
      "   +0.0000 if \n",
      "Run episode 749 with rewards 8.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 750 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1702 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -12.8938 if \n",
      "   -3.8352 if cp<=-0.007844104617834073\n",
      "   -3.2316 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.012861184030771257\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp<=0.06079309731721878\n",
      "   +0.0000 if cp>=-0.12340719103813172\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.03516068831086158\n",
      "Run episode 750 with rewards 9.0\n",
      "============ 751 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.1700 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +12.9052 if \n",
      "   +3.8346 if cp<=-0.007844104617834073\n",
      "   +3.2447 if cp>=-0.06365211308002472\n",
      "   +0.9977 if cp<=0.048398040235042586\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp<=0.06079309731721878\n",
      "   -0.0000 if cp>=-0.12340719103813172\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.08067341148853303\n",
      "Run episode 751 with rewards 10.0\n",
      "============ 752 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.9940 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -33.0526 if \n",
      "   -9.8322 if cp<=-0.007844104617834073\n",
      "   -8.3029 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.02918220162391663\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.09216814637184143\n",
      "   -0.0000 if cp<=0.06079309731721878\n",
      "   -0.0000 if cp>=-0.12340719103813172\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp>=0.04843078553676605\n",
      "Run episode 752 with rewards 9.0\n",
      "============ 753 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.9940 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +33.0526 if \n",
      "   +9.8322 if cp<=-0.007844104617834073\n",
      "   +8.3029 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.035092465206980714\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp<=0.06079309731721878\n",
      "   +0.0000 if cp>=-0.12340719103813172\n",
      "   +0.0000 if \n",
      "   +0.0000 if \n",
      "Run episode 753 with rewards 9.0\n",
      "============ 754 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1056 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -12.6002 if \n",
      "   -4.0256 if cp<=-0.007844104617834073\n",
      "   -2.9616 if cp>=-0.06365211308002472\n",
      "   +0.9489 if cp>=-0.09818213433027267\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp>=-0.12340719103813172\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.06487170383334159\n",
      "   +0.0000 if cp>=-0.06487170383334159\n",
      "Run episode 754 with rewards 9.0\n",
      "============ 755 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.0946 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.2340 if \n",
      "   +3.7688 if cp<=-0.007844104617834073\n",
      "   +3.6911 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.055822228640317925\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.09216814637184143\n",
      "   -0.0000 if cp>=-0.12340719103813172\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=-0.06487170383334159\n",
      "   +0.0000 if cp<=-1.929346472024718e-05\n",
      "Run episode 755 with rewards 9.0\n",
      "============ 756 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.8463 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -34.4310 if \n",
      "   -9.8188 if cp<=-0.007844104617834073\n",
      "   -9.5975 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.1048249900341034\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp>=-0.12340719103813172\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-1.929346472024718e-05\n",
      "   +0.0000 if cp<=-0.1048249900341034\n",
      "Run episode 756 with rewards 10.0\n",
      "============ 757 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.8463 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +34.4310 if \n",
      "   +9.8188 if cp<=-0.007844104617834073\n",
      "   +9.5975 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.06716973185539246 & cp>=-0.001959251426160335\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.09216814637184143\n",
      "   +0.0000 if cp>=-0.12340719103813172\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-1.929346472024718e-05\n",
      "   +0.0000 if \n",
      "Run episode 757 with rewards 9.0\n",
      "============ 758 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.0993 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -13.2980 if \n",
      "   -3.7922 if cp<=-0.007844104617834073\n",
      "   -3.7067 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.019420797377824785\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.12340719103813172\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-1.929346472024718e-05\n",
      "   +0.0000 if pa>=0.20542341470718384\n",
      "   +0.0000 if cp<=0.019420797377824785 & cp>=-0.04822879657149315\n",
      "Run episode 758 with rewards 11.0\n",
      "origin 2.2451334275713337e-05 new 2.2451335462717096e-05 not updated\n",
      "============ 759 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.0993 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +13.2980 if \n",
      "   +3.7922 if cp<=-0.007844104617834073\n",
      "   +3.7067 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.0774587467312813\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.12340719103813172\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-1.929346472024718e-05\n",
      "   +0.0000 if pa>=0.20542341470718384\n",
      "   +0.0000 if cp<=0.019420797377824785 & cp>=-0.04822879657149315\n",
      "Run episode 759 with rewards 9.0\n",
      "origin 1.9349300028534393e-05 new 1.9349300222085945e-05 not updated\n",
      "============ 760 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.8660 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -34.6721 if \n",
      "   -9.8939 if cp<=-0.007844104617834073\n",
      "   -9.6607 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.027212132140994074\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.12340719103813172\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-1.929346472024718e-05\n",
      "   +0.0000 if pa>=0.20542341470718384\n",
      "   +0.0000 if cp<=0.019420797377824785 & cp>=-0.04822879657149315\n",
      "Run episode 760 with rewards 10.0\n",
      "============ 761 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.8660 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +34.6721 if \n",
      "   +9.8939 if cp<=-0.007844104617834073\n",
      "   +9.6607 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.08660009056329727\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.12340719103813172\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp<=-1.929346472024718e-05\n",
      "   +0.0000 if pa>=0.20542341470718384\n",
      "   +0.0000 if \n",
      "Run episode 761 with rewards 10.0\n",
      "============ 762 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.0533 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -12.7433 if \n",
      "   -3.6364 if cp<=-0.007844104617834073\n",
      "   -3.5507 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.05861919820308685\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.12340719103813172\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-1.929346472024718e-05\n",
      "   -0.0000 if cp>=-0.05861919820308685\n",
      "   +0.0000 if cp<=-0.0987367421388626\n",
      "Run episode 762 with rewards 10.0\n",
      "============ 763 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.0533 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +12.7433 if \n",
      "   +3.6364 if cp<=-0.007844104617834073\n",
      "   +3.5507 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.05090207308530808\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.12340719103813172\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=-1.929346472024718e-05\n",
      "   -0.0000 if cp>=-0.05861919820308685\n",
      "   +0.0000 if cp<=0.02285142205655575\n",
      "Run episode 763 with rewards 9.0\n",
      "============ 764 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.6823 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -32.4502 if \n",
      "   -9.2630 if cp<=-0.007844104617834073\n",
      "   -9.0413 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.03897663727402687\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.12340719103813172\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.05861919820308685\n",
      "   +0.0000 if cp<=0.02285142205655575\n",
      "   +0.0000 if cp<=-0.022901732660830017\n",
      "Run episode 764 with rewards 9.0\n",
      "============ 765 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.6823 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +32.4502 if \n",
      "   +9.2630 if cp<=-0.007844104617834073\n",
      "   +9.0413 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.0512876182794571\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.12340719103813172\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.05861919820308685\n",
      "   +0.0000 if cp<=0.02285142205655575\n",
      "   +0.0000 if \n",
      "Run episode 765 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 766 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.0475 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -12.6720 if \n",
      "   -3.6173 if cp<=-0.007844104617834073\n",
      "   -3.5307 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.026228468865156174 & cp>=-0.055452845990657806\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp>=-0.05861919820308685\n",
      "   +0.0000 if cp<=0.02285142205655575\n",
      "   +0.0000 if cp<=0.026228468865156174\n",
      "   +0.0000 if pa>=0.20328876376152039\n",
      "Run episode 766 with rewards 10.0\n",
      "============ 767 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.0475 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +12.6720 if \n",
      "   +3.6173 if cp<=-0.007844104617834073\n",
      "   +3.5307 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.07613179534673692\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.05861919820308685\n",
      "   -0.0000 if cp<=0.02285142205655575\n",
      "   -0.0000 if cp<=0.026228468865156174\n",
      "   +0.0000 if cp<=0.07613179534673692\n",
      "Run episode 767 with rewards 10.0\n",
      "============ 768 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.6586 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -32.2066 if \n",
      "   -9.2225 if cp<=-0.007844104617834073\n",
      "   -8.9612 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.10113739669322967\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp>=-0.05861919820308685\n",
      "   +0.0000 if cp<=0.02285142205655575\n",
      "   +0.0000 if cp<=0.07613179534673692\n",
      "   +0.0000 if cp<=-0.059623217582702635 & cp>=-0.10113739669322967\n",
      "Run episode 768 with rewards 9.0\n",
      "============ 769 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.6586 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  +32.2066 if \n",
      "   +9.2225 if cp<=-0.007844104617834073\n",
      "   +8.9612 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp<=0.075929394364357\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.05861919820308685\n",
      "   +0.0000 if cp<=0.02285142205655575\n",
      "   +0.0000 if cp<=0.07613179534673692\n",
      "   +0.0000 if \n",
      "Run episode 769 with rewards 8.0\n",
      "============ 770 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.9984 if cv>=-0.2412268579006195 & pa<=-0.03234592527151106 & pav>=0.014347173646092434\n",
      "  -12.0947 if \n",
      "   -3.4634 if cp<=-0.007844104617834073\n",
      "   -3.3652 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.047418434917926786\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.02285142205655575\n",
      "   +0.0000 if cp<=0.07613179534673692\n",
      "   -0.0000 if cp>=-0.030832522362470617\n",
      "   +0.0000 if cp>=-0.030832522362470617\n",
      "Run episode 770 with rewards 8.0\n",
      "============ 771 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.0947 if \n",
      "   +3.4634 if cp<=-0.007844104617834073\n",
      "   +3.3652 if cp>=-0.06365211308002472\n",
      "   +1.0000 if cp>=-0.047418434917926786\n",
      "   +1.0000 if cp<=0.018871868029236804\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.02285142205655575\n",
      "   -0.0000 if cp<=0.07613179534673692\n",
      "   -0.0000 if cp>=-0.03166245967149735\n",
      "   +0.0000 if cp>=0.050616368651390076\n",
      "Run episode 771 with rewards 9.0\n",
      "============ 772 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -29.8568 if \n",
      "   -8.5676 if cp<=-0.007844104617834073\n",
      "   -8.2915 if cp>=-0.06365211308002472\n",
      "   -2.4892 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.03851274102926254\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.02285142205655575\n",
      "   -0.0000 if cp<=0.07613179534673692\n",
      "   -0.0000 if cp>=-0.03166245967149735\n",
      "   +0.0000 if cp>=0.02567945420742035\n",
      "Run episode 772 with rewards 10.0\n",
      "============ 773 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +29.8568 if \n",
      "   +8.5676 if cp<=-0.007844104617834073\n",
      "   +8.2915 if cp>=-0.06365211308002472\n",
      "   +2.4892 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.05398668199777604\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.02285142205655575\n",
      "   +0.0000 if cp<=0.07613179534673692\n",
      "   +0.0000 if cp>=-0.03166245967149735\n",
      "   +0.0000 if \n",
      "Run episode 773 with rewards 11.0\n",
      "============ 774 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.0079 if \n",
      "   -3.7450 if cp<=-0.007844104617834073\n",
      "   -2.9513 if cp>=-0.06365211308002472\n",
      "   -1.3858 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.07559467852115631\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.02285142205655575\n",
      "   -0.0000 if cp>=-0.03166245967149735\n",
      "   +0.0000 if cp>=-0.07559467852115631\n",
      "   +0.0000 if cp>=-0.07559467852115631\n",
      "Run episode 774 with rewards 10.0\n",
      "============ 775 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.6318 if \n",
      "   +3.7074 if cp<=-0.007844104617834073\n",
      "   +3.6661 if cp>=-0.06365211308002472\n",
      "   +1.0720 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.041873242706060416\n",
      "--------------\n",
      "   -0.0001 if \n",
      "   +0.0000 if cp<=0.02285142205655575\n",
      "   -0.0001 if cp>=-0.07559467852115631\n",
      "   -0.0000 if cp<=0.08221389800310136\n",
      "   +0.0000 if cp<=0.08221389800310136\n",
      "Run episode 775 with rewards 8.0\n",
      "============ 776 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -32.1078 if \n",
      "   -9.4314 if cp<=-0.007844104617834073\n",
      "   -9.3157 if cp>=-0.06365211308002472\n",
      "   -2.7349 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.047260561585426325\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07559467852115631\n",
      "   +0.0000 if cp<=0.08221389800310136\n",
      "   +0.0000 if cp<=-0.020995887741446492\n",
      "   +0.0000 if pa>=0.16501495242118835\n",
      "Run episode 776 with rewards 9.0\n",
      "============ 777 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +32.1078 if \n",
      "   +9.4314 if cp<=-0.007844104617834073\n",
      "   +9.3157 if cp>=-0.06365211308002472\n",
      "   +2.7349 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.04393986314535142\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07559467852115631\n",
      "   +0.0000 if cp<=0.08221389800310136\n",
      "   +0.0000 if cp<=-0.020995887741446492\n",
      "   +0.0000 if \n",
      "Run episode 777 with rewards 10.0\n",
      "============ 778 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.5284 if \n",
      "   -4.1179 if cp<=-0.007844104617834073\n",
      "   -3.1436 if cp>=-0.06365211308002472\n",
      "   -1.6342 if cp<=0.018871868029236804\n",
      "   +0.5336 if cp<=-0.11187238097190857\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08221389800310136\n",
      "   +0.0000 if cp<=-0.020995887741446492\n",
      "   -0.0000 if cp>=-0.04642718434333801\n",
      "   +0.0000 if cp>=-0.04642718434333801\n",
      "Run episode 778 with rewards 10.0\n",
      "============ 779 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.7866 if \n",
      "   +4.0993 if cp<=-0.007844104617834073\n",
      "   +3.4441 if cp>=-0.06365211308002472\n",
      "   +1.6269 if cp<=0.018871868029236804\n",
      "   +0.9478 if cp<=0.08386858254671098\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.08221389800310136\n",
      "   +0.0000 if cp<=-0.020995887741446492\n",
      "   -0.0000 if cp>=0.0559616707265377\n",
      "   +0.0000 if cp>=0.12427230179309845\n",
      "Run episode 779 with rewards 10.0\n",
      "============ 780 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -32.8293 if \n",
      "  -10.5322 if cp<=-0.007844104617834073\n",
      "   -8.8375 if cp>=-0.06365211308002472\n",
      "   -4.1815 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.05730056911706924 & cp>=-0.0994550883769989\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08221389800310136\n",
      "   +0.0000 if cp>=0.0559616707265377\n",
      "   +0.0000 if cp>=0.12427230179309845\n",
      "   +0.0000 if cp>=-0.05730056911706924\n",
      "Run episode 780 with rewards 10.0\n",
      "============ 781 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +32.8293 if \n",
      "  +10.5322 if cp<=-0.007844104617834073\n",
      "   +8.8375 if cp>=-0.06365211308002472\n",
      "   +4.1815 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.040237558633089074\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08221389800310136\n",
      "   +0.0000 if cp>=0.0559616707265377\n",
      "   +0.0000 if cp>=-0.05730056911706924\n",
      "   +0.0000 if \n",
      "Run episode 781 with rewards 10.0\n",
      "============ 782 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.5265 if \n",
      "   -4.0187 if cp<=-0.007844104617834073\n",
      "   -3.3721 if cp>=-0.06365211308002472\n",
      "   -1.5955 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.11943414211273193\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08221389800310136\n",
      "   -0.0000 if cp>=-0.05730056911706924\n",
      "   +0.0000 if cp>=-0.07991157025098801\n",
      "   +0.0000 if cp<=-0.11943414211273193\n",
      "Run episode 782 with rewards 8.0\n",
      "============ 783 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.5534 if \n",
      "   +4.0169 if cp<=-0.007844104617834073\n",
      "   +3.4032 if cp>=-0.06365211308002472\n",
      "   +1.5948 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.05726691186428072\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08221389800310136\n",
      "   -0.0000 if cp>=-0.05730056911706924\n",
      "   -0.0000 if cp>=-0.07991157025098801\n",
      "   +0.0000 if cp>=0.11192282289266586\n",
      "Run episode 783 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 784 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -31.9090 if \n",
      "  -10.2195 if cp<=-0.007844104617834073\n",
      "   -8.6463 if cp>=-0.06365211308002472\n",
      "   -4.0656 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.0970751941204071\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08221389800310136\n",
      "   -0.0000 if cp>=-0.05730056911706924\n",
      "   +0.0000 if cp>=-0.07991157025098801\n",
      "   +0.0000 if cp<=-0.06730402559041976 & cp>=-0.13933166563510896\n",
      "Run episode 784 with rewards 10.0\n",
      "============ 785 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +31.9090 if \n",
      "  +10.2195 if cp<=-0.007844104617834073\n",
      "   +8.6463 if cp>=-0.06365211308002472\n",
      "   +4.0656 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.09438633024692536\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08221389800310136\n",
      "   +0.0000 if cp>=-0.05730056911706924\n",
      "   +0.0000 if cp>=-0.07991157025098801\n",
      "   +0.0000 if \n",
      "Run episode 785 with rewards 9.0\n",
      "============ 786 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.7029 if \n",
      "   -4.0684 if cp<=-0.007844104617834073\n",
      "   -3.4421 if cp>=-0.06365211308002472\n",
      "   -1.6185 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.021905697695910928\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08221389800310136\n",
      "   -0.0000 if cp>=-0.07991157025098801\n",
      "   -0.0000 if cp>=-0.021905697695910928\n",
      "   +0.0000 if cp>=-0.021905697695910928\n",
      "Run episode 786 with rewards 10.0\n",
      "============ 787 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.8881 if \n",
      "   +3.9578 if cp<=-0.007844104617834073\n",
      "   +3.6549 if cp>=-0.06365211308002472\n",
      "   +1.5265 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.06920306086540223 & cp>=-0.002433718927204608\n",
      "--------------\n",
      "   -0.0000 if cp<=0.08221389800310136\n",
      "   -0.0000 if cp>=-0.07991157025098801\n",
      "   -0.0000 if cp>=-0.021905697695910928\n",
      "   -0.0000 if cp<=0.02713120877742768\n",
      "   +0.0000 if cp<=-0.002433718927204608\n",
      "Run episode 787 with rewards 10.0\n",
      "============ 788 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -33.2052 if \n",
      "  -10.2045 if cp<=-0.007844104617834073\n",
      "   -9.4079 if cp>=-0.06365211308002472\n",
      "   -3.9409 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.044559305906295775 & cp>=-0.04284560084342957\n",
      "--------------\n",
      "   +0.0000 if cp<=0.08221389800310136\n",
      "   -0.0000 if cp>=-0.07991157025098801\n",
      "   -0.0000 if cp>=-0.021905697695910928\n",
      "   +0.0000 if cp<=0.02713120877742768\n",
      "   +0.0000 if cp<=0.02792586944997311 & cp>=-0.04284560084342957\n",
      "Run episode 788 with rewards 9.0\n",
      "============ 789 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +33.2052 if \n",
      "  +10.2045 if cp<=-0.007844104617834073\n",
      "   +9.4079 if cp>=-0.06365211308002472\n",
      "   +3.9409 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.05496792495250703\n",
      "--------------\n",
      "   +0.0000 if cp<=0.08221389800310136\n",
      "   +0.0000 if cp>=-0.07991157025098801\n",
      "   +0.0000 if cp>=-0.021905697695910928\n",
      "   +0.0000 if cp<=0.02713120877742768\n",
      "   +0.0000 if \n",
      "Run episode 789 with rewards 10.0\n",
      "============ 790 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.9040 if \n",
      "   -3.9656 if cp<=-0.007844104617834073\n",
      "   -3.6560 if cp>=-0.06365211308002472\n",
      "   -1.5315 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.0031294421292841395\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.07991157025098801\n",
      "   -0.0000 if cp>=-0.021905697695910928\n",
      "   +0.0000 if cp<=0.02713120877742768\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.030172641575336456\n",
      "Run episode 790 with rewards 10.0\n",
      "============ 791 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.9040 if \n",
      "   +3.9656 if cp<=-0.007844104617834073\n",
      "   +3.6560 if cp>=-0.06365211308002472\n",
      "   +1.5315 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.04325576126575471\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.07991157025098801\n",
      "   -0.0000 if cp>=-0.021905697695910928\n",
      "   -0.0000 if cp<=0.02713120877742768\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=-0.022392859682440758\n",
      "Run episode 791 with rewards 9.0\n",
      "============ 792 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -33.2704 if \n",
      "  -10.2286 if cp<=-0.007844104617834073\n",
      "   -9.4218 if cp>=-0.06365211308002472\n",
      "   -3.9544 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.034142839908599856\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.07991157025098801\n",
      "   -0.0000 if cp>=-0.021905697695910928\n",
      "   +0.0000 if cp<=0.02713120877742768\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=-0.033853188157081604\n",
      "Run episode 792 with rewards 10.0\n",
      "============ 793 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +33.2704 if \n",
      "  +10.2286 if cp<=-0.007844104617834073\n",
      "   +9.4218 if cp>=-0.06365211308002472\n",
      "   +3.9544 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.0751335397362709\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.07991157025098801\n",
      "   +0.0000 if cp>=-0.021905697695910928\n",
      "   +0.0000 if cp<=0.02713120877742768\n",
      "   +0.0000 if \n",
      "   +0.0000 if \n",
      "Run episode 793 with rewards 9.0\n",
      "============ 794 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -13.0563 if \n",
      "   -4.0140 if cp<=-0.007844104617834073\n",
      "   -3.6974 if cp>=-0.06365211308002472\n",
      "   -1.5518 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.004221850447356709\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.021905697695910928\n",
      "   +0.0000 if cp<=0.02713120877742768\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.015452742949128153\n",
      "   +0.0000 if pa>=0.20049458742141724\n",
      "Run episode 794 with rewards 9.0\n",
      "============ 795 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +13.0563 if \n",
      "   +4.0140 if cp<=-0.007844104617834073\n",
      "   +3.6974 if cp>=-0.06365211308002472\n",
      "   +1.5518 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.07742609381675722\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.021905697695910928\n",
      "   -0.0000 if cp<=0.02713120877742768\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.015452742949128153\n",
      "   +0.0000 if cp<=0.07742609381675722\n",
      "Run episode 795 with rewards 9.0\n",
      "============ 796 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -33.8818 if \n",
      "  -10.4214 if cp<=-0.007844104617834073\n",
      "   -9.5902 if cp>=-0.06365211308002472\n",
      "   -4.0320 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.006179778464138516 & cp>=-0.05023829713463783\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.021905697695910928\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.015452742949128153\n",
      "   +0.0000 if cp<=0.07742609381675722\n",
      "   +0.0000 if cp<=0.01912793219089508\n",
      "Run episode 796 with rewards 10.0\n",
      "============ 797 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +33.8818 if \n",
      "  +10.4214 if cp<=-0.007844104617834073\n",
      "   +9.5902 if cp>=-0.06365211308002472\n",
      "   +4.0320 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.09764031916856766\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.021905697695910928\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.015452742949128153\n",
      "   +0.0000 if cp<=0.07742609381675722\n",
      "   +0.0000 if \n",
      "Run episode 797 with rewards 9.0\n",
      "============ 798 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.7824 if \n",
      "   -3.9316 if cp<=-0.007844104617834073\n",
      "   -3.6180 if cp>=-0.06365211308002472\n",
      "   -1.5211 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.0673524186015129\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.021905697695910928\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.015452742949128153\n",
      "   +0.0000 if cp>=-0.10053028613328933\n",
      "   +0.0000 if cp>=-0.0673524186015129\n",
      "Run episode 798 with rewards 11.0\n",
      "============ 799 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.8099 if \n",
      "   +3.9296 if cp<=-0.007844104617834073\n",
      "   +3.6503 if cp>=-0.06365211308002472\n",
      "   +1.4959 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.06486110389232637\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.015452742949128153\n",
      "   -0.0000 if cp>=-0.10053028613328933\n",
      "   -0.0000 if cp>=-0.0673524186015129\n",
      "   +0.0000 if cp<=0.06486110389232637 & cp>=0.010767837055027485\n",
      "Run episode 799 with rewards 9.0\n",
      "============ 800 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -32.8932 if \n",
      "  -10.0924 if cp<=-0.007844104617834073\n",
      "   -9.3701 if cp>=-0.06365211308002472\n",
      "   -3.8440 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.039528431743383406\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.015452742949128153\n",
      "   -0.0000 if cp>=-0.10053028613328933\n",
      "   -0.0000 if cp>=-0.0673524186015129\n",
      "   +0.0000 if cp<=0.039528431743383406 & cp>=0.029301795735955247\n",
      "Run episode 800 with rewards 10.0\n",
      "============ 801 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +32.8932 if \n",
      "  +10.0924 if cp<=-0.007844104617834073\n",
      "   +9.3701 if cp>=-0.06365211308002472\n",
      "   +3.8440 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.04717285633087159\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.015452742949128153\n",
      "   +0.0000 if cp>=-0.10053028613328933\n",
      "   +0.0000 if cp>=-0.0673524186015129\n",
      "   +0.0000 if \n",
      "Run episode 801 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 802 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.8806 if \n",
      "   -3.9521 if cp<=-0.007844104617834073\n",
      "   -3.6692 if cp>=-0.06365211308002472\n",
      "   -1.5052 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.023482497036457054\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.10053028613328933\n",
      "   -0.0000 if cp>=-0.0673524186015129\n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   +0.0000 if cp<=-0.08056063652038574\n",
      "Run episode 802 with rewards 10.0\n",
      "============ 803 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.8806 if \n",
      "   +3.9521 if cp<=-0.007844104617834073\n",
      "   +3.6692 if cp>=-0.06365211308002472\n",
      "   +1.5052 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.05575410723686219 & cp>=-0.01136720646172762\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.10053028613328933\n",
      "   -0.0000 if cp>=-0.0673524186015129\n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   +0.0000 if cp<=-0.01136720646172762\n",
      "Run episode 803 with rewards 10.0\n",
      "============ 804 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -33.1895 if \n",
      "  -10.1898 if cp<=-0.007844104617834073\n",
      "   -9.4516 if cp>=-0.06365211308002472\n",
      "   -3.8868 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.0580815851688385\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.10053028613328933\n",
      "   -0.0000 if cp>=-0.0673524186015129\n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   +0.0000 if pa>=0.15795095264911652\n",
      "Run episode 804 with rewards 10.0\n",
      "============ 805 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +33.1895 if \n",
      "  +10.1898 if cp<=-0.007844104617834073\n",
      "   +9.4516 if cp>=-0.06365211308002472\n",
      "   +3.8868 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.07130703479051591\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.10053028613328933\n",
      "   +0.0000 if cp>=-0.0673524186015129\n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   +0.0000 if \n",
      "Run episode 805 with rewards 8.0\n",
      "============ 806 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.5553 if \n",
      "   -3.8547 if cp<=-0.007844104617834073\n",
      "   -3.5755 if cp>=-0.06365211308002472\n",
      "   -1.4704 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.04627497494220733\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.10053028613328933\n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   +0.0000 if pa>=0.17644432187080383\n",
      "   +0.0000 if cp<=-0.02876752279698848\n",
      "Run episode 806 with rewards 10.0\n",
      "============ 807 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.5553 if \n",
      "   +3.8547 if cp<=-0.007844104617834073\n",
      "   +3.5755 if cp>=-0.06365211308002472\n",
      "   +1.4704 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.07590395510196686\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.10053028613328933\n",
      "   -0.0000 if cp<=-0.010204406455159186\n",
      "   -0.0000 if pa>=0.17644432187080383\n",
      "   +0.0000 if cp<=0.07590395510196686\n",
      "Run episode 807 with rewards 10.0\n",
      "============ 808 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -31.8902 if \n",
      "   -9.8026 if cp<=-0.007844104617834073\n",
      "   -9.0739 if cp>=-0.06365211308002472\n",
      "   -3.7434 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.05289920940995216 & cp>=-0.09314930588006973\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp>=-0.10053028613328933\n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   +0.0000 if cp<=0.07590395510196686\n",
      "   +0.0000 if cp>=-0.05289920940995216\n",
      "Run episode 808 with rewards 9.0\n",
      "============ 809 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +31.8902 if \n",
      "   +9.8026 if cp<=-0.007844104617834073\n",
      "   +9.0739 if cp>=-0.06365211308002472\n",
      "   +3.7434 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.05548080354928971\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.10053028613328933\n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   +0.0000 if cp<=0.07590395510196686\n",
      "   +0.0000 if \n",
      "Run episode 809 with rewards 10.0\n",
      "============ 810 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.4086 if \n",
      "   -3.8142 if cp<=-0.007844104617834073\n",
      "   -3.5307 if cp>=-0.06365211308002472\n",
      "   -1.4566 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.09354725927114486\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.10053028613328933\n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   +0.0000 if cp>=-0.13511010110378266\n",
      "   +0.0000 if pa>=0.2057034820318222\n",
      "Run episode 810 with rewards 10.0\n",
      "============ 811 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.6309 if \n",
      "   +3.6830 if cp<=-0.007844104617834073\n",
      "   +3.7873 if cp>=-0.06365211308002472\n",
      "   +1.3684 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.05455381274223328\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.10053028613328933\n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   -0.0000 if cp>=-0.13511010110378266\n",
      "   +0.0000 if cp>=0.05455381274223328\n",
      "Run episode 811 with rewards 10.0\n",
      "============ 812 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -32.1724 if \n",
      "   -9.3928 if cp<=-0.007844104617834073\n",
      "   -9.6387 if cp>=-0.06365211308002472\n",
      "   -3.4929 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.00794682726264\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.10053028613328933\n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   -0.0000 if cp>=-0.13511010110378266\n",
      "   +0.0000 if cp>=-0.035185838118195534\n",
      "Run episode 812 with rewards 10.0\n",
      "============ 813 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +32.1724 if \n",
      "   +9.3928 if cp<=-0.007844104617834073\n",
      "   +9.6387 if cp>=-0.06365211308002472\n",
      "   +3.4929 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.079789736866951\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.10053028613328933\n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   +0.0000 if cp>=-0.13511010110378266\n",
      "   +0.0000 if \n",
      "Run episode 813 with rewards 10.0\n",
      "============ 814 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.3611 if \n",
      "   -3.7497 if cp<=-0.007844104617834073\n",
      "   -3.5472 if cp>=-0.06365211308002472\n",
      "   -1.5193 if cp<=0.018871868029236804\n",
      "   +0.8262 if cp<=-0.12297816276550293\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.10053028613328933\n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   +0.0000 if cp<=-0.057086555659770964\n",
      "   +0.0000 if cp<=-0.057086555659770964\n",
      "Run episode 814 with rewards 9.0\n",
      "============ 815 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.3611 if \n",
      "   +3.7497 if cp<=-0.007844104617834073\n",
      "   +3.5472 if cp>=-0.06365211308002472\n",
      "   +1.5193 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.06072913482785225\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   +0.0000 if cp<=-0.057086555659770964\n",
      "   -0.0000 if cp>=0.02087563481181861\n",
      "   +0.0000 if cp>=0.06072913482785225\n",
      "Run episode 815 with rewards 9.0\n",
      "============ 816 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -31.1231 if \n",
      "   -9.4528 if cp<=-0.007844104617834073\n",
      "   -8.9259 if cp>=-0.06365211308002472\n",
      "   -3.8401 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.06371719688177109\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   -0.0000 if cp>=0.02087563481181861\n",
      "   -0.0000 if cp>=0.06072913482785225\n",
      "   +0.0000 if cp>=-0.09625696688890457\n",
      "Run episode 816 with rewards 9.0\n",
      "============ 817 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +31.1231 if \n",
      "   +9.4528 if cp<=-0.007844104617834073\n",
      "   +8.9259 if cp>=-0.06365211308002472\n",
      "   +3.8401 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.042012175172567376\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   +0.0000 if cp>=0.02087563481181861\n",
      "   +0.0000 if cp>=-0.09625696688890457\n",
      "   +0.0000 if \n",
      "Run episode 817 with rewards 9.0\n",
      "============ 818 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.1788 if \n",
      "   -3.6990 if cp<=-0.007844104617834073\n",
      "   -3.4928 if cp>=-0.06365211308002472\n",
      "   -1.5027 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.052559197694063184\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   +0.0000 if cp>=-0.09625696688890457\n",
      "   -0.0000 if cp>=-0.052559197694063184\n",
      "   +0.0000 if pa>=0.16352996230125427\n",
      "Run episode 818 with rewards 8.0\n",
      "============ 819 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.3071 if \n",
      "   +3.6567 if cp<=-0.007844104617834073\n",
      "   +3.6429 if cp>=-0.06365211308002472\n",
      "   +1.5013 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.03146108835935594\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   -0.0000 if cp>=-0.09625696688890457\n",
      "   -0.0000 if cp>=-0.052559197694063184\n",
      "   +0.0000 if cp<=0.0074644953943789165 & cp>=-0.008695586770772932\n",
      "Run episode 819 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 820 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -30.9228 if \n",
      "   -9.2037 if cp<=-0.007844104617834073\n",
      "   -9.1457 if cp>=-0.06365211308002472\n",
      "   -3.7918 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.12016011476516723\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   +0.0000 if cp>=-0.09625696688890457\n",
      "   -0.0000 if cp>=-0.052559197694063184\n",
      "   +0.0000 if cp<=-0.03851780146360397 & cp>=-0.12016011476516723\n",
      "Run episode 820 with rewards 9.0\n",
      "============ 821 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +30.9228 if \n",
      "   +9.2037 if cp<=-0.007844104617834073\n",
      "   +9.1457 if cp>=-0.06365211308002472\n",
      "   +3.7918 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.08146689981222154 & cp>=0.01193166058510542\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   +0.0000 if cp>=-0.09625696688890457\n",
      "   +0.0000 if cp>=-0.052559197694063184\n",
      "   +0.0000 if \n",
      "Run episode 821 with rewards 9.0\n",
      "============ 822 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.3939 if \n",
      "   -3.6888 if cp<=-0.007844104617834073\n",
      "   -3.6656 if cp>=-0.06365211308002472\n",
      "   -1.5198 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.040069867670536045\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=-0.010204406455159186\n",
      "   -0.0000 if cp>=-0.09625696688890457\n",
      "   +0.0000 if cp<=0.040069867670536045\n",
      "   +0.0000 if cp<=0.040069867670536045\n",
      "Run episode 822 with rewards 9.0\n",
      "============ 823 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.3939 if \n",
      "   +3.6888 if cp<=-0.007844104617834073\n",
      "   +3.6656 if cp>=-0.06365211308002472\n",
      "   +1.5198 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.08298952132463457\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.09625696688890457\n",
      "   -0.0000 if cp<=0.040069867670536045\n",
      "   +0.0000 if cp<=0.08298952132463457\n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "Run episode 823 with rewards 9.0\n",
      "============ 824 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -31.2446 if \n",
      "   -9.3082 if cp<=-0.007844104617834073\n",
      "   -9.2310 if cp>=-0.06365211308002472\n",
      "   -3.8403 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.037559560313820836\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.09625696688890457\n",
      "   -0.0000 if cp<=0.08298952132463457\n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=-0.037559560313820836\n",
      "Run episode 824 with rewards 9.0\n",
      "============ 825 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +31.2446 if \n",
      "   +9.3082 if cp<=-0.007844104617834073\n",
      "   +9.2310 if cp>=-0.06365211308002472\n",
      "   +3.8403 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.06003556102514268 & cp>=-0.007129047624766826\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.09625696688890457\n",
      "   +0.0000 if cp<=0.08298952132463457\n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if \n",
      "Run episode 825 with rewards 9.0\n",
      "============ 826 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.4336 if \n",
      "   -3.7042 if cp<=-0.007844104617834073\n",
      "   -3.6734 if cp>=-0.06365211308002472\n",
      "   -1.5282 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.011081819608807554\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08298952132463457\n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp>=-0.011081819608807554\n",
      "   +0.0000 if cp>=-0.011081819608807554\n",
      "Run episode 826 with rewards 9.0\n",
      "============ 827 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.4336 if \n",
      "   +3.7042 if cp<=-0.007844104617834073\n",
      "   +3.6734 if cp>=-0.06365211308002472\n",
      "   +1.5282 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.08036274015903475\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.08298952132463457\n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp>=0.048922798782587054\n",
      "   +0.0000 if cp>=0.05943726897239685\n",
      "Run episode 827 with rewards 10.0\n",
      "============ 828 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -31.4264 if \n",
      "   -9.3745 if cp<=-0.007844104617834073\n",
      "   -9.2792 if cp>=-0.06365211308002472\n",
      "   -3.8777 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.06288867741823197\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08298952132463457\n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp>=0.048922798782587054\n",
      "   +0.0000 if cp>=-0.036122982203960416\n",
      "Run episode 828 with rewards 8.0\n",
      "============ 829 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +31.4264 if \n",
      "   +9.3745 if cp<=-0.007844104617834073\n",
      "   +9.2792 if cp>=-0.06365211308002472\n",
      "   +3.8777 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.04653768986463548\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08298952132463457\n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp>=-0.036122982203960416\n",
      "   +0.0000 if \n",
      "Run episode 829 with rewards 8.0\n",
      "============ 830 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -11.8197 if \n",
      "   -3.5258 if cp<=-0.007844104617834073\n",
      "   -3.4900 if cp>=-0.06365211308002472\n",
      "   -1.4584 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.055138358473777765\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08298952132463457\n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp>=-0.03899474889039992\n",
      "   +0.0000 if cp<=-0.07912133932113648\n",
      "Run episode 830 with rewards 10.0\n",
      "============ 831 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.4104 if \n",
      "   +3.1223 if cp<=-0.007844104617834073\n",
      "   +4.1758 if cp>=-0.06365211308002472\n",
      "   +1.3248 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.04475807547569276\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08298952132463457\n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp>=-0.03899474889039992\n",
      "   +0.0000 if cp<=0.0025783927179873056\n",
      "Run episode 831 with rewards 9.0\n",
      "============ 832 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -31.3152 if \n",
      "   -7.8963 if cp<=-0.007844104617834073\n",
      "  -10.5287 if cp>=-0.06365211308002472\n",
      "   -3.3642 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.06029307171702385\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08298952132463457\n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp>=-0.03899474889039992\n",
      "   +0.0000 if cp>=-0.03739515468478202\n",
      "Run episode 832 with rewards 9.0\n",
      "============ 833 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +31.3152 if \n",
      "   +7.8963 if cp<=-0.007844104617834073\n",
      "  +10.5287 if cp>=-0.06365211308002472\n",
      "   +3.3642 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.05557144656777383\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08298952132463457\n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp>=-0.03899474889039992\n",
      "   +0.0000 if \n",
      "Run episode 833 with rewards 9.0\n",
      "============ 834 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -11.9625 if \n",
      "   -3.1006 if cp<=-0.007844104617834073\n",
      "   -3.9721 if cp>=-0.06365211308002472\n",
      "   -1.3856 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.05658329278230667\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08298952132463457\n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp>=-0.035334633290767664\n",
      "   +0.0000 if cp>=-0.035334633290767664\n",
      "Run episode 834 with rewards 10.0\n",
      "============ 835 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.1685 if \n",
      "   +2.9735 if cp<=-0.007844104617834073\n",
      "   +4.2133 if cp>=-0.06365211308002472\n",
      "   +1.2318 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.07927177250385285 & cp>=0.010544661059975625\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08298952132463457\n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp>=0.0386595655232668\n",
      "   +0.0000 if cp<=0.0386595655232668 & cp>=0.010544661059975625\n",
      "Run episode 835 with rewards 8.0\n",
      "============ 836 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -30.3487 if \n",
      "   -7.4283 if cp<=-0.007844104617834073\n",
      "  -10.5013 if cp>=-0.06365211308002472\n",
      "   -3.0888 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.031243145465850827\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08298952132463457\n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp>=0.0386595655232668\n",
      "   +0.0000 if cp>=0.012031991407275209\n",
      "Run episode 836 with rewards 10.0\n",
      "============ 837 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +30.3487 if \n",
      "   +7.4283 if cp<=-0.007844104617834073\n",
      "  +10.5013 if cp>=-0.06365211308002472\n",
      "   +3.0888 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.06504021733999253 & cp>=-0.0027588475961238135\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08298952132463457\n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp>=0.012031991407275209\n",
      "   +0.0000 if \n",
      "Run episode 837 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 838 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.3419 if \n",
      "   -3.1118 if cp<=-0.007844104617834073\n",
      "   -4.2831 if cp>=-0.06365211308002472\n",
      "   -1.3678 if cp<=0.018871868029236804\n",
      "   +0.8900 if cp<=0.043743963539600375\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08298952132463457\n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp>=0.029271246120333674\n",
      "   +0.0000 if cp>=0.029271246120333674\n",
      "Run episode 838 with rewards 9.0\n",
      "============ 839 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.3419 if \n",
      "   +3.1118 if cp<=-0.007844104617834073\n",
      "   +4.2831 if cp>=-0.06365211308002472\n",
      "   +1.3678 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.029095244780182848\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp>=0.029271246120333674\n",
      "   +0.0000 if cp<=-0.004026611719746131\n",
      "   +0.0000 if cp<=-0.02696772888302803\n",
      "Run episode 839 with rewards 10.0\n",
      "============ 840 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -31.1035 if \n",
      "   -7.8638 if cp<=-0.007844104617834073\n",
      "  -10.7817 if cp>=-0.06365211308002472\n",
      "   -3.4661 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.018053312599658963\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp>=0.029271246120333674\n",
      "   +0.0000 if cp<=-0.004026611719746131\n",
      "   +0.0000 if cp>=-0.003120913170278072\n",
      "Run episode 840 with rewards 9.0\n",
      "============ 841 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +31.1035 if \n",
      "   +7.8638 if cp<=-0.007844104617834073\n",
      "  +10.7817 if cp>=-0.06365211308002472\n",
      "   +3.4661 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.07082974985241891\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=-0.004026611719746131\n",
      "   +0.0000 if cp>=-0.003120913170278072\n",
      "   +0.0000 if \n",
      "Run episode 841 with rewards 10.0\n",
      "============ 842 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.6094 if \n",
      "   -3.1880 if cp<=-0.007844104617834073\n",
      "   -4.3709 if cp>=-0.06365211308002472\n",
      "   -1.4052 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.01965536680072546 & cp>=-0.061942049860954286\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=-0.004026611719746131\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   +0.0000 if cp<=0.027485036849975587 & cp>=-0.01965536680072546\n",
      "Run episode 842 with rewards 10.0\n",
      "origin 1.680019143080668e-05 new 1.680019148098387e-05 not updated\n",
      "============ 843 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.6094 if \n",
      "   +3.1880 if cp<=-0.007844104617834073\n",
      "   +4.3709 if cp>=-0.06365211308002472\n",
      "   +1.4052 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.09636596888303757\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=-0.004026611719746131\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   +0.0000 if cp<=0.027485036849975587 & cp>=-0.01965536680072546\n",
      "Run episode 843 with rewards 10.0\n",
      "origin 1.9436648766960552e-05 new 1.9436649619059505e-05 not updated\n",
      "============ 844 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -32.1591 if \n",
      "   -8.1434 if cp<=-0.007844104617834073\n",
      "  -11.1377 if cp>=-0.06365211308002472\n",
      "   -3.5982 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.04179136529564857 & cp>=-0.04357858896255493\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=-0.004026611719746131\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   +0.0000 if cp<=0.027485036849975587 & cp>=-0.01965536680072546\n",
      "Run episode 844 with rewards 9.0\n",
      "============ 845 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +32.1591 if \n",
      "   +8.1434 if cp<=-0.007844104617834073\n",
      "  +11.1377 if cp>=-0.06365211308002472\n",
      "   +3.5982 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.054966958612203604 & cp>=-0.006449220422655344\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=-0.004026611719746131\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   +0.0000 if \n",
      "Run episode 845 with rewards 10.0\n",
      "============ 846 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.3964 if \n",
      "   -3.1391 if cp<=-0.007844104617834073\n",
      "   -4.2933 if cp>=-0.06365211308002472\n",
      "   -1.3870 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.022432285919785494\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   -0.0000 if cp>=-0.022432285919785494\n",
      "   +0.0000 if cp>=-0.022432285919785494\n",
      "Run episode 846 with rewards 9.0\n",
      "============ 847 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.3964 if \n",
      "   +3.1391 if cp<=-0.007844104617834073\n",
      "   +4.2933 if cp>=-0.06365211308002472\n",
      "   +1.3870 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.03181433379650117\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp<=0.010144556313753134\n",
      "   -0.0000 if cp>=0.03181433379650117\n",
      "   +0.0000 if cp<=-0.0006014395505189781\n",
      "Run episode 847 with rewards 10.0\n",
      "============ 848 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -31.3304 if \n",
      "   -7.9546 if cp<=-0.007844104617834073\n",
      "  -10.8404 if cp>=-0.06365211308002472\n",
      "   -3.5305 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.06816862151026726\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   +0.0000 if cp>=0.03181433379650117\n",
      "   +0.0000 if cp>=-0.038985586166381835\n",
      "Run episode 848 with rewards 9.0\n",
      "============ 849 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +31.3304 if \n",
      "   +7.9546 if cp<=-0.007844104617834073\n",
      "  +10.8404 if cp>=-0.06365211308002472\n",
      "   +3.5305 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.033780273422598844\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   +0.0000 if cp>=-0.038985586166381835\n",
      "   +0.0000 if \n",
      "Run episode 849 with rewards 10.0\n",
      "============ 850 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.1808 if \n",
      "   -3.5470 if cp<=-0.007844104617834073\n",
      "   -3.6949 if cp>=-0.06365211308002472\n",
      "   -1.9129 if cp<=0.018871868029236804\n",
      "   +0.8098 if cp<=-0.11486057341098785\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   -0.0000 if cp>=-0.04874972328543663\n",
      "   +0.0000 if cp>=-0.04874972328543663\n",
      "Run episode 850 with rewards 11.0\n",
      "============ 851 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.6789 if \n",
      "   +3.5035 if cp<=-0.007844104617834073\n",
      "   +4.2971 if cp>=-0.06365211308002472\n",
      "   +1.2905 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.05711050331592562\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   -0.0000 if pa<=-0.03471370413899422\n",
      "   +0.0000 if cp>=0.10771291702985764\n",
      "Run episode 851 with rewards 9.0\n",
      "============ 852 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -32.4841 if \n",
      "   -8.9861 if cp<=-0.007844104617834073\n",
      "  -11.0046 if cp>=-0.06365211308002472\n",
      "   -3.3189 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.05630635321140289\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   +0.0000 if pa<=-0.03471370413899422\n",
      "   +0.0000 if cp>=-0.03353152126073836\n",
      "Run episode 852 with rewards 9.0\n",
      "============ 853 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +32.4841 if \n",
      "   +8.9861 if cp<=-0.007844104617834073\n",
      "  +11.0046 if cp>=-0.06365211308002472\n",
      "   +3.3189 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.06363578215241433\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   +0.0000 if cp>=-0.03353152126073836\n",
      "   +0.0000 if \n",
      "Run episode 853 with rewards 11.0\n",
      "============ 854 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.5725 if \n",
      "   -3.4780 if cp<=-0.007844104617834073\n",
      "   -4.2592 if cp>=-0.06365211308002472\n",
      "   -1.2845 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.024957062676548947\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   -0.0000 if pa<=-0.01900515891611576\n",
      "   +0.0000 if pa<=-0.01900515891611576\n",
      "Run episode 854 with rewards 10.0\n",
      "============ 855 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.5725 if \n",
      "   +3.4780 if cp<=-0.007844104617834073\n",
      "   +4.2592 if cp>=-0.06365211308002472\n",
      "   +1.2845 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.055107015371322635\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   -0.0000 if cp>=0.055107015371322635\n",
      "   +0.0000 if cp<=0.055107015371322635 & cp>=0.026702290773391726\n",
      "Run episode 855 with rewards 8.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 856 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -32.0505 if \n",
      "   -8.8716 if cp<=-0.007844104617834073\n",
      "  -10.8547 if cp>=-0.06365211308002472\n",
      "   -3.2787 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.02544559463858604\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   +0.0000 if cp>=0.055107015371322635\n",
      "   +0.0000 if cp>=-0.008350775949656955\n",
      "Run episode 856 with rewards 9.0\n",
      "============ 857 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +32.0505 if \n",
      "   +8.8716 if cp<=-0.007844104617834073\n",
      "  +10.8547 if cp>=-0.06365211308002472\n",
      "   +3.2787 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.08031138181686402 & cp>=0.014683867618441582\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   +0.0000 if cp>=-0.008350775949656955\n",
      "   +0.0000 if \n",
      "Run episode 857 with rewards 10.0\n",
      "============ 858 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.3870 if \n",
      "   -3.4287 if cp<=-0.007844104617834073\n",
      "   -4.1952 if cp>=-0.06365211308002472\n",
      "   -1.2672 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.006524560600519181\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   -0.0000 if cp>=-0.007344425097107883\n",
      "   +0.0000 if cp>=-0.007344425097107883\n",
      "Run episode 858 with rewards 9.0\n",
      "============ 859 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.3870 if \n",
      "   +3.4287 if cp<=-0.007844104617834073\n",
      "   +4.1952 if cp>=-0.06365211308002472\n",
      "   +1.2672 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.06349413990974427\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp<=0.010144556313753134\n",
      "   -0.0000 if cp>=0.04105981290340424\n",
      "   +0.0000 if cp>=0.09609248191118241\n",
      "Run episode 859 with rewards 10.0\n",
      "============ 860 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -31.3093 if \n",
      "   -8.6818 if cp<=-0.007844104617834073\n",
      "  -10.5910 if cp>=-0.06365211308002472\n",
      "   -3.2206 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.04029376059770584 & cp>=-0.04454377144575119\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp>=0.04105981290340424\n",
      "   +0.0000 if cp>=0.09609248191118241\n",
      "   +0.0000 if cp<=0.04029376059770584 & cp>=-0.04454377144575119\n",
      "Run episode 860 with rewards 10.0\n",
      "============ 861 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +31.3093 if \n",
      "   +8.6818 if cp<=-0.007844104617834073\n",
      "  +10.5910 if cp>=-0.06365211308002472\n",
      "   +3.2206 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.06090839505195618 & cp>=-0.008012095699086785\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp>=0.04105981290340424\n",
      "   +0.0000 if cp<=0.04029376059770584 & cp>=-0.04454377144575119\n",
      "   +0.0000 if \n",
      "Run episode 861 with rewards 10.0\n",
      "============ 862 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.4914 if \n",
      "   -3.4638 if cp<=-0.007844104617834073\n",
      "   -4.2255 if cp>=-0.06365211308002472\n",
      "   -1.2849 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.021816829405725 & cp>=-0.06086621880531311\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp>=0.04105981290340424\n",
      "   -0.0000 if cp>=-0.021816829405725\n",
      "   +0.0000 if cp<=0.018587428703904153 & cp>=-0.06086621880531311\n",
      "Run episode 862 with rewards 9.0\n",
      "============ 863 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.4914 if \n",
      "   +3.4638 if cp<=-0.007844104617834073\n",
      "   +4.2255 if cp>=-0.06365211308002472\n",
      "   +1.2849 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.08727837651968003 & cp>=0.0193185418844223\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp>=-0.021816829405725\n",
      "   +0.0000 if cp<=0.018587428703904153 & cp>=-0.06086621880531311\n",
      "   +0.0000 if cp>=0.12951698899269104\n",
      "Run episode 863 with rewards 10.0\n",
      "============ 864 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -31.7379 if \n",
      "   -8.8154 if cp<=-0.007844104617834073\n",
      "  -10.7272 if cp>=-0.06365211308002472\n",
      "   -3.2783 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.022329476475715634\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp>=-0.021816829405725\n",
      "   -0.0000 if cp<=0.018587428703904153 & cp>=-0.06086621880531311\n",
      "   +0.0000 if cp<=-0.0893417552113533\n",
      "Run episode 864 with rewards 10.0\n",
      "============ 865 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +31.7379 if \n",
      "   +8.8154 if cp<=-0.007844104617834073\n",
      "  +10.7272 if cp>=-0.06365211308002472\n",
      "   +3.2783 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.052839273959398275\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp>=-0.021816829405725\n",
      "   +0.0000 if cp<=0.018587428703904153 & cp>=-0.06086621880531311\n",
      "   +0.0000 if \n",
      "Run episode 865 with rewards 10.0\n",
      "============ 866 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.3746 if \n",
      "   -3.4371 if cp<=-0.007844104617834073\n",
      "   -4.1825 if cp>=-0.06365211308002472\n",
      "   -1.2782 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.013453060388565065\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp>=-0.021816829405725\n",
      "   +0.0000 if cp<=0.013453060388565065 & cp>=-0.07377390861511231\n",
      "   +0.0000 if cp>=-0.03222409076988697\n",
      "Run episode 866 with rewards 8.0\n",
      "============ 867 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.3746 if \n",
      "   +3.4371 if cp<=-0.007844104617834073\n",
      "   +4.1825 if cp>=-0.06365211308002472\n",
      "   +1.2782 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.05990598052740099\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp>=-0.021816829405725\n",
      "   -0.0000 if cp<=0.013453060388565065 & cp>=-0.07377390861511231\n",
      "   +0.0000 if cp<=0.044244690984487536\n",
      "Run episode 867 with rewards 10.0\n",
      "============ 868 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -31.2601 if \n",
      "   -8.6986 if cp<=-0.007844104617834073\n",
      "  -10.5520 if cp>=-0.06365211308002472\n",
      "   -3.2453 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.01770135313272476 & cp>=-0.05762326568365097\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.11532309353351594\n",
      "   -0.0000 if cp>=-0.021816829405725\n",
      "   -0.0000 if cp<=0.044244690984487536\n",
      "   +0.0000 if cp>=-0.01770135313272476\n",
      "Run episode 868 with rewards 9.0\n",
      "============ 869 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +31.2601 if \n",
      "   +8.6986 if cp<=-0.007844104617834073\n",
      "  +10.5520 if cp>=-0.06365211308002472\n",
      "   +3.2453 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.031866868957877166\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.11532309353351594\n",
      "   +0.0000 if cp>=-0.021816829405725\n",
      "   +0.0000 if cp<=0.044244690984487536\n",
      "   +0.0000 if \n",
      "Run episode 869 with rewards 11.0\n",
      "============ 870 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.4224 if \n",
      "   -3.6389 if cp<=-0.007844104617834073\n",
      "   -4.0877 if cp>=-0.06365211308002472\n",
      "   -1.4603 if cp<=0.018871868029236804\n",
      "   +0.9067 if cp>=-0.09248097240924835 & pa>=0.03139406442642215\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.021816829405725\n",
      "   -0.0000 if cp<=0.044244690984487536\n",
      "   -0.0000 if cp>=-0.09248097240924835\n",
      "   +0.0000 if cp>=-0.09248097240924835\n",
      "Run episode 870 with rewards 10.0\n",
      "============ 871 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.4224 if \n",
      "   +3.6389 if cp<=-0.007844104617834073\n",
      "   +4.0877 if cp>=-0.06365211308002472\n",
      "   +1.4603 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.07165829837322235\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.021816829405725\n",
      "   +0.0000 if cp<=0.044244690984487536\n",
      "   -0.0000 if cp>=-0.09248097240924835\n",
      "   -0.0000 if cp<=0.11060067117214203 & cp>=0.045230112969875336\n",
      "   +0.0000 if cp<=0.11060067117214203 & cp>=0.045230112969875336\n",
      "Run episode 871 with rewards 10.0\n",
      "============ 872 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -31.4872 if \n",
      "   -9.2325 if cp<=-0.007844104617834073\n",
      "  -10.3515 if cp>=-0.06365211308002472\n",
      "   -3.7107 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.045521567761898044\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.021816829405725\n",
      "   +0.0000 if cp<=0.044244690984487536\n",
      "   +0.0000 if cp>=-0.09248097240924835\n",
      "   +0.0000 if pa>=0.20345933735370636\n",
      "   +0.0000 if cp<=0.03001145273447037\n",
      "Run episode 872 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 873 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +31.4872 if \n",
      "   +9.2325 if cp<=-0.007844104617834073\n",
      "  +10.3515 if cp>=-0.06365211308002472\n",
      "   +3.7107 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.054576343297958387\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.021816829405725\n",
      "   +0.0000 if cp<=0.044244690984487536\n",
      "   +0.0000 if cp>=-0.09248097240924835\n",
      "   +0.0000 if pa>=0.20345933735370636\n",
      "   +0.0000 if \n",
      "Run episode 873 with rewards 9.0\n",
      "============ 874 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -11.8432 if \n",
      "   -3.5025 if cp<=-0.007844104617834073\n",
      "   -3.8636 if cp>=-0.06365211308002472\n",
      "   -1.4331 if cp<=0.018871868029236804\n",
      "   +1.0050 if cp>=-0.07724856436252593\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.021816829405725\n",
      "   +0.0000 if cp<=0.044244690984487536\n",
      "   +0.0000 if pa>=0.20345933735370636\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07724856436252593\n",
      "Run episode 874 with rewards 10.0\n",
      "============ 875 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.0659 if \n",
      "   +3.2842 if cp<=-0.007844104617834073\n",
      "   +4.1317 if cp>=-0.06365211308002472\n",
      "   +1.3320 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.04716888964176179\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.021816829405725\n",
      "   -0.0000 if cp<=0.044244690984487536\n",
      "   +0.0000 if pa>=0.20345933735370636\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "Run episode 875 with rewards 10.0\n",
      "============ 876 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -30.0698 if \n",
      "   -8.2116 if cp<=-0.007844104617834073\n",
      "  -10.2833 if cp>=-0.06365211308002472\n",
      "   -3.3523 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.06683558598160744\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.021816829405725\n",
      "   +0.0000 if cp<=0.044244690984487536\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp>=-0.0395617738366127\n",
      "Run episode 876 with rewards 10.0\n",
      "============ 877 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +30.0698 if \n",
      "   +8.2116 if cp<=-0.007844104617834073\n",
      "  +10.2833 if cp>=-0.06365211308002472\n",
      "   +3.3523 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.0535181149840355\n",
      "--------------\n",
      "   +0.0000 if cp<=0.044244690984487536\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp>=-0.0395617738366127\n",
      "   +0.0000 if \n",
      "Run episode 877 with rewards 9.0\n",
      "============ 878 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.0487 if \n",
      "   -3.2903 if cp<=-0.007844104617834073\n",
      "   -4.1204 if cp>=-0.06365211308002472\n",
      "   -1.3432 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.038479880616068836\n",
      "--------------\n",
      "   -0.0000 if cp<=0.044244690984487536\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   -0.0000 if cp<=0.023070933297276497\n",
      "   +0.0000 if cp<=0.023070933297276497 & cp>=-0.038479880616068836\n",
      "Run episode 878 with rewards 10.0\n",
      "============ 879 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.0704 if \n",
      "   +3.2680 if cp<=-0.007844104617834073\n",
      "   +4.1468 if cp>=-0.06365211308002472\n",
      "   +1.3327 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.04526719003915787\n",
      "--------------\n",
      "   -0.0000 if cp<=0.044244690984487536\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.006193083385005601\n",
      "   -0.0000 if cp<=0.023070933297276497\n",
      "   +0.0000 if cp>=0.09940937161445618\n",
      "Run episode 879 with rewards 10.0\n",
      "============ 880 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -30.0756 if \n",
      "   -8.1692 if cp<=-0.007844104617834073\n",
      "  -10.3163 if cp>=-0.06365211308002472\n",
      "   -3.3423 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.0071169216185808185\n",
      "--------------\n",
      "   +0.0000 if cp<=0.044244690984487536\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=0.023070933297276497\n",
      "   +0.0000 if cp<=-0.009238574653863903\n",
      "Run episode 880 with rewards 10.0\n",
      "============ 881 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +30.0756 if \n",
      "   +8.1692 if cp<=-0.007844104617834073\n",
      "  +10.3163 if cp>=-0.06365211308002472\n",
      "   +3.3423 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.08718895614147187\n",
      "--------------\n",
      "   +0.0000 if cp<=0.044244690984487536\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=0.023070933297276497\n",
      "   +0.0000 if \n",
      "Run episode 881 with rewards 9.0\n",
      "============ 882 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -11.8949 if \n",
      "   -3.4349 if cp<=-0.007844104617834073\n",
      "   -3.9115 if cp>=-0.06365211308002472\n",
      "   -1.5708 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.07289128452539444\n",
      "--------------\n",
      "   +0.0000 if cp<=0.044244690984487536\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   -0.0000 if cp>=-0.04964668303728103\n",
      "   +0.0000 if cp>=-0.04964668303728103\n",
      "Run episode 882 with rewards 8.0\n",
      "============ 883 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +11.8949 if \n",
      "   +3.4349 if cp<=-0.007844104617834073\n",
      "   +3.9115 if cp>=-0.06365211308002472\n",
      "   +1.5708 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.044509466737508774\n",
      "--------------\n",
      "   -0.0000 if cp<=0.044244690984487536\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   +0.0000 if cp>=-0.013897020742297154\n",
      "Run episode 883 with rewards 9.0\n",
      "============ 884 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -29.4046 if \n",
      "   -8.5085 if cp<=-0.007844104617834073\n",
      "   -9.6588 if cp>=-0.06365211308002472\n",
      "   -3.8958 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.02651368379592895\n",
      "--------------\n",
      "   +0.0000 if cp<=0.044244690984487536\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   +0.0000 if cp<=-0.05872032418847084\n",
      "Run episode 884 with rewards 9.0\n",
      "============ 885 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +29.4046 if \n",
      "   +8.5085 if cp<=-0.007844104617834073\n",
      "   +9.6588 if cp>=-0.06365211308002472\n",
      "   +3.8958 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.048156847059726726\n",
      "--------------\n",
      "   +0.0000 if cp<=0.044244690984487536\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   +0.0000 if \n",
      "Run episode 885 with rewards 8.0\n",
      "============ 886 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -11.4996 if \n",
      "   -3.3275 if cp<=-0.007844104617834073\n",
      "   -3.7774 if cp>=-0.06365211308002472\n",
      "   -1.5236 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.03533356711268425\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   -0.0000 if cp>=-0.010912146046757696\n",
      "   +0.0000 if cp>=-0.010912146046757696\n",
      "Run episode 886 with rewards 8.0\n",
      "============ 887 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +11.4996 if \n",
      "   +3.3275 if cp<=-0.007844104617834073\n",
      "   +3.7774 if cp>=-0.06365211308002472\n",
      "   +1.5236 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.03527643531560898\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   -0.0000 if cp>=0.03527643531560898\n",
      "   +0.0000 if cp>=-0.03280955478549003\n",
      "Run episode 887 with rewards 10.0\n",
      "============ 888 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -27.7959 if \n",
      "   -8.0715 if cp<=-0.007844104617834073\n",
      "   -9.1002 if cp>=-0.06365211308002472\n",
      "   -3.7126 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.045364754647016524\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   -0.0000 if cp>=0.03527643531560898\n",
      "   +0.0000 if pa>=0.1821891814470291\n",
      "Run episode 888 with rewards 8.0\n",
      "============ 889 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +27.7959 if \n",
      "   +8.0715 if cp<=-0.007844104617834073\n",
      "   +9.1002 if cp>=-0.06365211308002472\n",
      "   +3.7126 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.05884985327720644\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   -0.0000 if cp>=0.03527643531560898\n",
      "   +0.0000 if pa>=-0.04762880876660347\n",
      "Run episode 889 with rewards 9.0\n",
      "============ 890 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -11.4216 if \n",
      "   -3.3167 if cp<=-0.007844104617834073\n",
      "   -3.7394 if cp>=-0.06365211308002472\n",
      "   -1.5256 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.024214738234877582\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   +0.0000 if pa>=-0.04762880876660347\n",
      "   +0.0000 if cp<=-0.05784672126173973\n",
      "Run episode 890 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 891 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +11.9385 if \n",
      "   +2.7874 if cp<=-0.007844104617834073\n",
      "   +4.3620 if cp>=-0.06365211308002472\n",
      "   +1.2705 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.040215995162725456\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   -0.0000 if pa>=-0.04762880876660347\n",
      "   +0.0000 if cp>=0.0928429588675499\n",
      "Run episode 891 with rewards 10.0\n",
      "============ 892 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -29.5351 if \n",
      "   -6.9385 if cp<=-0.007844104617834073\n",
      "  -10.7673 if cp>=-0.06365211308002472\n",
      "   -3.1822 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.011952420137822628\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   +0.0000 if pa>=-0.04762880876660347\n",
      "   +0.0000 if cp>=-0.07448589205741882\n",
      "Run episode 892 with rewards 9.0\n",
      "============ 893 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +29.5351 if \n",
      "   +6.9385 if cp<=-0.007844104617834073\n",
      "  +10.7673 if cp>=-0.06365211308002472\n",
      "   +3.1822 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.08689833283424378 & cp>=0.0210124135017395\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   +0.0000 if pa>=-0.04762880876660347\n",
      "   +0.0000 if \n",
      "Run episode 893 with rewards 9.0\n",
      "============ 894 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.5882 if \n",
      "   -4.3867 if cp<=-0.007844104617834073\n",
      "   -3.1773 if cp>=-0.06365211308002472\n",
      "   -3.0233 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.07947189509868621\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   -0.0000 if cp>=-0.05844503641128539\n",
      "   +0.0000 if cp>=-0.05844503641128539\n",
      "Run episode 894 with rewards 9.0\n",
      "============ 895 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.7077 if \n",
      "   +4.3206 if cp<=-0.007844104617834073\n",
      "   +3.3242 if cp>=-0.06365211308002472\n",
      "   +2.9908 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.028867892920970924\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   -0.0000 if cp>=0.07144530862569809\n",
      "   +0.0000 if cp>=0.028867892920970924\n",
      "Run episode 895 with rewards 10.0\n",
      "============ 896 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -32.8534 if \n",
      "  -11.1767 if cp<=-0.007844104617834073\n",
      "   -8.5826 if cp>=-0.06365211308002472\n",
      "   -7.7374 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.018520988337695596 & cp>=-0.06048669070005417\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   +0.0000 if cp>=0.07144530862569809\n",
      "   +0.0000 if cp>=0.03235502913594246\n",
      "Run episode 896 with rewards 10.0\n",
      "============ 897 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +33.0634 if \n",
      "  +10.4631 if cp<=-0.007844104617834073\n",
      "   +9.1760 if cp>=-0.06365211308002472\n",
      "   +7.0460 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.07443853616714478 & cp>=0.005084633640944958\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   +0.0000 if cp>=0.03235502913594246\n",
      "   +0.0000 if \n",
      "Run episode 897 with rewards 9.0\n",
      "============ 898 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -13.1066 if \n",
      "   -4.1477 if cp<=-0.007844104617834073\n",
      "   -3.6374 if cp>=-0.06365211308002472\n",
      "   -2.7931 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.048518646508455276\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   -0.0000 if cp>=0.021704864501953126\n",
      "   +0.0000 if cp>=0.025574125349521637\n",
      "Run episode 898 with rewards 10.0\n",
      "============ 899 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +13.1066 if \n",
      "   +4.1477 if cp<=-0.007844104617834073\n",
      "   +3.6374 if cp>=-0.06365211308002472\n",
      "   +2.7931 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.06437182649970055\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp<=-0.013897020742297154\n",
      "   -0.0000 if cp>=0.021704864501953126\n",
      "   +0.0000 if cp>=0.06437182649970055\n",
      "Run episode 899 with rewards 8.0\n",
      "============ 900 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -34.3363 if \n",
      "  -10.8667 if cp<=-0.007844104617834073\n",
      "   -9.5279 if cp>=-0.06365211308002472\n",
      "   -7.3188 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.037818641215562825\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   -0.0000 if cp>=0.021704864501953126\n",
      "   +0.0000 if cp>=0.06437182649970055\n",
      "   +0.0000 if cp>=0.037818641215562825\n",
      "Run episode 900 with rewards 8.0\n",
      "============ 901 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +34.3363 if \n",
      "  +10.8667 if cp<=-0.007844104617834073\n",
      "   +9.5279 if cp>=-0.06365211308002472\n",
      "   +7.3188 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.060434624552726746\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   +0.0000 if cp>=0.021704864501953126\n",
      "   +0.0000 if cp>=0.037818641215562825\n",
      "   +0.0000 if \n",
      "Run episode 901 with rewards 9.0\n",
      "============ 902 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -13.4804 if \n",
      "   -4.2662 if cp<=-0.007844104617834073\n",
      "   -3.7406 if cp>=-0.06365211308002472\n",
      "   -2.8733 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.04472667276859283\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.006193083385005601\n",
      "   -0.0000 if cp>=0.021704864501953126\n",
      "   -0.0000 if cp>=0.02339334413409233\n",
      "   +0.0000 if cp>=0.009298915229737767\n",
      "Run episode 902 with rewards 10.0\n",
      "============ 903 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +13.4804 if \n",
      "   +4.2662 if cp<=-0.007844104617834073\n",
      "   +3.7406 if cp>=-0.06365211308002472\n",
      "   +2.8733 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.08735194504261018\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.006193083385005601\n",
      "   -0.0000 if cp>=0.021704864501953126\n",
      "   -0.0000 if cp>=0.02339334413409233\n",
      "   +0.0000 if cp<=0.058588118851184846\n",
      "Run episode 903 with rewards 10.0\n",
      "============ 904 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -35.8283 if \n",
      "  -11.3411 if cp<=-0.007844104617834073\n",
      "   -9.9376 if cp>=-0.06365211308002472\n",
      "   -7.6387 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.04207111001014709\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=0.021704864501953126\n",
      "   -0.0000 if cp>=0.02339334413409233\n",
      "   -0.0000 if cp<=0.058588118851184846\n",
      "   +0.0000 if cp<=-0.003206051979213952\n",
      "Run episode 904 with rewards 10.0\n",
      "============ 905 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +35.8283 if \n",
      "  +11.3411 if cp<=-0.007844104617834073\n",
      "   +9.9376 if cp>=-0.06365211308002472\n",
      "   +7.6387 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.0480948880314827\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.021704864501953126\n",
      "   +0.0000 if cp>=0.02339334413409233\n",
      "   +0.0000 if cp<=0.058588118851184846\n",
      "   +0.0000 if \n",
      "Run episode 905 with rewards 10.0\n",
      "============ 906 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -13.1397 if \n",
      "   -4.1593 if cp<=-0.007844104617834073\n",
      "   -3.6445 if cp>=-0.06365211308002472\n",
      "   -2.8014 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.05795295089483261\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.021704864501953126\n",
      "   +0.0000 if cp>=0.02339334413409233\n",
      "   +0.0000 if cp<=-0.05795295089483261\n",
      "   +0.0000 if cp<=-0.09963246732950211\n",
      "Run episode 906 with rewards 9.0\n",
      "============ 907 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +13.1397 if \n",
      "   +4.1593 if cp<=-0.007844104617834073\n",
      "   +3.6445 if cp>=-0.06365211308002472\n",
      "   +2.8014 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.053167420625686655\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=0.02339334413409233\n",
      "   +0.0000 if cp<=-0.05795295089483261\n",
      "   +0.0000 if cp<=-0.09963246732950211\n",
      "   +0.0000 if cp>=0.053167420625686655\n",
      "Run episode 907 with rewards 10.0\n",
      "============ 908 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -34.4737 if \n",
      "  -10.9142 if cp<=-0.007844104617834073\n",
      "   -9.5611 if cp>=-0.06365211308002472\n",
      "   -7.3521 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.09432614892721176\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp>=0.02339334413409233\n",
      "   +0.0000 if cp<=-0.05795295089483261\n",
      "   -0.0000 if cp>=0.053167420625686655\n",
      "   +0.0000 if cp<=-0.09432614892721176\n",
      "Run episode 908 with rewards 9.0\n",
      "============ 909 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +34.4737 if \n",
      "  +10.9142 if cp<=-0.007844104617834073\n",
      "   +9.5611 if cp>=-0.06365211308002472\n",
      "   +7.3521 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.033116500452160844\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.02339334413409233\n",
      "   +0.0000 if cp<=-0.05795295089483261\n",
      "   +0.0000 if cp<=-0.09432614892721176\n",
      "   +0.0000 if \n",
      "Run episode 909 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 910 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.7947 if \n",
      "   -4.0507 if cp<=-0.007844104617834073\n",
      "   -3.5485 if cp>=-0.06365211308002472\n",
      "   -2.7287 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.12436785101890564\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.05795295089483261\n",
      "   +0.0000 if cp<=-0.09432614892721176\n",
      "   +0.0000 if cp<=-0.12436785101890564\n",
      "   +0.0000 if pa>=0.20219653844833374\n",
      "Run episode 910 with rewards 9.0\n",
      "============ 911 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.7947 if \n",
      "   +4.0507 if cp<=-0.007844104617834073\n",
      "   +3.5485 if cp>=-0.06365211308002472\n",
      "   +2.7287 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.06497218906879426\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=-0.05795295089483261\n",
      "   +0.0000 if cp<=-0.09432614892721176\n",
      "   +0.0000 if cp<=-0.12436785101890564\n",
      "   +0.0000 if cp>=0.03184430338442327\n",
      "Run episode 911 with rewards 10.0\n",
      "============ 912 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -33.0955 if \n",
      "  -10.4809 if cp<=-0.007844104617834073\n",
      "   -9.1774 if cp>=-0.06365211308002472\n",
      "   -7.0616 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.0976430669426918\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.05795295089483261\n",
      "   +0.0000 if cp<=-0.09432614892721176\n",
      "   -0.0000 if cp>=0.03184430338442327\n",
      "   +0.0000 if cp<=-0.13985447883605956\n",
      "Run episode 912 with rewards 9.0\n",
      "============ 913 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +33.0955 if \n",
      "  +10.4809 if cp<=-0.007844104617834073\n",
      "   +9.1774 if cp>=-0.06365211308002472\n",
      "   +7.0616 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.060430581867694864\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.05795295089483261\n",
      "   +0.0000 if cp<=-0.09432614892721176\n",
      "   +0.0000 if cp<=-0.13985447883605956\n",
      "   +0.0000 if \n",
      "Run episode 913 with rewards 10.0\n",
      "============ 914 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.3590 if \n",
      "   -3.9139 if cp<=-0.007844104617834073\n",
      "   -3.4272 if cp>=-0.06365211308002472\n",
      "   -2.6371 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.09277320057153701\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.05795295089483261\n",
      "   +0.0000 if cp<=-0.09432614892721176\n",
      "   +0.0000 if cp<=-0.1328412801027298\n",
      "   +0.0000 if pa>=0.20882852375507355\n",
      "Run episode 914 with rewards 9.0\n",
      "============ 915 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.5372 if \n",
      "   +3.8416 if cp<=-0.007844104617834073\n",
      "   +3.6482 if cp>=-0.06365211308002472\n",
      "   +2.5298 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.0629610188305378 & cp>=-0.004832299333065748\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=-0.05795295089483261\n",
      "   +0.0000 if cp<=-0.09432614892721176\n",
      "   +0.0000 if cp<=-0.1328412801027298\n",
      "   +0.0000 if cp>=0.03017826043069364\n",
      "Run episode 915 with rewards 9.0\n",
      "============ 916 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -32.0293 if \n",
      "   -9.8170 if cp<=-0.007844104617834073\n",
      "   -9.3152 if cp>=-0.06365211308002472\n",
      "   -6.4659 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.04653942584991455\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=-0.05795295089483261\n",
      "   +0.0000 if cp<=-0.09432614892721176\n",
      "   -0.0000 if cp>=0.03017826043069364\n",
      "   +0.0000 if cp>=0.04653942584991455\n",
      "Run episode 916 with rewards 11.0\n",
      "============ 917 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +32.0293 if \n",
      "   +9.8170 if cp<=-0.007844104617834073\n",
      "   +9.3152 if cp>=-0.06365211308002472\n",
      "   +6.4659 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.08141374588012697\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.05795295089483261\n",
      "   +0.0000 if cp>=0.03017826043069364\n",
      "   +0.0000 if cp>=0.04653942584991455\n",
      "   +0.0000 if \n",
      "Run episode 917 with rewards 10.0\n",
      "============ 918 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.8091 if \n",
      "   -3.9260 if cp<=-0.007844104617834073\n",
      "   -3.7253 if cp>=-0.06365211308002472\n",
      "   -2.5858 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.022218520939350127 & cp>=-0.06262964457273483\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=-0.05795295089483261\n",
      "   +0.0000 if cp>=0.03017826043069364\n",
      "   -0.0000 if cp>=0.02107667587697506\n",
      "   +0.0000 if cp>=0.0056827554712072055\n",
      "Run episode 918 with rewards 8.0\n",
      "============ 919 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.8091 if \n",
      "   +3.9260 if cp<=-0.007844104617834073\n",
      "   +3.7253 if cp>=-0.06365211308002472\n",
      "   +2.5858 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.059964063763618486\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=-0.05795295089483261\n",
      "   -0.0000 if cp>=0.02107667587697506\n",
      "   -0.0000 if cp>=0.0056827554712072055\n",
      "   +0.0000 if cp<=0.04269106835126877\n",
      "Run episode 919 with rewards 9.0\n",
      "============ 920 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -33.1253 if \n",
      "  -10.1555 if cp<=-0.007844104617834073\n",
      "   -9.6322 if cp>=-0.06365211308002472\n",
      "   -6.6883 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.01593649648129939\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp>=0.02107667587697506\n",
      "   +0.0000 if cp>=0.0056827554712072055\n",
      "   -0.0000 if cp<=0.04269106835126877\n",
      "   +0.0000 if cp>=-0.07108369767665863\n",
      "Run episode 920 with rewards 9.0\n",
      "============ 921 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +33.1253 if \n",
      "  +10.1555 if cp<=-0.007844104617834073\n",
      "   +9.6322 if cp>=-0.06365211308002472\n",
      "   +6.6883 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.05845813676714898\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.0056827554712072055\n",
      "   +0.0000 if cp<=0.04269106835126877\n",
      "   +0.0000 if cp>=-0.07108369767665863\n",
      "   +0.0000 if \n",
      "Run episode 921 with rewards 10.0\n",
      "============ 922 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.8222 if \n",
      "   -3.9310 if cp<=-0.007844104617834073\n",
      "   -3.7284 if cp>=-0.06365211308002472\n",
      "   -2.5889 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.015076962485909458\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.04269106835126877\n",
      "   -0.0000 if cp>=-0.07108369767665863\n",
      "   -0.0000 if cp>=-0.04250875264406204\n",
      "   +0.0000 if cp<=-0.00018802342237904607 & cp>=-0.08243978023529053\n",
      "Run episode 922 with rewards 9.0\n",
      "============ 923 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.8222 if \n",
      "   +3.9310 if cp<=-0.007844104617834073\n",
      "   +3.7284 if cp>=-0.06365211308002472\n",
      "   +2.5889 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.07723063826560975\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.04269106835126877\n",
      "   -0.0000 if cp>=-0.07108369767665863\n",
      "   -0.0000 if cp>=-0.04250875264406204\n",
      "   +0.0000 if cp<=0.07723063826560975 & cp>=0.04100960567593574\n",
      "Run episode 923 with rewards 9.0\n",
      "============ 924 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -33.1778 if \n",
      "  -10.1740 if cp<=-0.007844104617834073\n",
      "   -9.6457 if cp>=-0.06365211308002472\n",
      "   -6.7000 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.025777495652437206\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.04269106835126877\n",
      "   -0.0000 if cp>=-0.07108369767665863\n",
      "   -0.0000 if cp>=-0.04250875264406204\n",
      "   +0.0000 if cp>=-0.025777495652437206\n",
      "Run episode 924 with rewards 9.0\n",
      "============ 925 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +33.1778 if \n",
      "  +10.1740 if cp<=-0.007844104617834073\n",
      "   +9.6457 if cp>=-0.06365211308002472\n",
      "   +6.7000 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.0526203103363514\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.04269106835126877\n",
      "   +0.0000 if cp>=-0.07108369767665863\n",
      "   +0.0000 if cp>=-0.04250875264406204\n",
      "   +0.0000 if \n",
      "Run episode 925 with rewards 9.0\n",
      "============ 926 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.4549 if \n",
      "   -3.8193 if cp<=-0.007844104617834073\n",
      "   -3.6210 if cp>=-0.06365211308002472\n",
      "   -2.5152 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.04657338410615921\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07108369767665863\n",
      "   -0.0000 if cp>=-0.04250875264406204\n",
      "   +0.0000 if pa>=0.16620685160160065\n",
      "   +0.0000 if \n",
      "Run episode 926 with rewards 10.0\n",
      "============ 927 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.4549 if \n",
      "   +3.8193 if cp<=-0.007844104617834073\n",
      "   +3.6210 if cp>=-0.06365211308002472\n",
      "   +2.5152 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.08001774400472642\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.07108369767665863\n",
      "   +0.0000 if pa>=0.16620685160160065\n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "Run episode 927 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 928 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -31.7099 if \n",
      "   -9.7281 if cp<=-0.007844104617834073\n",
      "   -9.2160 if cp>=-0.06365211308002472\n",
      "   -6.4056 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.030962222069501874\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp>=-0.07108369767665863\n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=-0.030962222069501874\n",
      "   +0.0000 if pa>=0.19873405992984772\n",
      "Run episode 928 with rewards 9.0\n",
      "============ 929 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +31.7099 if \n",
      "   +9.7281 if cp<=-0.007844104617834073\n",
      "   +9.2160 if cp>=-0.06365211308002472\n",
      "   +6.4056 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.055129723995924\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07108369767665863\n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=-0.030962222069501874\n",
      "   +0.0000 if \n",
      "Run episode 929 with rewards 9.0\n",
      "============ 930 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.6075 if \n",
      "   -3.8678 if cp<=-0.007844104617834073\n",
      "   -3.6642 if cp>=-0.06365211308002472\n",
      "   -2.5468 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.04582613185048103\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=-0.030962222069501874\n",
      "   -0.0000 if cp<=0.020567022264003754 & cp>=-0.04582613185048103\n",
      "   +0.0000 if cp<=0.020567022264003754 & cp>=-0.04582613185048103\n",
      "Run episode 930 with rewards 9.0\n",
      "============ 931 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.6075 if \n",
      "   +3.8678 if cp<=-0.007844104617834073\n",
      "   +3.6642 if cp>=-0.06365211308002472\n",
      "   +2.5468 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.07508906573057175 & cp>=0.013368179835379124\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.020567022264003754 & cp>=-0.04582613185048103\n",
      "   -0.0000 if cp>=0.04425664842128755\n",
      "   +0.0000 if cp>=0.11532055586576462\n",
      "Run episode 931 with rewards 9.0\n",
      "============ 932 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -32.3238 if \n",
      "   -9.9203 if cp<=-0.007844104617834073\n",
      "   -9.3927 if cp>=-0.06365211308002472\n",
      "   -6.5340 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.06419230103492736\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   -0.0000 if cp<=0.020567022264003754 & cp>=-0.04582613185048103\n",
      "   -0.0000 if cp>=0.04425664842128755\n",
      "   +0.0000 if cp<=-0.04172124564647674 & cp>=-0.09684581458568572\n",
      "Run episode 932 with rewards 9.0\n",
      "============ 933 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +32.3238 if \n",
      "   +9.9203 if cp<=-0.007844104617834073\n",
      "   +9.3927 if cp>=-0.06365211308002472\n",
      "   +6.5340 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=0.06372909992933273\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.020567022264003754 & cp>=-0.04582613185048103\n",
      "   +0.0000 if cp<=-0.04172124564647674 & cp>=-0.09684581458568572\n",
      "   +0.0000 if \n",
      "Run episode 933 with rewards 9.0\n",
      "============ 934 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.8712 if \n",
      "   -3.9502 if cp<=-0.007844104617834073\n",
      "   -3.7401 if cp>=-0.06365211308002472\n",
      "   -2.6018 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.03643625304102898\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.020567022264003754 & cp>=-0.04582613185048103\n",
      "   -0.0000 if cp<=0.03643625304102898\n",
      "   +0.0000 if cp<=0.03643625304102898\n",
      "Run episode 934 with rewards 8.0\n",
      "============ 935 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.8712 if \n",
      "   +3.9502 if cp<=-0.007844104617834073\n",
      "   +3.7401 if cp>=-0.06365211308002472\n",
      "   +2.6018 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.054976943135261545\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08001774400472642\n",
      "   -0.0000 if cp<=0.03643625304102898\n",
      "   -0.0000 if cp>=0.013008466921746733\n",
      "   +0.0000 if cp>=0.054976943135261545\n",
      "Run episode 935 with rewards 9.0\n",
      "============ 936 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -33.3771 if \n",
      "  -10.2458 if cp<=-0.007844104617834073\n",
      "   -9.6978 if cp>=-0.06365211308002472\n",
      "   -6.7496 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.05802365019917488\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.03643625304102898\n",
      "   +0.0000 if cp>=0.013008466921746733\n",
      "   +0.0000 if cp>=-0.03733519986271858\n",
      "Run episode 936 with rewards 9.0\n",
      "============ 937 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +33.3771 if \n",
      "  +10.2458 if cp<=-0.007844104617834073\n",
      "   +9.6978 if cp>=-0.06365211308002472\n",
      "   +6.7496 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.06473728716373445 & cp>=-0.004925079178065062\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.03643625304102898\n",
      "   +0.0000 if cp>=-0.03733519986271858\n",
      "   +0.0000 if \n",
      "Run episode 937 with rewards 10.0\n",
      "============ 938 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -13.2098 if \n",
      "   -4.0551 if cp<=-0.007844104617834073\n",
      "   -3.8381 if cp>=-0.06365211308002472\n",
      "   -2.6713 if cp<=0.018871868029236804\n",
      "   +1.0000 if pa>=0.19825440645217896\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08001774400472642\n",
      "   -0.0000 if cp<=0.03643625304102898\n",
      "   +0.0000 if cp<=-0.02995460145175457\n",
      "   +0.0000 if cp<=-0.02995460145175457\n",
      "Run episode 938 with rewards 10.0\n",
      "============ 939 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +13.2098 if \n",
      "   +4.0551 if cp<=-0.007844104617834073\n",
      "   +3.8381 if cp>=-0.06365211308002472\n",
      "   +2.6713 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.0760209545493126\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.03643625304102898\n",
      "   -0.0000 if cp>=0.11606828272342683\n",
      "   +0.0000 if cp>=0.048493819683790206\n",
      "Run episode 939 with rewards 8.0\n",
      "============ 940 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -34.7309 if \n",
      "  -10.6629 if cp<=-0.007844104617834073\n",
      "  -10.0905 if cp>=-0.06365211308002472\n",
      "   -7.0251 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.06988407224416732\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.03643625304102898\n",
      "   +0.0000 if cp>=0.11606828272342683\n",
      "   +0.0000 if cp>=-0.052695459872484196\n",
      "Run episode 940 with rewards 8.0\n",
      "============ 941 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +34.7309 if \n",
      "  +10.6629 if cp<=-0.007844104617834073\n",
      "  +10.0905 if cp>=-0.06365211308002472\n",
      "   +7.0251 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.0563151925802231\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.03643625304102898\n",
      "   +0.0000 if cp>=-0.052695459872484196\n",
      "   +0.0000 if \n",
      "Run episode 941 with rewards 8.0\n",
      "============ 942 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -13.2362 if \n",
      "   -4.0637 if cp<=-0.007844104617834073\n",
      "   -3.8455 if cp>=-0.06365211308002472\n",
      "   -2.6773 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.04166023135185242\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.03643625304102898\n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp>=0.04414936900138855\n",
      "Run episode 942 with rewards 10.0\n",
      "============ 943 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +13.2362 if \n",
      "   +4.0637 if cp<=-0.007844104617834073\n",
      "   +3.8455 if cp>=-0.06365211308002472\n",
      "   +2.6773 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.08313329219818116\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.03643625304102898\n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp>=0.125252303481102\n",
      "Run episode 943 with rewards 8.0\n",
      "============ 944 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -34.8363 if \n",
      "  -10.6965 if cp<=-0.007844104617834073\n",
      "  -10.1206 if cp>=-0.06365211308002472\n",
      "   -7.0478 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.05960089415311813\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.03643625304102898\n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp>=-0.03480657041072845\n",
      "Run episode 944 with rewards 10.0\n",
      "============ 945 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +35.0904 if \n",
      "   +4.8170 if cp<=-0.007844104617834073\n",
      "  +13.3682 if cp>=-0.06365211308002472\n",
      "   +2.2426 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.049166141450405126\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.03643625304102898\n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if \n",
      "Run episode 945 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 946 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -13.7279 if \n",
      "   -3.5730 if cp<=-0.007844104617834073\n",
      "   -3.9580 if cp>=-0.06365211308002472\n",
      "   -2.7094 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.06948567777872085\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   -0.0000 if cp>=-0.04612636715173721\n",
      "   +0.0000 if cp>=-0.04612636715173721\n",
      "Run episode 946 with rewards 10.0\n",
      "============ 947 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +13.7279 if \n",
      "   +3.5730 if cp<=-0.007844104617834073\n",
      "   +3.9580 if cp>=-0.06365211308002472\n",
      "   +2.7094 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.06503322273492813 & cp>=-0.015388242900371552\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08001774400472642\n",
      "   -0.0000 if cp<=0.04166023135185242\n",
      "   -0.0000 if cp>=0.025700289756059654\n",
      "   +0.0000 if cp>=0.1168861836194992\n",
      "Run episode 947 with rewards 10.0\n",
      "============ 948 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -36.5785 if \n",
      "   -9.5222 if cp<=-0.007844104617834073\n",
      "  -10.5456 if cp>=-0.06365211308002472\n",
      "   -7.2213 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.09362749606370926\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp>=0.025700289756059654\n",
      "   +0.0000 if cp>=-0.06601971983909606\n",
      "Run episode 948 with rewards 8.0\n",
      "============ 949 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +36.5785 if \n",
      "   +9.5222 if cp<=-0.007844104617834073\n",
      "  +10.5456 if cp>=-0.06365211308002472\n",
      "   +7.2213 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.06839275807142259\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp>=-0.06601971983909606\n",
      "   +0.0000 if \n",
      "Run episode 949 with rewards 10.0\n",
      "============ 950 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -14.0035 if \n",
      "   -3.6454 if cp<=-0.007844104617834073\n",
      "   -4.0372 if cp>=-0.06365211308002472\n",
      "   -2.7646 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.017651173286139965 & cp>=-0.05784688889980316\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08001774400472642\n",
      "   -0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp<=-0.017651173286139965\n",
      "   +0.0000 if cp<=-0.017651173286139965\n",
      "Run episode 950 with rewards 10.0\n",
      "============ 951 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +14.0035 if \n",
      "   +3.6454 if cp<=-0.007844104617834073\n",
      "   +4.0372 if cp>=-0.06365211308002472\n",
      "   +2.7646 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.08033135682344437\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   -0.0000 if cp>=0.12233123779296876\n",
      "   +0.0000 if cp>=0.050828713178634646\n",
      "Run episode 951 with rewards 8.0\n",
      "============ 952 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.6758 if \n",
      "   -3.2999 if cp<=-0.007844104617834073\n",
      "   -3.6542 if cp>=-0.06365211308002472\n",
      "   -2.5027 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.03590061292052269\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08001774400472642\n",
      "   -0.0000 if cp<=0.04166023135185242\n",
      "   -0.0000 if cp>=0.12233123779296876\n",
      "   +0.0000 if cp<=0.009867694973945622\n",
      "Run episode 952 with rewards 9.0\n",
      "============ 953 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.6758 if \n",
      "   +3.2999 if cp<=-0.007844104617834073\n",
      "   +3.6542 if cp>=-0.06365211308002472\n",
      "   +2.5027 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.057533575594425214\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp<=0.009867694973945622\n",
      "   +0.0000 if cp>=0.027012259513139725\n",
      "Run episode 953 with rewards 11.0\n",
      "============ 954 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -32.3768 if \n",
      "   -8.4377 if cp<=-0.007844104617834073\n",
      "   -9.3284 if cp>=-0.06365211308002472\n",
      "   -6.3994 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.00945331808179617\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp>=0.027012259513139725\n",
      "   +0.0000 if pa<=-0.014514580368995667\n",
      "Run episode 954 with rewards 9.0\n",
      "============ 955 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +32.3768 if \n",
      "   +8.4377 if cp<=-0.007844104617834073\n",
      "   +9.3284 if cp>=-0.06365211308002472\n",
      "   +6.3994 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.060203305631876\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if pa<=-0.014514580368995667\n",
      "   +0.0000 if \n",
      "Run episode 955 with rewards 10.0\n",
      "============ 956 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.1458 if \n",
      "   -3.1653 if cp<=-0.007844104617834073\n",
      "   -3.4994 if cp>=-0.06365211308002472\n",
      "   -2.4007 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.091136234998703\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   -0.0000 if cp>=-0.06123814582824706\n",
      "   +0.0000 if cp>=-0.06123814582824706\n",
      "Run episode 956 with rewards 9.0\n",
      "============ 957 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.3040 if \n",
      "   +3.0078 if cp<=-0.007844104617834073\n",
      "   +3.7049 if cp>=-0.06365211308002472\n",
      "   +2.3134 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.039196067303419124\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08001774400472642\n",
      "   -0.0000 if cp<=0.04166023135185242\n",
      "   -0.0000 if cp>=0.007676219381392013\n",
      "   +0.0000 if cp<=0.007676219381392013 & cp>=-0.013656316697597502\n",
      "Run episode 957 with rewards 9.0\n",
      "============ 958 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -30.8467 if \n",
      "   -7.5484 if cp<=-0.007844104617834073\n",
      "   -9.2800 if cp>=-0.06365211308002472\n",
      "   -5.8089 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.044518618285655974\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   -0.0000 if cp>=0.007676219381392013\n",
      "   +0.0000 if cp<=0.0321730922907591\n",
      "Run episode 958 with rewards 10.0\n",
      "============ 959 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +31.1376 if \n",
      "   +4.3693 if cp<=-0.007844104617834073\n",
      "  +11.1989 if cp>=-0.06365211308002472\n",
      "   +2.4732 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.07006693929433823 & cp>=0.004842014051973821\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.08001774400472642\n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp>=0.007676219381392013\n",
      "   +0.0000 if \n",
      "Run episode 959 with rewards 9.0\n",
      "============ 960 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -13.4110 if \n",
      "   -1.9432 if cp<=-0.007844104617834073\n",
      "   -4.7889 if cp>=-0.06365211308002472\n",
      "   -1.1309 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.047201985865831374\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp>=0.007676219381392013\n",
      "   +0.0000 if cp>=-0.07946805953979492\n",
      "   +0.0000 if cp>=-0.047201985865831374\n",
      "Run episode 960 with rewards 9.0\n",
      "============ 961 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +13.4110 if \n",
      "   +1.9432 if cp<=-0.007844104617834073\n",
      "   +4.7889 if cp>=-0.06365211308002472\n",
      "   +1.1309 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.07403331696987153\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   -0.0000 if cp>=-0.07946805953979492\n",
      "   -0.0000 if cp>=-0.047201985865831374\n",
      "   +0.0000 if cp<=0.07403331696987153\n",
      "Run episode 961 with rewards 9.0\n",
      "============ 962 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -35.0468 if \n",
      "   -5.0865 if cp<=-0.007844104617834073\n",
      "  -12.5107 if cp>=-0.06365211308002472\n",
      "   -2.9642 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.045580434054136275\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   -0.0000 if cp>=-0.07946805953979492\n",
      "   -0.0000 if cp>=-0.047201985865831374\n",
      "   +0.0000 if cp>=-0.01346381902694702\n",
      "Run episode 962 with rewards 8.0\n",
      "============ 963 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +35.0468 if \n",
      "   +5.0865 if cp<=-0.007844104617834073\n",
      "  +12.5107 if cp>=-0.06365211308002472\n",
      "   +2.9642 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.0442008137702942\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp>=-0.07946805953979492\n",
      "   +0.0000 if cp>=-0.047201985865831374\n",
      "   +0.0000 if \n",
      "Run episode 963 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 964 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.7882 if \n",
      "   -2.2148 if cp<=-0.007844104617834073\n",
      "   -4.3716 if cp>=-0.06365211308002472\n",
      "   -1.4658 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.05247332602739334\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   -0.0000 if cp>=-0.047201985865831374\n",
      "   +0.0000 if cp<=-0.016236043721437454 & cp>=-0.0858678713440895\n",
      "   +0.0000 if cp>=-0.0858678713440895\n",
      "Run episode 964 with rewards 10.0\n",
      "============ 965 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.7882 if \n",
      "   +2.2148 if cp<=-0.007844104617834073\n",
      "   +4.3716 if cp>=-0.06365211308002472\n",
      "   +1.4658 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.07913035154342651\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   -0.0000 if cp>=-0.047201985865831374\n",
      "   -0.0000 if cp<=-0.016236043721437454 & cp>=-0.0858678713440895\n",
      "   +0.0000 if cp<=0.12050481140613556\n",
      "Run episode 965 with rewards 10.0\n",
      "============ 966 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -32.6201 if \n",
      "   -5.6799 if cp<=-0.007844104617834073\n",
      "  -11.1376 if cp>=-0.06365211308002472\n",
      "   -3.7716 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.1206812471151352\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   -0.0000 if cp>=-0.047201985865831374\n",
      "   +0.0000 if cp<=0.12050481140613556\n",
      "   +0.0000 if cp>=-0.07945004254579544\n",
      "Run episode 966 with rewards 9.0\n",
      "============ 967 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +32.6201 if \n",
      "   +5.6799 if cp<=-0.007844104617834073\n",
      "  +11.1376 if cp>=-0.06365211308002472\n",
      "   +3.7716 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.04741522520780564\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp>=-0.047201985865831374\n",
      "   +0.0000 if cp<=0.12050481140613556\n",
      "   +0.0000 if \n",
      "Run episode 967 with rewards 10.0\n",
      "============ 968 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.3223 if \n",
      "   -2.6415 if cp<=-0.007844104617834073\n",
      "   -3.7607 if cp>=-0.06365211308002472\n",
      "   -1.9557 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.06414062529802322\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp<=0.12050481140613556\n",
      "   -0.0000 if cp>=-0.03466628119349479\n",
      "   +0.0000 if cp>=-0.03466628119349479\n",
      "Run episode 968 with rewards 10.0\n",
      "============ 969 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.4276 if \n",
      "   +2.6270 if cp<=-0.007844104617834073\n",
      "   +3.9129 if cp>=-0.06365211308002472\n",
      "   +1.7536 if cp<=0.018871868029236804\n",
      "   +0.8794 if cp<=0.055510670691728596\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   -0.0000 if cp<=0.12050481140613556\n",
      "   -0.0000 if cp>=0.09495299756526948\n",
      "   +0.0000 if cp<=0.09495299756526948 & cp>=0.055510670691728596\n",
      "Run episode 969 with rewards 8.0\n",
      "============ 970 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -31.1877 if \n",
      "   -6.6060 if cp<=-0.007844104617834073\n",
      "   -9.8145 if cp>=-0.06365211308002472\n",
      "   -4.4152 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.04547908902168273\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp<=0.12050481140613556\n",
      "   +0.0000 if cp>=0.09495299756526948\n",
      "   +0.0000 if cp>=-0.02935704141855239\n",
      "Run episode 970 with rewards 9.0\n",
      "============ 971 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +31.1877 if \n",
      "   +6.6060 if cp<=-0.007844104617834073\n",
      "   +9.8145 if cp>=-0.06365211308002472\n",
      "   +4.4152 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.08099797368049623\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp<=0.12050481140613556\n",
      "   +0.0000 if cp>=-0.02935704141855239\n",
      "   +0.0000 if \n",
      "Run episode 971 with rewards 9.0\n",
      "============ 972 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -11.9440 if \n",
      "   -2.6462 if cp<=-0.007844104617834073\n",
      "   -3.6962 if cp>=-0.06365211308002472\n",
      "   -1.8175 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.050469073653221126\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.04166023135185242\n",
      "   +0.0000 if cp<=0.12050481140613556\n",
      "   -0.0000 if cp>=-0.02728560119867324\n",
      "   +0.0000 if cp>=-0.02728560119867324\n",
      "Run episode 972 with rewards 9.0\n",
      "============ 973 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +12.1209 if \n",
      "   +2.4826 if cp<=-0.007844104617834073\n",
      "   +3.9317 if cp>=-0.06365211308002472\n",
      "   +1.6379 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.05609503462910653 & cp>=-0.008854839578270912\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.04166023135185242\n",
      "   -0.0000 if cp<=0.12050481140613556\n",
      "   -0.0000 if cp>=0.05609503462910653\n",
      "   +0.0000 if cp>=0.05609503462910653\n",
      "Run episode 973 with rewards 9.0\n",
      "============ 974 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -29.9833 if \n",
      "   -6.1676 if cp<=-0.007844104617834073\n",
      "   -9.7133 if cp>=-0.06365211308002472\n",
      "   -4.0738 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp>=-0.03240164630115032\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.12050481140613556\n",
      "   +0.0000 if cp>=0.05609503462910653\n",
      "   -0.0000 if cp>=-0.06486972868442535\n",
      "   +0.0000 if cp>=-0.06486972868442535\n",
      "Run episode 974 with rewards 10.0\n",
      "============ 975 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +29.9833 if \n",
      "   +6.1676 if cp<=-0.007844104617834073\n",
      "   +9.7133 if cp>=-0.06365211308002472\n",
      "   +4.0738 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=0.09280535131692887\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.12050481140613556\n",
      "   +0.0000 if cp>=-0.06486972868442535\n",
      "   +0.0000 if \n",
      "   +0.0000 if \n",
      "Run episode 975 with rewards 10.0\n",
      "============ 976 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -12.6866 if \n",
      "   -4.1010 if cp<=-0.007844104617834073\n",
      "   -2.4609 if cp>=-0.06365211308002472\n",
      "   -3.3462 if cp<=0.018871868029236804\n",
      "   +1.0000 if cp<=-0.12258328199386596\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.12050481140613556\n",
      "   +0.0000 if cp>=-0.08189549297094345\n",
      "   +0.0000 if cp<=-0.03796394169330597 & cp>=-0.12258328199386596\n",
      "   +0.0000 if cp>=-0.08189549297094345\n",
      "Run episode 976 with rewards 11.0\n",
      "============ 977 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "  +15.3950 if \n",
      "   +2.2917 if cp<=-0.007844104617834073\n",
      "   +9.6805 if cp>=-0.06365211308002472\n",
      "   +1.8699 if cp<=0.018871868029236804\n",
      "  -21.5201 if cp<=0.10888379067182544\n",
      "--------------\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.12050481140613556\n",
      "   +0.0000 if cp<=-0.03796394169330597 & cp>=-0.12258328199386596\n",
      "   -0.0000 if cp>=0.0731930062174797\n",
      "   +0.0000 if cp<=0.16018934547901154 & cp>=0.0731930062174797\n",
      "Run episode 977 with rewards 11.0\n",
      "============ 978 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +15.3950 if \n",
      "   +2.2917 if cp<=-0.007844104617834073\n",
      "   +9.6805 if cp>=-0.06365211308002472\n",
      "  +21.5201 if cp<=0.10888379067182544\n",
      "   +1.0000 if cv<=-0.9390060901641846 & pa>=0.046297155320644406\n",
      "--------------\n",
      "  -14.8492 if \n",
      "  -14.8492 if cp<=0.12050481140613556\n",
      "   -0.0000 if cp>=0.0731930062174797\n",
      "   -0.0000 if cp<=0.16018934547901154 & cp>=0.0731930062174797\n",
      "   +1.0000 if cp>=-0.06237262114882469\n",
      "Run episode 978 with rewards 9.0\n",
      "============ 979 ===========\n",
      "12 actions [1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=-0.007844104617834073\n",
      "   +0.0000 if cp>=-0.06365211308002472\n",
      "   -0.0000 if cp<=0.10888379067182544\n",
      "   +0.0000 if cp>=-0.07110647112131119\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.12050481140613556\n",
      "   +0.0000 if cp>=0.0731930062174797\n",
      "   -0.0000 if cp>=-0.06237262114882469\n",
      "   +0.0000 if cp>=-0.10210026949644088\n",
      "Run episode 979 with rewards 12.0\n",
      "============ 980 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -5.1605 if \n",
      "   +0.9426 if cp<=-0.007844104617834073\n",
      "   -5.1605 if cp>=-0.06365211308002472\n",
      "   -5.1605 if cp<=0.10888379067182544\n",
      "   +1.0000 if cp>=-0.02869724445044994 & cv<=0.7967338562011719\n",
      "--------------\n",
      "   +6.9051 if \n",
      "   +6.9051 if cp<=0.12050481140613556\n",
      "   +7.6355 if cp>=0.0731930062174797\n",
      "   +6.9051 if cp>=-0.06237262114882469\n",
      "   +1.0000 if cp>=0.05044594630599023 & cv>=0.7967338562011719\n",
      "Run episode 980 with rewards 9.0\n",
      "============ 981 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.06365211308002472\n",
      "   -0.0000 if cp<=0.10888379067182544\n",
      "   -0.0000 if cp>=-0.02869724445044994 & cv<=0.7967338562011719\n",
      "   +0.0000 if cp<=0.04937243014574051\n",
      "--------------\n",
      "   -0.0013 if \n",
      "   +0.0000 if cp<=0.12050481140613556\n",
      "   -0.0013 if cp>=0.0731930062174797\n",
      "   -0.0013 if cp>=-0.06237262114882469\n",
      "   +0.0000 if cp<=0.062027630209922795\n",
      "Run episode 981 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 982 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +14.4809 if \n",
      "   -1.9528 if cp>=-0.06365211308002472\n",
      "  +14.4809 if cp<=0.10888379067182544\n",
      "   +4.2180 if cp>=-0.02869724445044994 & cv<=0.7967338562011719\n",
      "   +1.0000 if cp<=0.025459470599889757\n",
      "--------------\n",
      "  -14.7808 if \n",
      "  -14.7812 if cp<=0.12050481140613556\n",
      "   +0.0005 if cp>=0.0731930062174797\n",
      "   +2.0026 if cp>=-0.06237262114882469\n",
      "   +1.0000 if cp>=-0.01708525437861681\n",
      "Run episode 982 with rewards 9.0\n",
      "============ 983 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp>=-0.06365211308002472\n",
      "   -0.0000 if cp<=0.10888379067182544\n",
      "   -0.0000 if cp>=-0.02869724445044994 & cv<=0.7967338562011719\n",
      "   +0.0000 if cp>=-0.04149352014064789\n",
      "--------------\n",
      "  +23.8055 if \n",
      "  +23.7998 if cp<=0.12050481140613556\n",
      "   +5.4452 if cp>=-0.06237262114882469\n",
      "  -12.5745 if cp>=-0.01708525437861681\n",
      "   +1.0000 if cp>=-0.10251039713621139\n",
      "Run episode 983 with rewards 9.0\n",
      "============ 984 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.06365211308002472\n",
      "   +0.0000 if cp<=0.10888379067182544\n",
      "   -0.0000 if cp>=-0.02869724445044994 & cv<=0.7967338562011719\n",
      "   +0.0000 if cp<=0.09619892239570618 & cp>=0.02830362394452095\n",
      "--------------\n",
      "  -10.1495 if \n",
      "   -8.5111 if cp<=0.12050481140613556\n",
      "   -4.3382 if cp>=-0.06237262114882469\n",
      "   -6.5947 if cp>=-0.01708525437861681\n",
      "   +1.0000 if cp>=0.02830362394452095\n",
      "Run episode 984 with rewards 9.0\n",
      "============ 985 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.06365211308002472\n",
      "   -0.0000 if cp>=-0.02869724445044994 & cv<=0.7967338562011719\n",
      "   +0.0000 if cp<=0.09619892239570618 & cp>=0.02830362394452095\n",
      "   +0.0000 if cp<=-0.015515549667179582\n",
      "--------------\n",
      "  +10.1495 if \n",
      "   +8.5111 if cp<=0.12050481140613556\n",
      "   +4.3382 if cp>=-0.06237262114882469\n",
      "   +6.5947 if cp>=-0.01708525437861681\n",
      "   +1.0000 if cp>=-0.015515549667179582\n",
      "Run episode 985 with rewards 9.0\n",
      "============ 986 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.06365211308002472\n",
      "   -0.0000 if cp>=-0.02869724445044994 & cv<=0.7967338562011719\n",
      "   -0.0000 if cp<=-0.015515549667179582\n",
      "   +0.0000 if cp>=0.035114061087369926\n",
      "--------------\n",
      "   -5.1131 if \n",
      "   -4.2877 if cp<=0.12050481140613556\n",
      "   -2.1855 if cp>=-0.06237262114882469\n",
      "   -3.3223 if cp>=-0.01708525437861681\n",
      "   +1.0000 if cp<=-0.02827070765197277\n",
      "Run episode 986 with rewards 10.0\n",
      "============ 987 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0137 if \n",
      "   -0.0064 if cp>=-0.06365211308002472\n",
      "   +0.0000 if cp>=-0.02869724445044994 & cv<=0.7967338562011719\n",
      "   -0.0137 if cp<=-0.015515549667179582\n",
      "   -0.0137 if cp<=-0.0008647551760077457\n",
      "--------------\n",
      "   +8.5396 if \n",
      "   +7.7645 if cp<=0.12050481140613556\n",
      "   +2.3581 if cp>=-0.06237262114882469\n",
      "   +2.2542 if cp>=-0.01708525437861681\n",
      "   +1.0000 if pa>=0.17228783667087555\n",
      "Run episode 987 with rewards 10.0\n",
      "============ 988 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.06365211308002472\n",
      "   -0.0000 if cp<=-0.015515549667179582\n",
      "   -0.0000 if cp<=-0.0008647551760077457\n",
      "   +0.0000 if cp<=-0.024200992286205293\n",
      "--------------\n",
      "   -6.9064 if \n",
      "   -6.2794 if cp<=0.12050481140613556\n",
      "   -1.9058 if cp>=-0.06237262114882469\n",
      "   -1.8253 if cp>=-0.01708525437861681\n",
      "   +1.0000 if cp<=-0.024200992286205293\n",
      "Run episode 988 with rewards 8.0\n",
      "============ 989 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0002 if \n",
      "   -0.0000 if cp>=-0.06365211308002472\n",
      "   -0.0002 if cp<=-0.015515549667179582\n",
      "   -0.0002 if cp<=-0.0008647551760077457\n",
      "   -0.0002 if cp<=-0.03937829360365867\n",
      "--------------\n",
      "   +7.7597 if \n",
      "   +7.1434 if cp<=0.12050481140613556\n",
      "   +2.3928 if cp>=-0.06237262114882469\n",
      "   +1.7186 if cp>=-0.01708525437861681\n",
      "   +0.9997 if cp>=-0.015194289386272427\n",
      "Run episode 989 with rewards 10.0\n",
      "============ 990 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0001 if \n",
      "   +0.0000 if cp<=-0.015515549667179582\n",
      "   +0.0000 if cp<=-0.0008647551760077457\n",
      "   +0.0000 if cp<=-0.03937829360365867\n",
      "   +0.0001 if cp>=0.133489727973938\n",
      "--------------\n",
      "  -10.0671 if \n",
      "   -4.0190 if cp<=0.12050481140613556\n",
      "   -4.7574 if cp>=-0.06237262114882469\n",
      "   -4.0904 if cp>=-0.01708525437861681\n",
      "   +1.0000 if cp<=0.133489727973938\n",
      "Run episode 990 with rewards 10.0\n",
      "============ 991 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0001 if \n",
      "   -0.0001 if cp<=-0.015515549667179582\n",
      "   -0.0001 if cp<=-0.0008647551760077457\n",
      "   +0.0000 if cp>=0.133489727973938\n",
      "   -0.0001 if cp<=-0.048983094096183774\n",
      "--------------\n",
      "  +10.9025 if \n",
      "   +4.9526 if cp<=0.12050481140613556\n",
      "   +4.7628 if cp>=-0.06237262114882469\n",
      "   +3.5763 if cp>=-0.01708525437861681\n",
      "   +0.9995 if cp>=-0.0072799010318703936\n",
      "Run episode 991 with rewards 9.0\n",
      "============ 992 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.015515549667179582\n",
      "   +0.0000 if cp<=-0.0008647551760077457\n",
      "   +0.0000 if cp<=-0.048983094096183774\n",
      "   +0.0000 if cp>=0.1103552281856537\n",
      "--------------\n",
      "   -9.3692 if \n",
      "   -4.1804 if cp<=0.12050481140613556\n",
      "   -4.1622 if cp>=-0.06237262114882469\n",
      "   -3.1560 if cp>=-0.01708525437861681\n",
      "   +0.9168 if cp>=0.15242810547351837\n",
      "Run episode 992 with rewards 10.0\n",
      "============ 993 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0001 if \n",
      "   -0.0001 if cp<=-0.015515549667179582\n",
      "   -0.0001 if cp<=-0.0008647551760077457\n",
      "   +0.0000 if cp>=0.1103552281856537\n",
      "   -0.0001 if cp<=-0.08261779993772507\n",
      "--------------\n",
      "  +10.7049 if \n",
      "   +5.6448 if cp<=0.12050481140613556\n",
      "   +3.7284 if cp>=-0.06237262114882469\n",
      "   +2.2140 if cp>=-0.01708525437861681\n",
      "   +1.0000 if cp<=0.005304522626101971 & cp>=-0.08261779993772507\n",
      "Run episode 993 with rewards 9.0\n",
      "============ 994 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.015515549667179582\n",
      "   +0.0000 if cp<=-0.0008647551760077457\n",
      "   +0.0000 if cp<=-0.08261779993772507\n",
      "   +0.0000 if cp>=0.04308824203908444\n",
      "--------------\n",
      "   -8.8574 if \n",
      "   -4.6707 if cp<=0.12050481140613556\n",
      "   -3.0851 if cp>=-0.06237262114882469\n",
      "   -1.8321 if cp>=-0.01708525437861681\n",
      "   +1.0000 if cp<=0.012128297984600068\n",
      "Run episode 994 with rewards 9.0\n",
      "============ 995 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0001 if \n",
      "   -0.0001 if cp<=-0.015515549667179582\n",
      "   -0.0001 if cp<=-0.0008647551760077457\n",
      "   +0.0000 if cp>=0.04308824203908444\n",
      "   -0.0001 if pa>=0.16527299582958221\n",
      "--------------\n",
      "   +9.5137 if \n",
      "   +5.3796 if cp<=0.12050481140613556\n",
      "   +3.4500 if cp>=-0.06237262114882469\n",
      "   +1.7101 if cp>=-0.01708525437861681\n",
      "   +0.9927 if cp>=-0.013819941505789754\n",
      "Run episode 995 with rewards 10.0\n",
      "============ 996 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.015515549667179582\n",
      "   +0.0000 if cp<=-0.0008647551760077457\n",
      "   +0.0000 if pa>=0.16527299582958221\n",
      "   +0.0000 if cp>=0.14367322623729706\n",
      "--------------\n",
      "  -10.0930 if \n",
      "   -5.3469 if cp<=0.12050481140613556\n",
      "   -4.1774 if cp>=-0.06237262114882469\n",
      "   -2.4800 if cp>=-0.01708525437861681\n",
      "   +0.4573 if cp>=0.14367322623729706\n",
      "Run episode 996 with rewards 10.0\n",
      "============ 997 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=-0.015515549667179582\n",
      "   -0.0000 if cp<=-0.0008647551760077457\n",
      "   +0.0000 if cp>=0.14367322623729706\n",
      "   +0.0000 if cp<=-0.05892395377159119\n",
      "--------------\n",
      "  +10.2719 if \n",
      "   +5.5422 if cp<=0.12050481140613556\n",
      "   +4.1810 if cp>=-0.06237262114882469\n",
      "   +2.3761 if cp>=-0.01708525437861681\n",
      "   +0.9862 if cp>=-0.01802050657570362\n",
      "Run episode 997 with rewards 10.0\n",
      "============ 998 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=-0.015515549667179582\n",
      "   -0.0000 if cp<=-0.0008647551760077457\n",
      "   +0.0000 if cp<=-0.05892395377159119\n",
      "   +0.0000 if cp<=-0.02646150141954422\n",
      "--------------\n",
      "   -8.0135 if \n",
      "   -4.3234 if cp<=0.12050481140613556\n",
      "   -3.2613 if cp>=-0.06237262114882469\n",
      "   -1.8543 if cp>=-0.01708525437861681\n",
      "   +1.0000 if cp<=-0.02646150141954422\n",
      "Run episode 998 with rewards 10.0\n",
      "============ 999 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0009 if \n",
      "   -0.0009 if cp<=-0.015515549667179582\n",
      "   -0.0009 if cp<=-0.0008647551760077457\n",
      "   -0.0009 if cp<=-0.02646150141954422\n",
      "   -0.0007 if cp<=-0.06868215501308442\n",
      "--------------\n",
      "  +11.0286 if \n",
      "   +7.5487 if cp<=0.12050481140613556\n",
      "   +2.2535 if cp>=-0.06237262114882469\n",
      "   -0.2648 if cp>=-0.01708525437861681\n",
      "   +1.0000 if cp<=0.015217326581478119 & cp>=-0.06868215501308442\n",
      "Run episode 999 with rewards 10.0\n",
      "\n",
      "Done\n"
     ]
    }
   ],
   "source": [
    "rewards = train()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "id": "3d20e8e0",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-------------------------\n",
      "   -4.1721 if cp>=-0.34897989034652704 & cv>=-0.9436933159828186 & pa>=-0.03141852095723152 & pav>=0.504111683368683\n",
      "   -0.0000 if cp>=-0.5207653045654297 & cv>=-1.0628056526184082 & pa<=-0.03944564238190651 & pav>=0.22416704893112188\n",
      "   -0.0000 if cp<=0.04635245129466057 & cp>=-1.2734074354171754 & pa<=-0.032383657246828075 & pav>=0.6297808408737183\n",
      "   +0.9051 if cp<=0.0496792197227478 & cv>=0.0012940536485984934 & pav<=-0.04089766442775719 & pav>=-0.42539845705032336\n",
      "   -2.6151 if pav>=0.8499523997306824\n",
      "-------------------------\n",
      "   -8.0570 if pa<=0.006895773485302927 & pav<=0.5752061486244202\n",
      "   -6.4523 if pa<=0.00662959311157465\n",
      "   -9.5233 if cp>=-0.2101022720336914 & cv<=0.22678737342357635 & cv>=0.030156206339597712 & pa>=0.007871035486459744 & pa>=0.022794276475906396\n",
      "   +5.1435 if \n",
      "   +1.1519 if cp>=-0.00408112602308392 & cv>=-0.056063193082809444 & pav>=0.3578081905841828\n"
     ]
    }
   ],
   "source": [
    "# Print the rule list stored at positions 0 and 1 of actor.best_model.\n",
    "# NOTE(review): presumably one ensemble per CartPole action -- confirm against the actor class.\n",
    "for model_idx in (0, 1):\n",
    "    print('-------------------------')\n",
    "    print(actor.best_model[model_idx].rules_)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "id": "0b443f87",
   "metadata": {},
   "outputs": [],
   "source": [
    "def test(num_test_episodes=100, max_steps=9999, verbose=True):\n",
    "    \"\"\"\n",
    "    Evaluate the trained actor greedily and report its average episode reward.\n",
    "\n",
    "    Reads the notebook-level globals `env`, `actor` and `column_names`.\n",
    "\n",
    "    Args:\n",
    "        num_test_episodes (int): Number of episodes to run; must be at least 1.\n",
    "        max_steps (int): Maximum number of environment steps per episode.\n",
    "        verbose (bool): Print the reward of each episode when True.\n",
    "\n",
    "    Returns:\n",
    "        float: Average reward over the test episodes.\n",
    "\n",
    "    Raises:\n",
    "        ValueError: If num_test_episodes is smaller than 1.\n",
    "    \"\"\"\n",
    "    if num_test_episodes < 1:\n",
    "        # Fail with a clear message instead of a ZeroDivisionError at the final average\n",
    "        raise ValueError(f\"num_test_episodes must be >= 1, got {num_test_episodes}\")\n",
    "\n",
    "    total_reward = 0\n",
    "\n",
    "    for episode in range(num_test_episodes):\n",
    "        state = env.reset()[0]  # reset() returns a tuple; element 0 is the initial observation\n",
    "        episode_reward = 0\n",
    "\n",
    "        for _step in range(max_steps):\n",
    "            # Wrap the single observation in a one-row frame labelled with column_names\n",
    "            observation = pd.DataFrame(np.array([state]), columns=column_names)\n",
    "            action_scores = actor.predict(observation)\n",
    "            # Act greedily: pick the index of the largest predicted value\n",
    "            action = np.argmax(action_scores)\n",
    "            next_state, reward, done, trunc, _ = env.step(action)\n",
    "            episode_reward += reward\n",
    "            if done or trunc:\n",
    "                break\n",
    "            state = next_state\n",
    "\n",
    "        total_reward += episode_reward\n",
    "        if verbose:\n",
    "            print(f\"Test Episode {episode + 1}, Reward: {episode_reward}\")\n",
    "\n",
    "    avg_reward = total_reward / num_test_episodes\n",
    "    print(f\"\\nAverage Reward over {num_test_episodes} Test Episodes: {avg_reward}\")\n",
    "    return avg_reward"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "id": "ef9e3e26",
   "metadata": {
    "scrolled": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Test Episode 1, Reward: 404.0\n",
      "Test Episode 2, Reward: 94.0\n",
      "Test Episode 3, Reward: 273.0\n",
      "Test Episode 4, Reward: 96.0\n",
      "Test Episode 5, Reward: 77.0\n",
      "Test Episode 6, Reward: 55.0\n",
      "Test Episode 7, Reward: 69.0\n",
      "Test Episode 8, Reward: 107.0\n",
      "Test Episode 9, Reward: 144.0\n",
      "Test Episode 10, Reward: 69.0\n",
      "Test Episode 11, Reward: 133.0\n",
      "Test Episode 12, Reward: 299.0\n",
      "Test Episode 13, Reward: 33.0\n",
      "Test Episode 14, Reward: 148.0\n",
      "Test Episode 15, Reward: 106.0\n",
      "Test Episode 16, Reward: 59.0\n",
      "Test Episode 17, Reward: 109.0\n",
      "Test Episode 18, Reward: 198.0\n",
      "Test Episode 19, Reward: 29.0\n",
      "Test Episode 20, Reward: 61.0\n",
      "Test Episode 21, Reward: 35.0\n",
      "Test Episode 22, Reward: 129.0\n",
      "Test Episode 23, Reward: 40.0\n",
      "Test Episode 24, Reward: 227.0\n",
      "Test Episode 25, Reward: 32.0\n",
      "Test Episode 26, Reward: 82.0\n",
      "Test Episode 27, Reward: 309.0\n",
      "Test Episode 28, Reward: 91.0\n",
      "Test Episode 29, Reward: 178.0\n",
      "Test Episode 30, Reward: 29.0\n",
      "Test Episode 31, Reward: 54.0\n",
      "Test Episode 32, Reward: 39.0\n",
      "Test Episode 33, Reward: 375.0\n",
      "Test Episode 34, Reward: 85.0\n",
      "Test Episode 35, Reward: 224.0\n",
      "Test Episode 36, Reward: 207.0\n",
      "Test Episode 37, Reward: 500.0\n",
      "Test Episode 38, Reward: 33.0\n",
      "Test Episode 39, Reward: 338.0\n",
      "Test Episode 40, Reward: 373.0\n",
      "Test Episode 41, Reward: 90.0\n",
      "Test Episode 42, Reward: 84.0\n",
      "Test Episode 43, Reward: 47.0\n",
      "Test Episode 44, Reward: 79.0\n",
      "Test Episode 45, Reward: 141.0\n",
      "Test Episode 46, Reward: 277.0\n",
      "Test Episode 47, Reward: 153.0\n",
      "Test Episode 48, Reward: 57.0\n",
      "Test Episode 49, Reward: 40.0\n",
      "Test Episode 50, Reward: 87.0\n",
      "Test Episode 51, Reward: 33.0\n",
      "Test Episode 52, Reward: 32.0\n",
      "Test Episode 53, Reward: 58.0\n",
      "Test Episode 54, Reward: 285.0\n",
      "Test Episode 55, Reward: 113.0\n",
      "Test Episode 56, Reward: 251.0\n",
      "Test Episode 57, Reward: 168.0\n",
      "Test Episode 58, Reward: 117.0\n",
      "Test Episode 59, Reward: 74.0\n",
      "Test Episode 60, Reward: 36.0\n",
      "Test Episode 61, Reward: 96.0\n",
      "Test Episode 62, Reward: 399.0\n",
      "Test Episode 63, Reward: 39.0\n",
      "Test Episode 64, Reward: 89.0\n",
      "Test Episode 65, Reward: 96.0\n",
      "Test Episode 66, Reward: 500.0\n",
      "Test Episode 67, Reward: 64.0\n",
      "Test Episode 68, Reward: 251.0\n",
      "Test Episode 69, Reward: 38.0\n",
      "Test Episode 70, Reward: 72.0\n",
      "Test Episode 71, Reward: 111.0\n",
      "Test Episode 72, Reward: 73.0\n",
      "Test Episode 73, Reward: 27.0\n",
      "Test Episode 74, Reward: 421.0\n",
      "Test Episode 75, Reward: 190.0\n",
      "Test Episode 76, Reward: 32.0\n",
      "Test Episode 77, Reward: 274.0\n",
      "Test Episode 78, Reward: 82.0\n",
      "Test Episode 79, Reward: 88.0\n",
      "Test Episode 80, Reward: 133.0\n",
      "Test Episode 81, Reward: 356.0\n",
      "Test Episode 82, Reward: 90.0\n",
      "Test Episode 83, Reward: 59.0\n",
      "Test Episode 84, Reward: 25.0\n",
      "Test Episode 85, Reward: 64.0\n",
      "Test Episode 86, Reward: 119.0\n",
      "Test Episode 87, Reward: 149.0\n",
      "Test Episode 88, Reward: 59.0\n",
      "Test Episode 89, Reward: 50.0\n",
      "Test Episode 90, Reward: 87.0\n",
      "Test Episode 91, Reward: 52.0\n",
      "Test Episode 92, Reward: 38.0\n",
      "Test Episode 93, Reward: 121.0\n",
      "Test Episode 94, Reward: 313.0\n",
      "Test Episode 95, Reward: 175.0\n",
      "Test Episode 96, Reward: 179.0\n",
      "Test Episode 97, Reward: 87.0\n",
      "Test Episode 98, Reward: 109.0\n",
      "Test Episode 99, Reward: 90.0\n",
      "Test Episode 100, Reward: 191.0\n",
      "\n",
      "Average Reward over 100 Test Episodes: 136.53\n"
     ]
    }
   ],
   "source": [
    "avg_test_reward = test(num_test_episodes=100)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "id": "31340922",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<matplotlib.lines.Line2D at 0x7f324128b1f0>]"
      ]
     },
     "execution_count": 28,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXcAAAD4CAYAAAAXUaZHAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8qNh9FAAAACXBIWXMAAAsTAAALEwEAmpwYAAA1vklEQVR4nO3deXxU1f3/8ddntoQkhAQICIQdFHFBEBUqtlWLWm3Vb21tq1XqUn/91tba+m3daq1bv9pvq9baWq1atW51q7jggoDixhJk38OesGQhezLrPb8/7p3JTBaSQCAzw+f5eEDuNjPn5k7ec+bcc88VYwxKKaXSi6unC6CUUqr7abgrpVQa0nBXSqk0pOGulFJpSMNdKaXSkKenCwDQv39/M2LEiJ4uhlJKpZQlS5ZUGGMK2lqXFOE+YsQIioqKeroYSimVUkRkW3vrtFlGKaXSkIa7UkqlIQ13pZRKQxruSimVhjoV7iKyVURWisgyESlylvUVkdkistH5me8sFxF5SESKRWSFiEw6mDuglFKqta7U3E83xpxgjJnszN8EzDHGjAXmOPMAXwfGOv+uAR7prsIqpZTqnANplrkAeNqZfhq4MG75M8a2AMgTkUEH8DpKKaW6qLPhboD3RWSJiFzjLBtojNnlTO8GBjrTQ4AdcY8tcZYlEJFrRKRIRIrKy8v3o+hKHZ7mrS+jpKqxp4uhklxnL2KaZowpFZEBwGwRWRe/0hhjRKRLA8MbYx4DHgOYPHmyDiqvVCdd8c/F9M7wsPKOs3u6KCqJdarmbowpdX6WAf8BTgb2RJtbnJ9lzualwNC4hxc6y5RS3aQuEO7pIqgk12G4i0i2iPSOTgNnAauAN4AZzmYzgJnO9BvA5U6vmSlATVzzjVJKqUOgM80yA4H/iEh0++eNMe+KyGLgJRG5CtgGXOxsPws4FygGGoErur3USiml9qnDcDfGbAYmtLG8EjizjeUGuLZbSqeUUmq/6BWqSimVhjTclVIqDWm4K6VUGtJwV0qpNKThrpRSaUjDXSml0pCGu1JKpSENd6WUSkMa7koplYY03JVSKg1puCulVBrScFdKqTSk4a6UUmlIw12pJPbdRz/nN6+v7OliqBSk4a5UElu4ZS/PLtje08VQKUjDXSml0pCGu1JKpSENd6WUSkMa7koplYY03JVSKg1puCulVBrScFcqhRhjeroIKkVouCulVBrScFcqhWjFXXWWhrtSSqUhDXelUohW3FVnabgrpVQa0nBXKoXcNnNVTxdBpQgNd6VSyPMLdYRI1Tka7koplYY03JVSKg1puCulVBrqdLiLiFtElorIW878SBFZKCLFIvJvEfE5yzOc+WJn/YiDVHallFLt6ErN/efA2rj5+4AHjDFjgCrgKmf5VUCVs/wBZzullFKHUKfCXUQKgfOAx515Ac4AXnE2eRq40Jm+wJnHWX+ms71SSqlDpLM19weBXwOWM98PqDbGhJ35EmCIMz0E2AHgrK9xtk8gIteISJGIFJWXl+9f6ZVSSrWpw3AXkW8AZcaYJd35wsaYx4wxk40xkwsKCrrzqZVS6rDn6cQ2pwLni8i5QCaQC/wZyBMRj1M7LwRKne1LgaFAiYh4gD5AZbeXXCmlVLs6rLkbY242xhQaY0YA3wPmGmMuBeYB33Y2mwHMdKbfcOZx1s81eocBpZQ6pA6kn/uNwC9FpBi7Tf0JZ/kTQD9n+S+Bmw6siEoppbqqM80yMcaYD4EPnenNwMltbOMHvtMNZVNKKbWf9ApVpZRKQxruSimVhjTclVIqDWm4K6VUGtJwV0qpNKThrpRSaUjDXSml0pCGu1JKpSENd6WUSkMa7koplYY03JVSKg1puCulVBrScFdKqTSk4a6UUmlIw10ppdKQhrtSSqUhDXellEpDGu5KKZWGNNyVUioNdekeqkqpnrG9spFH52/q6WKoFKLhrlQK+NmLS1m+o7qni6FSiDbLKKVU
GtJwV0qpNKThrlQKkJ4ugEo5Gu5KKZWGNNyVUioNabgrlQJE22VUF2m4K6VUGtJwVyoFaMVddZWGu1JKpSENd6WUSkMdhruIZIrIIhFZLiKrReQOZ/lIEVkoIsUi8m8R8TnLM5z5Ymf9iIO8D0qlPdEzqqqLOlNzDwBnGGMmACcA54jIFOA+4AFjzBigCrjK2f4qoMpZ/oCznVJKqUOow3A3tnpn1uv8M8AZwCvO8qeBC53pC5x5nPVnilY7lFLqkOpUm7uIuEVkGVAGzAY2AdXGmLCzSQkwxJkeAuwAcNbXAP3aeM5rRKRIRIrKy8sPaCeUSndaO1Jd1alwN8ZEjDEnAIXAycC4A31hY8xjxpjJxpjJBQUFB/p0SqUdY0xPF0GlsC71ljHGVAPzgKlAnohEx4MvBEqd6VJgKICzvg9Q2R2FVUop1Tmd6S1TICJ5znQvYDqwFjvkv+1sNgOY6Uy/4czjrJ9rtAqiVJfpX406EJ25E9Mg4GkRcWN/GLxkjHlLRNYAL4rI3cBS4Aln+yeAf4lIMbAX+N5BKLdSaU+zXR2IDsPdGLMCmNjG8s3Y7e8tl/uB73RL6ZRSgA4cprpOr1BVKklpa6Y6EBruSiUpjXZ1IDTclUpS8RV30Z7uqos03JVSKg1puCuVpAwJVXelukTDXakkFYpoq7vafxruSiWhxmCYY29/r6eLoVKYhrtSSaiqMZQwr60yqqs03JVKQuGI1dNFUClOw12pJBS2Etvb9QpV1VUa7koloUBIa+7qwGi4K5WE/OFITxdBpTgNd6WSkD9kh3sv/GQQTFg3RkrIpaEniqVSiIa7UkkoELabZdZmXsls368S1n2Q8Wte8t3ZE8VSKUTDXakkFAg1N8sMc7W+x/A4145DWRyVgjTclUpC0Zp7VPPAYXrVquocDXelkpDVzljuLg131Uka7koloZbZ/vlm+x7zXsI9UBqVijTclUohHrSLpOocDXelklDLmnsu9QC4NdxVJ2m4K5WEWrasv+G7DQCvhrvqJA13pZJQy5tjj3DtAeBKzzs9URyVgjTclUpCJu7/eNd63jjURVEpSsNdqSTlRgcPU/tPw12pZGTa6hmjfdxV52m4K5WEDKZVuGcQamdrpVrTcFcqCZk2au69CPRQaVQq0nBXKgkZWnd7zMbfM4VRKUnDXakkZEzrC5ZypKmHSqNSkYa7UknKK83hvskaxCCp7MHSqFSj4a5UErJPqNqDhFlG8BFmmJT1cKlUKukw3EVkqIjME5E1IrJaRH7uLO8rIrNFZKPzM99ZLiLykIgUi8gKEZl0sHdCqXRjDPiccK+nF14Jkxd3a72A8fRU0VSK6EzNPQzcYIwZD0wBrhWR8cBNwBxjzFhgjjMP8HVgrPPvGuCRbi+1UmnOAD6n66MfH24sfGLP15tMgnh7sHQqFXQY7saYXcaYL5zpOmAtMAS4AHja2exp4EJn+gLgGWNbAOSJyKDuLrhSac2YWM29yfhwYeEjTKPJ4PnImXr1qupQl9rcRWQEMBFYCAw0xuxyVu0GBjrTQ4D4GzyWOMtaPtc1IlIkIkXl5a3vEanU4c4ndrjHau6ECOHGwoVLw111oNPhLiI5wKvA9caY2vh1xh7CrkvXRhtjHjPGTDbGTC4oKOjKQ5VKe3Y/d6fm7oT7Dz3v00casRANd9WhToW7iHixg/05Y8xrzuI90eYW52f0VH4pMDTu4YXOMqVUJ9knVKNt7hn0juvjHsGlzTKqQ53pLSPAE8BaY8z9caveAGY40zOAmXHLL3d6zUwBauKab5RSnWCMiV2h6je+hHUWLtyig4ipfetMf6pTgcuAlSKyzFl2C3Av8JKIXAVsAy521s0CzgWKgUbgiu4ssFKHg/jeMk20CHcjzoQFLr1URbWtw3A3xnwCSDurz2xjewNce4DlUuqwF39CNV4k+oXbWOh1iKo9+s5QKgnFX8TU1KpZxqlrGb2fqmqfhrtSSSi+WSbQslkm+mdrabir
9mm4K5WE7BOq0a6QGQnrmmvu2mNGtU/DXakk1VazzPXBn8S1uWvNXbVPw12pJGRM8wnVQNw4MtvNgOZmGa25q33QcFcqSfkIETAeIrhjy0J44trcNdxV+zTclUpCBrvNPYi3uRkGO9y1WUZ1hoa7Ukko2hUyhLtFuLsxekJVdYKGu1JJKDpwWBBvczMMLWru2hVS7YOGu1JJyD6hGiJkPAk197Bxt7hCVam2abgrlaQyCBMkMdz9+OKaZbTmrtqn4a5UEmo+oerBMs1/po1kEDHaLKM6puGuVBKKjufesrdMAG/cFao67K9qn4a7UknKSzixXztgcDUPRxCobeeRSmm4K5WUjDF4JdLqhCpAqelvT9TqDc5U+zTclUpCxoAbizAufL7E2y7sNP2ciaU9UDKVKjTclUpSHiJEcBMRb8LyKnJZYw2HrZ/2UMlUKujMbfaUUoeYAdxECOPi49BRNLl9fGYdE1tfYXK1K6TaJw13pZKQMeDBIoKbqnAmx4afSFhv4dKLmNQ+abOMUknIYPAQ4cSRBQB280zc6JAWouGu9knDXakkZJ9QjdAvN6vN9RaiFzGpfdJwVypJeYggLm+b6wwuvYhJ7ZOGu1JJyABuscDV9mmxiLa5qw5ouCuVjIzd5o7L3eZqbXNXHdFwVyoJ2V0h26+52+Gube6qfRruSiUhuytkZB/hrs0yat803JVKQgbTiZp7c7hHLMPDczdS0xQ6VEVUSU7DXakkte8298Sa+9x1Zfzx/Q3c8/aaQ1U8leQ03JVKQtF+7u3V3A0CVnO4N4Xs9veGoLbDK5uGu1JJyBiDT9oP94hJrLlblt3n3SVySMqnkp+Gu1LJKBrcnWxzt0w03A96yVSK0HBXKgmJCdsT7s51hYxerKo1dxXVYbiLyJMiUiYiq+KW9RWR2SKy0fmZ7ywXEXlIRIpFZIWITDqYhVcqXbmiwd3JrpDBiD2t2a6iOlNzfwo4p8Wym4A5xpixwBxnHuDrwFjn3zXAI91TTKUOLy6ra+He6JxI1Zq7iuow3I0x84G9LRZfADztTD8NXBi3/BljWwDkicigbiqrUknpN6+v5NLHF3Trc0qHNffENvcvtlUB4NZwV479vVnHQGPMLmd6NzDQmR4C7IjbrsRZtosWROQa7No9w4YN289iKNXznl2wvdufM9bm3k4/95ZdIXdUNfJLz0v03zseOL7by6NSzwGfUDXGGOyhMLr6uMeMMZONMZMLCgoOtBhKpRWxouHeuVEhg2GL6zyvc8nO3x+K4qkUsL/hvifa3OL8LHOWlwJD47YrdJYppbpgf0+oKhW1v+H+BjDDmZ4BzIxbfrnTa2YKUBPXfKOU6qSutrkHwxruKlGHbe4i8gLwVaC/iJQAtwP3Ai+JyFXANuBiZ/NZwLlAMdAIXHEQytxKTWOIhmCYwXm9DsXLKXXQNbe572P4gfh+7uHAoSiWSiEdhrsx5vvtrDqzjW0NcO2BFqqrzvjTh1Q2BNl673mH+qWV6rIbXlrOgNwMbjxnXLvbdHRCtWWbuyfc2LzSssCl1yce7tLiHVDZEOzpIhwWpt03l2n3ze3pYqS8V78o4ZEPN+1zm+Z+7m3fQ7Vls4w30tS8MtTYxiPU4WZ/u0Kqw1BJVVPHG6lukXhCtfVIjyZaczcGRPBG/M1VtVATZOQcsrKq5JQWNXel0o2LfZ9QjRjnT9cYjDF4rbjautbcFRruSiWl5n7u+7hBNoCxCEUMWRJ3QjWk37CUhnvaKKlq5K/zijGmy9eTpaXisnoe/3hzTxejlYjV+viUVDXGxmOP6lRXSGBrRR3BiEUW/uaVWnNXaLinjaufLuL/3lufku3iH6zZw4+eKerW5/zW3z7l7rfXJl3/7+gdk6KKy+qYdt88Hp2f+EG0r3D/xvGD7DZ3YNHmckJhi+yEcE+994Dqfikf7v6Q3lYMoD5gf41PxYr71c8UMXvNHi5/chGn3ts9vXFq/fbvo62ack9qDIYT5nfs
tYN4webKhOWuDvq5R5yae1MwTDBi0UubZVQLKR/uzy7Y1qOvP29dWdLVDlPV/A3llFZ3bzCFrLaPze/eWM1Li3e0uS5edWOQix75jJKqjps6OtMk1t57peVgjq599HMXEXv4AWBYyZsEW9XcGzosh0p/KR/uoUjzH9Shbm9euLmSK55azJ9mrz+kr9uW6K6nyoiv63bX8nJRx+F6oCKRtt8TT322lV+/uqLDx7+xfCdLtlXx6Ecdt9935ktCuJ3ytHzrdjS2zBFij8J9+sbfO23uWnNXiVK+n7sn7qaRlgH3IQy3vc7FU9sqkucElpUi7TLnPPgxAN+ZPLSDLQ9MezX3gyFiGdxt3MR04546DFBa3URhJ4fIiLW5u1tfxORxCSWmeSTVUDhMlugJVZUo5cM9/o8pbFm42+k6djAkY4yGD1Ib8xLnZhA9Yc3OWjaW1XHBCUO6/NiWNeWmYITxt7/baruZy0oZO6A34wfn7nc51++uY8OeOi46sTBh+cWPfk5VYwiAy6YMb/Ox9YEwwbCFz2N/md7XnZgyPC6eiZxFNn5+5X0JU12iNXfVSso3y0TDfQBVREI9MwxBMjSFRJuk9vcEYnldgNU7a9pdf9Ejn+3X83aHcx/6mJ+/uGy/Htsy3Pc2Bts86fzzF5dx7kMfd+o531y+k/vfb90U982HP+GGl5e3Wh4NdoAtFYnt4capIizZVsWMJxfFlrtov809YhksXBRZRwHgrtpEFgEqjfPBpDV3RZqE+3RXEYsyr8XzwW8P6Wv39MnceNG8aq9NtyPTH/iI8x76pFVvjlTXslmmZRv8nlp/wnH856dbOnzOn72wlIfmFu9fefYx7vrncT1mpI2a+4PfPYG//+DE2Af4ZnMEAPM++5xs8VMnOYRxa81dAWkS7v/w3Q9A4+q3eXVJSbc+//Id1dz6n5WtTtZur2zks02V7Tzq0IsWb39r7tVO7XL8b9/rriJ1SldOgre80Afgw/Vl/KmNWnTU6p21CfMtb2rxk+e+4Devr4rN3/HmmrbL2YVGuJbHYIyUcKPnBQSr081mbQ0/cOHEIZxz7BGx5ygnj3qTibd6C1n48UsmfjI03BWQDuEuwmLrSAA2NmZzw8vLeHz+vkfc64pL/rGA5xZupyGY2J8+fAhP1HXFwSzXJNnAnZ5/Jty780BFg3CU7KQP9fvc1h9ufU3DD/+5mL/Mbf/K3OteWArAP+ZvZuKd7yfUnLNpYsu2zn37enbB9n1+cN7geYnXfbfhJpLQ3fGhORt50Ps3/tvzJmOllHDEwkuYH7nfgkBdu8+3rzb35nIIFaYP+VJHlgQIuHoRIAOC2hVSpUG4W8bgwf5jOlE28oT3j8yYe3K3v07LP2xJhob2ONGa5cG8aOe1jN9xuWc21O9JWL5mZy01ce3KXRG2DB7CzM34H17x3bHPbZuC7V+w1tjGuiz8DML+dnXPrLVUNYYSwv29jBv5IvPHsXk3EbyEqW4Mcv2LS6lpStyn15cm3jHyuYX2B4Ng8TPP65zg2kRvGhO+Hdw/ewNupxY+0VVMMGK42P0ht3qfh8//2u7+yD4GDov/AK8li1wayaaJoKsXfvFpzV0BaRDujcEIudg1FZcYznQvxUsYIvvXdlxeF2iz/3U4YvHOyl0c9Zt38IcivLl8Z2xdMuR8NNO7o7fMvtqFAWgoi01W1gc496GPufk/HfcZb0vEMhwjWwEY69r37XZf+Hh1u+v2tjGm/zO+e/k882cJtfrquA+hQqkAwEMYMMz2/YqnvPfx5zkbeX3ZTp5fuD3h5GutPzHsb/3PKpbvqGYQe2PLcsTfxoVK9hvkR+63yQjXMtXl7EdDebtXFDfX3FufUD1rvN3WPjA3g1qTRa40kEMTAXeO0yyjJ1RVGoT7nW+tIVca2GX6Jq5oKN+v5/vxs0v41Ssr2FWTWPsJRQz3vbuOQNiitLqJ+2dv2N8iHxTGQC/8rH/ldxh/bccPaMNw2c0xspUz/vRh
bNlDczYy+pZZiRvWN/9uo23a2yrtQPloQzl//6jzzWLhiGG4lMUtaTvttmZewk8Xnk6oemerdV92LSe85JlWyye77GMUrG8+N3L5k4voSy33eJ6ILfuN51n60MAo125Oda+m/26718x9767jj3Ht+fEnq/Oo4wLXJ1zw108Z7HxIgN3U88uXlsUNi2EYJvY3nTGunUwKLmGMOPvQWNnuhU/NvWU89OmV2Nf9ohMLWXvnOQzvm00t2fShgd7SRMCdTZO2uStHyod7oZRTILUss0Ynrqjf3eXn+uN762P9uVv2OglFrFhTTIc12wNgjOHFRdtjY8V01vjwatZmXsmMxmeoXPZ2lx5b59RI5/lu4O2MW3BV2T1GGgJh7p+9gRPMulhAAVC5MTYZ/V143fZbacaTi7j3nXWdfu36YJjCuHDPoXUw9aa5Jrp2ReIAY0PyevGM7z5Gfnpju23YofLEq0s/zPgFl3rmxOZ/6Hmf33sfj82fVvHv2HSdv/k4xPe8+aP37/zZ9zeucb/Jkd7m8p/pWsonG8v4YK39+zpJ1pMtAW4JXUXIuBkR2UqOOPsYqGu3GS3+CtW5N3yFOTd8JWF9L5+b8voANSabfKmnN02EPDka7iom5cP9SLGbUD60TkhcUdf1cH94Xvvd20KR2AjarN3VXDMeJnuQNv4+1++uI9DGCcCOLNqyl5teW8ntM9tvgmhp5rJSJoWXxebLKira37gNWyoa8BLG5ezIRxm/BOymDsHi1Yw7mJ/xi9j2Zltzn/doE0TLpqm2era0pd4fpp80h3KetD4ZeEpe8+/78/dfTFjXL8fXPLOn+Xc2MK6ppKk68ZtBrrQOv/PczX3Ma0MujpdNtPwWEYkYlmyzn/dIsXtl3eJ9gd+7/h7b5tfef3Ob59nYH9b0zDVEjPB65FSKzWBGRbY2f1j5a9u9org53L30y8lgdEHrOyv9YvqRlJgCCqSGDAkR8ubQZHzaLKOAFA/3QDDI/d5HAFhv2Zexz48cZ6/cj3CPF61RRXvJhCKGzc4FKL/4t32hytGyjfkZv+CiisQTY5X1Ac5+cD63/mcVXRU9MVhe3/m72b+1Yhd9aQ5I09C1cA+ELY6VFv27g40EwhajJbEZxDICFc0195ZdC6M+3FDW5vKWvv33zxJq5tEeM9Hff8QyFNQ1h/aXXIkfeqFg8+9p77aVfLDGrjGf4lobW75g7WbOd33G1sxL+DzjZwmPnxG8MWF+dmQS06wi3si4jfNdzR9iU1xr8Ab2ctEjnwMQwJfwuFrTPKzAlZ53ya3bwPrddYwNb2SzayiNZLLODGOMtbX520mgNnaOZGvmJdzreSz2HC4Ttsds38eNrs+fMBhX/+ZvrBFvDk1ouCtbSof7kmdujtX0fEMncX7gLq4J2bVOc4DhHopYrCqNXrFp+KS4ZWAa3sm4GYCptYmXs0fH7P58f/rBS8KPTpm9Zg8FUs0GawiNJgNXY9fCPRi2ONllN6WssEYCYOp28b+z1jLRlfht5kNrAlTbvURW76zhPqcJpmV5r3yqc+Oz1/nD5EpzGOVJPYu27GX0LbNYtGUvS7ZVcYJsotzk8lz4TIZI4r7lBZubi96c8xFXO+PCj3Y1fygtW7OOh3wPAzBImmv03w3cxkfWBG4NXQnAb0JXsMY0Dw8wxfmAyKGRF3138/W19gdBFn7Gukp5MnwOsyMn2q9hjeHx8Ne5I3QZANW7t3Hug/M43rWZ1YwBYJ01jCOkEnf0q16gDssysd403/N8GHttl4kQoeOhNMq8zUMyRLy9aTLaLKNsKR3uTfnjYtPXn3U0K8xo/GRQYXKx6nbt13NmEOQY2UowYrGxrI4vuVaxKuMqPpj1MgBewvy3+w0mSXPt1bSItmjT7MFsm29+rWg/8V2Umv6sMiMYuuv9LvUWCoYtxrpK2WX6cl/4ewA07S1lzroyLnR9mrDtUmsMEmqESIhv/OUTdtbYA1at2lnLipJqAE6WtVzhfof3
VnXuGOTSQLXJBuB6z6vM32CfsP2kuIJQxKKv1FJu8tlmBtBX6nni3QWxx/YPNYf40MiO2O+kDw12EwVwm/c5AMpMXmzbo/xPsdAcDcBzka8xwv88z0ams84aFtvmEs9cCqWMy9wfAJBVvx2Ac90LAdhkBlNi+gNQTQ53hy9jtmWH/WdfLOcrruX0kzq+8o3LOOeYI1hnmp+7yfgw/lqW7ajmz96HW/1O7HDv+M+z0tc8jo1k5tJgebXmroAUD/e6EdP5Q+i7TPA/ljCAWLnJw9Tu2ccj23en5ynezrgFU7eHmsYQp7uWkSN+nvD+ERcWZ7mKuNH7Iq9l/C72mJbhHm1rD1uGivoAd7y5uvNjvpuEHx3yhyMMoZyjXCUsto7i6fDZ5ATLoHSJ/TzGsHFP+xfL2OW16EcNFSY3Ntpg07oPAMNxri08Gz6TEtOf20MzqMdpfgjUxbrxjZPtZIerOf/hTxmS14uHfX/hdu+/uPe5t1v1FY93iqzlJs8L5EsdO5zXPcm1AU+Z063SGC59fCF9pY4mbx4fWRMAKP74pdhz5EXsD4Jl1ijGiN2VMhixyJVGyk2fhNc7K3Afb0amcHnwRgL4+NrRA1uVqci5IC7qk4zrudFrt/PXOU0vY2QnYePihcgZ7JYBALicI1bufID83vsET/r+SEAyyZ9wHn+/7EQa8porIztNPyRYxzuffcE3nA+LeJ2tuYe92c0zGbnUmwyM1twVKR7uZx1XyN8iF1BDTkK4l5m8/eotA81ttZ7qzTQEI+SL3QacJQEucs/nQvenrR7jM34INQ+56g/ZQR6KWNzx5hr++elWPlzfuTborvZTrw+E+arbPgcwyzol1mvoi8WfsKq0hpE3z2L6A/PjmphaC0Ys+kodlaYPkbyRrLGGs2HRbAqoIVca2WAKmRZ4iKcjZyeEO0AmAd7NuImlmT9mmmslBTk+Bkg1YF91urOdm2/k0sC/M+7ix543Odq1gzJv89C/12+6mgya+633pZYjR43khElfYps1gNNdy2Lr+kXspq/PrGMplAoyCOIP2dc+1BIXfEA1vflZ6DrmOx8Sp48roKVy8jnJ/zdO8D/aat0oSrjM/T5XumdR6hnK89d8icZsu1kkGvwBfFwXvDb2GDn7bvBkAFDv7RdbHu26G998VGFyWb6jmnW7a3HRuXDfsbe5li4ZvfGTYX+zSpGhn9XBk9LhnuXzsOHur7Pst9MZM8DuTTB1VD/2mHykvus19+NkMyNc9uM8VcU0BMKxKxwB/s/7GNPdS3gtMo2fBK8D4NrgdXhNCJY9G9vOrrkbpgfnsnKFXYOODuXakfga/uby5svxy+r8/O+stYRbNPU0BiKMk+00SRbfmf4VGnsNotb0YtuyObz5txvZkHEZ6zMup6aidf/wqFDYop/UcuyRozj7mCNYZ4YyzLWHcS67GWKTGQzAyP7Z1JksAPZU2EF6n/cfsef5lvtjCoPNfdxHya527+l6g+elhPnGXkfwQWRibD7PObHqI2S3s/cZisstLDejGe+y2/wjlqHA7KXW1Yc11nBcYhgn2+0L26SRWpPFeYF7KLKOZNExt7Uqg8cl/Ouq1lczl5NHNb3bLPdd3qfwSYRadz5TRvVjsXsSd4YuY+Woq7j/4gl85cgC3rBO5fPIeFZbw/GdcnXssRne5rDeZeygj55DWGcNpb/U8su/vcQ5D37c6Zr7pvIGtlj2NxBXZk6sKYqwfx+PUoeDlA53sEMzL8tHXpaPrfeex39NGkIZebgaysDqWlfEU13NvVt6716EaahgimsNb0cSA+CXoZ8wy5rCCP/zvG2dQoOrN+xqvkIzELY417WQ+31/527PkwhWp5tZAuEI42Url225idsf+AtPfbqF7z76OSffM4dH52/mk+IKXirawS3/WQnAS4u3ca57IbWDpnLtGWOZMCyfTWYI/+X+lJu9L+CTCBkSpv+O1mOYR4VCAY5gLxn9huN2CdvNAAaxl+s9rwKw
0bLbde+64NhYzf3hd5dylXsWF7jtHiULrXF8y/0Jv6j+39jz3up9nqItlfzr862tvjnEn9gEsLIKuDr0K14MfxWAPs6J8rFSgk8iuAdPIBC2WGMNt68sbarCH4owUPYSzBpI/1HHAzAz47c0+v3kU081Oaw2I/l28Hec/J3/Yeu957H13vP4xvGDAHC7XJw2toAvbpvOQ9+fyJs/nZZQpvtD345N3x6awRJrbGx+fuYZAAQlgycjX2fyCRP51qRCHr7E/oC6NHQLl7nuS+gjmuFpDuud2OFeKHaz0v1h+7V+77UvrhITISKd+/O8NHgrfwufT7DPSLufO+hJVZX64d5ShsdFmcmz72TTWEkwbDHiprd5/OOOb5M2Wnay2+Sz0BrHwK0zOXbPTNxieDYyfR+PEmo9faGpim2VDViWIRAKcYv3eQCmuVezJfMHjPr8lk6V3zRW8aLvLqa7lzDD/R6/e3M1A7e9xTzfL1ib8UPGvH0xd72ygOcXbqe0uomP5s+ln9RR0v80AI4ZnMtfwhcyP3Icz4dP57uB29hp+lKw+I/U1diBGgxbCfcE9dXvxCMWkj+SpmCEbdZAXGI40bWR58NnUEY+YF/uHj0pme8vYZLLPql8V+gHbLLs2v1o1y52m3zWWHavk5sXT2X7W/fx0F8fYORNb7Joi10GL2F2m/xYGfz5do+St6yp9uM8z3Psnpmxq0w9hRNpCkZYaezePKyZSVMowhFShb/XQPZmjYk9V//XvstAqaKiRZt77Ig5getcd0XfbB/nTxjMcYWJ2z8U+VZs+vnImfRymopuD83gg8yvJWyb6dTKs3z2WDA//upY5t+c+L6J//a2w9ht9ePF/na03BrN/MhxDHa+KbpNuFM1d4Cd9OcP4e/RK8Nrd4UEHTxMpV+4+9yu2FfeeQuLuO/tFfSjhv+dtZpnF2yLXRZuWYbGYJiZy+yR+rZWNDDGtZNN1mB+43SNG797JgCrreFcFbwBgD+ELo691qA+mQA0unNprK3gjP+bw98/KqZ081oKpYJt1oDYtsO3vsxfnn2Z61+0RylcuLmSuevsJiBjTGz8k3fnzY1dZPM191K2Zl7KQ76HyRE/280ACmuXsjLzatZnzKDggSE85/s9AeNh5EnnAPCzM8Zyzrd+yOWhm/kd/4/7b7yWO0KX01fqWf3Bv9hd4+fOt1Yz7b551PpDGGPIrLMDxtVvBDurm1hhRsXK/Z51Umx67MDebDRDKDN5TK/7D19zL+XVyDSeiJxrd5F05FHPxcHb+CRyDGDX4B/zPcCyjGsoffIHXHfLrZzuXh47efuZOY7QiDMBqHF6zZzuXs5Zm+7hDu/T7LAK8PUfxbbKRj63jmGxdSS1797Frmo/Q6QCf69B7KhuYqz/Gd6ITCWvbCG50kiV07Qyqn9i23tH3Uzjz99cFLidx8LnEcLDneHLeC8ymeciZzZfWepsmul1xR679d7z+PU548jJSBz0qzEY5puBu3k1chrz5GRCxs109xKqTA57yWWDKWSoq5xfe15kSu27nQ73qEyPm0ZjvydbXq17oPcXjr5HD+R5DvY9jtsq34GUubvKG4pYvLViZ+c7VXSTlL/NXks+j4ttxm6DPP3j73M6cJvzfuddePOdaeQMn8R7O3sxwb+ITAny+qtuIsbFdz3FPB2ezmZjf20f6dpDielPLTnMsU5khN+ujc+67jRmLi/l52eOZdJds9lc72N002cszVhG1od2COOC28M/5Gr32yy2xvFTz+v8rPhqKkwuS+8exaymCZzrXsjb2WNZUZvDKNmFAR5yfwYC/wp/jcs8H9BkfDwcvpBHIudjIdzpeYrvuedSQzYDpJpNVj/6X/h7Coba3foyvW4unjyUs8YPRETwuoX3rJPYbfKZsvK3rFj+T463hvFXbxOb/nAPH/b6Gl+umwUucPcfxTcnuLl+XRmn+v/MXYM/557v/zfT/tR8Mc/t3zyWB2ddFGs+WOo0VbxvncQY
/zO85rudlyNfoZ4sfhC6le9a8/i+ey4ZhDAIZ7mK+C/npPQ2M5Ar/f/D4IFH8N/O+ClbzREss0bxVmQqv3G6MK4oOI+hLheXnDKM37xey9uRKZwUeoa+/5hIvtRTkjuKmr0hQni4K/QDznfbFxptsY7gpBH5PHv1KQnvkcJ8u2lpSxv3vl3+27MQFxz/u/cBWGKOYknYvuPRAms8C6zxALic2n/0Z3yTS3vK6gKUmFEEv/k3Kl9byXLXaCbLBl6PnEoID3udOyn9xPMGAGJ1PNLmxZMLeanIvlo2y+eOvfc3F73P71Z/wdT+fjZt2sAU11p8Ph8FffPZkzcRty+LyvLd5LqasEJ+6murkb4jweVhd3klfaUWn+VnV+7x+MQiq2wJ/ailmhw2m0FkZWUzemA+Rw3pSzh7IM9+upHp2ZuRQD2RIZOZu6aU0ZRwTH6E2ozBDBo4gLeKg4y2tjCit0Xp3nrKTD5B4yarVyZBywWNe/FJmCy3hU8ijMxzk5eby9bMo8npNxiPW/hiWzW9fcLOXSXU1lQxKrMBd6CaSpPLQKmiFwHKfIX0dfvJlBCljS4Ge+rIzhvA+hoX4woHMHTssby2NZNBgS30l1rW7api/KjhlNf6CZQup970wiDkuEPkDxlDbv5AAqEwRw7pR2ZWbxZsq8UbquOZDR4mmnUgLrJDlRhg8rgRuPJHULRkMSce4cIqGE/ZF29ximst75vBWMNP44utlfTNiFCYn0lhcBu9TpnBcaee1+Gx7qq0C/cxA3LYZgZSbA2mkQx2mX6c6NrAWmsYx7q2cgaLyd7+CacD9e5MKkwfCqSaXgR5J3ISI86/mchru3knchLHuzbz8eCrefDkE7j+38tirzF+cG7sXpsXnjCEoi+O5KvuZaw1w6gwuZzsWs8yazRDJ36NJ+qnM299Oce6tjLdvYTV1gi+FFrJRO8ySkx/jm/czHnexBENNzCcO8KXc1v4Cv7faaO46dyj+ZUIxhjeXjmJKa8tZWB+Lj+cOpSC3F4cPa51l768rOYrKM8cN5CbNvyIOzxPMVZKOd6zhVrTi1yriYkNq8EF281AhuYN4cK+bk4e2Zc568o4dfJlZHjcHDM4NzZA2A9PHclrvut4YuZOhskeXJMuh8V2f/Zbv3k85795j11Tdq7m/XfkdJb0+ybfmjQEj0uYMetzhko5HiJsMUdQSw7fO2oABTl2W3EdWVwYvBuA3tLIRClm9Ln2yesfTBnO6eMG8F/3VnGh+xOOkCpqTRbBwilM8/Znc0UD5eRxT+gSdpu+HH/2DB78SmLXRoArp42kaFsV35rY+p6sfbJa35Aa4NghuawqtX8Hp43tz6Wn2H3Wxx3Rm+Ky+n0ORxyV4TTLnDg8nzPGDeC363/IFe53ednY7ffRSsUDoYsY6yrBNWwqgzp4zj98ewLXfHk0TcEIIwuy2WiGUGOyGLX4dp4B2A54odL0JhJ2k1vWQGb5y20/WVt9EKrs8y4Bt4dKculHLRkShhBQ4vwDTgEI2Fcwuza8zIUeZ7rOQB1QAVOdp/RXesmUkP2tR+zHgV1OgJBxEzZuQlVuMqpCHC/N12x8Ob5sXiBCLMUsI/YQGhZgQcQIbo+h1vQiu8rPeWJgB7ADjmu5n85lK5ZbYsNwALDL+Re3zVHO7CXQ/DUw+rZx+hOcHffYgNvDKjOSqa419CtZyPkep9wVUEkeW/ee3rI03UIOxlclETkH+DPgBh43xty7r+0nT55sioo6d0VjZ5RUNca6I85Zu4ddNX6OHNibiDGE6irI9+/AZSKcePKX2Rv2Ut/YRF+fYcgRBfTO9LK5vB6v24UI9M/JiLWnVjv338zPbg7OhkCYLRUNHDM4FxHBH4qwsrSG44b0iT1uc3k91Y1BPixawfHjxvGvt97n3OGGMad8nSyvi5c+WUVGr1zWlPmp3r6C+3/yHcYM6td6x/ZTxDLMeHIRQ/v24uzxA1m2bDGuPkMpLtnJhYWNDBl5FN6+
wxg1oO2bQzcGw9T7wwzItb8CWZZhyfYqhvfNYkBuJjVNIXbsbeTYIX3YuKeOEf2zWb6jmsF5vTDYg3u1ZIxhRUkNvXxuhvfLwutysaK0Bo9L6OVzM6hPZsJrxnv8481k+TycNrY/wYjFyH7ZhC3D9r0NvLhoBz89Ywy1TWEG52Xice9fy+OnxRU8u2AbU0f347SxBYzsn00wbFFeH0jYn+rGIA/PLeZ/zj4qdrzb89mmClaX1vKjL9vNXhHLsLWygdEFOZTXBfjDu+v4zpFuxh05lrqA1ebvrSNz1+1hYVERo2sXsG5PE7tCWfzo9KM55isXUdkYYenmXWz4Yj5fHV9IXr8C9kay6J2Tw4rdTbzyzmz+37ShfFGVxYwvj+O1lXvZsGQOP5s+nszhJxIwPmav2EKBu4FRfTMYmO1me1kVGzeuYcSAfMZNPI1/LtrJ1NxKcrN64R04Fl9mNibYwBvzi5iUU8ki1wQunTaORz9czzeO6U/fDKhpaMLlr8KV3R965fPKF6V84/jBTCjsw0drSiletYCJA9y4RPhsUwWF+VlU19Ux+uhJjBk1iqqQF9NUTcTXm/mrdzC6n4/JRw5lWUktazdv49KvnkCDP4gr4mf11t2sXTKPcMVmzp46CRk0ga01YXZvWcO3pxzFdu9ICNZhWcLK3fVkBys5KjeEuH1EQgHWbd9NtifCxr1hIrtWUTjhTL7YE+KU4X0YPWo0eyvLqNi6hqOPOZ4PtzYyNaeM8ROnsqK6FybkJ1i+heXlYaaNG8qQvtkMHHhEl49xPBFZYoyZ3Oa67g53EXEDG4Dp2J/ri4HvG2Pavn8Z3R/uSil1ONhXuB+ME6onA8XGmM3GmCDwInDBQXgdpZRS7TgY4T4Eu2UrqsRZlkBErhGRIhEpKi/fvxtrKKWUaluPdYU0xjxmjJlsjJlcUND6MnCllFL772CEeykwNG6+0FmmlFLqEDkY4b4YGCsiI0XEB3wPeOMgvI5SSql2dHs/d2NMWER+CryH3RXySWNM5+8Zp5RS6oAdlIuYjDGzgFkH47mVUkp1LO3GllFKKXWQrlDtciFEyoFt+/nw/kDXbhqa+nSfDw+6z4eHA9nn4caYNrsbJkW4HwgRKWrvCq10pft8eNB9PjwcrH3WZhmllEpDGu5KKZWG0iHcH+vpAvQA3efDg+7z4eGg7HPKt7krpZRqLR1q7koppVrQcFdKqTSU0uEuIueIyHoRKRaRm3q6PN1FRIaKyDwRWSMiq0Xk587yviIyW0Q2Oj/zneUiIg85v4cVIjKpZ/dg/4iIW0SWishbzvxIEVno7Ne/nbGKEJEMZ77YWT+iRwu+n0QkT0ReEZF1IrJWRKYeBsf4F857epWIvCAimel4nEXkSREpE5FVccu6fGxFZIaz/UYRmdGVMqRsuDt3fPor8HVgPPB9ERnfs6XqNmHgBmPMeGAKcK2zbzcBc4wxY4E5zjzYv4Oxzr9rgEcOfZG7xc+BtXHz9wEPGGPGAFXAVc7yq4AqZ/kDznap6M/Au8aYccAE7H1P22MsIkOA64DJxphjscee+h7peZyfAs5psaxLx1ZE+gK3Y9+i9mTg9ugHQqcYY1LyH/b9dt+Lm78ZuLmny3WQ9nUm9m0L1wODnGWDgPXO9KPYtzKMbh/bLlX+YQ8NPQc4A3gL+9bDFYCn5fHGHpRuqjPtcbaTnt6HLu5vH2BLy3Kn+TGO3sinr3Pc3sK+l3RaHmdgBLBqf48t8H3g0bjlCdt19C9la+508o5Pqc75KjoRWAgMNMZE78W+GxjoTKfD7+JB4NfY964H6AdUG2PCznz8PsX211lf42yfSkYC5cA/naaox0UkmzQ+xsaYUuCPwHZgF/ZxW0J6H+d4XT22B3TMUznc056I5ACvAtcbY2rj1xn7ozwt+rGKyDeAMmPMkp4uyyHkASYBjxhjJgINNH9NB9LrGAM4TQoXYH+wDQayad10cVg4FMc2lcM9re/4JCJe7GB/zhjz
mrN4j4gMctYPAsqc5an+uzgVOF9EtmLfUP0M7PboPBGJDksdv0+x/XXW9wEqD2WBu0EJUGKMWejMv4Id9ul6jAG+BmwxxpQbY0LAa9jHPp2Pc7yuHtsDOuapHO5pe8cnERHgCWCtMeb+uFVvANEz5jOw2+Kjyy93zrpPAWrivv4lPWPMzcaYQmPMCOzjONcYcykwD/i2s1nL/Y3+Hr7tbJ9SNVxjzG5gh4gc5Sw6E1hDmh5jx3ZgiohkOe/x6D6n7XFuoavH9j3gLBHJd771nOUs65yePulwgCcszgU2AJuAW3u6PN24X9Owv7KtAJY5/87Fbm+cA2wEPgD6OtsLds+hTcBK7N4IPb4f+7nvXwXecqZHAYuAYuBlIMNZnunMFzvrR/V0ufdzX08Aipzj/DqQn+7HGLgDWAesAv4FZKTjcQZewD6vEML+lnbV/hxb4Epn/4uBK7pSBh1+QCml0lAqN8sopZRqh4a7UkqlIQ13pZRKQxruSimVhjTclVIqDWm4K6VUGtJwV0qpNPT/Ad4j+U90umNiAAAAAElFTkSuQmCC\n",
      "text/plain": [
       "<Figure size 432x288 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "# Generate recent 50 interval average\n",
    "average_reward = []\n",
    "for idx in range(len(rewards)):\n",
    "    avg_list = np.empty(shape=(1,), dtype=int)\n",
    "    if idx < 5:\n",
    "        avg_list = rewards[:idx+1]\n",
    "    else:\n",
    "        avg_list = rewards[idx-4:idx+1]\n",
    "    average_reward.append(np.average(avg_list))\n",
    "plt.plot(rewards)\n",
    "plt.plot(average_reward)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9f18bae5",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "44b0354e",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "58e2db1b",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8385f8b3",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c1d27da3",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "fb4df6e4",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
