{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "67576132",
   "metadata": {},
   "outputs": [],
   "source": [
    "from math import inf\n",
    "import numpy as np\n",
    "import scipy\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "import torch.optim as optim\n",
    "import gymnasium as gym\n",
    "import pandas as pd\n",
    "from datetime import datetime\n",
    "from sklearn.base import BaseEstimator\n",
    "from realkd.boosting import WeightUpdateMethod\n",
    "from pandas import qcut\n",
    "from realkd.rules import SquaredLoss, AdditiveRuleEnsemble, Rule\n",
    "from realkd.search import Context\n",
    "\n",
    "import warnings"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "8b8f01e2",
   "metadata": {},
   "outputs": [],
   "source": [
    "# warnings.filterwarnings('ignore')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "db545637",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n"
     ]
    }
   ],
   "source": [
    "env = gym.make('CartPole-v1', render_mode='rgb_array')\n",
    "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "print(device)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "7aa6c889",
   "metadata": {},
   "outputs": [],
   "source": [
    "column_names = ['cp', 'cv', 'pa', 'pav']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "24f75485",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<torch._C.Generator at 0x7f33da341410>"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.random.seed(753894)\n",
    "torch.manual_seed(3921840)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "84732b72",
   "metadata": {},
   "outputs": [],
   "source": [
    "def orthonormalization(Q):\n",
    "    n, k = Q.shape\n",
    "    O = np.zeros(shape=(n, k))\n",
    "    q = Q[:, 0]\n",
    "    O[:, 0] = q / (norm(q) + 1e-6)\n",
    "    for i in range(1, k):\n",
    "        O_i = O[:, :i]\n",
    "        q = Q[:, i]\n",
    "        q_orth = q - O_i.dot(O_i.T.dot(q))\n",
    "        O[:, i] = q_orth / (norm(q_orth) + 1e-6)\n",
    "    return O"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "973f1f9b",
   "metadata": {},
   "outputs": [],
   "source": [
    "def softmax1(action, values, other_values, location):\n",
    "    all_values = np.insert(other_values, location, values, axis=1)\n",
    "    exps = np.exp(all_values)\n",
    "    res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
    "    return res\n",
    "\n",
    "def norm(x):\n",
    "    \"\"\"\n",
    "    Calculate the L-2 norm of a vector\n",
    "    :param x: the vector whose L-2 norm is to be calculated\n",
    "    :return: the L-2 norm of the vector\n",
    "    \"\"\"\n",
    "    return (x * x).sum() ** 0.5\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "5b0af6ac",
   "metadata": {},
   "outputs": [],
   "source": [
    "class PiLoss:\n",
    "    _instance = None\n",
    "\n",
    "    def __new__(cls):\n",
    "        if cls._instance is None:\n",
    "            cls._instance = super(PiLoss, cls).__new__(cls)\n",
    "        return cls._instance\n",
    "\n",
    "    @staticmethod\n",
    "    def __call__(action, values, advantage, other_values, current):\n",
    "        \"\"\"\n",
    "        :param action: the action chosen\n",
    "        :param values: the values provided by current model\n",
    "        :param other_values: the output by other models\n",
    "        :param current: the action represented by the current model\n",
    "        \"\"\"\n",
    "        sm = softmax1(action, values, other_values, current)+1e-6\n",
    "        return -np.log(sm) * advantage\n",
    "\n",
    "    @staticmethod\n",
    "    def g(action, values, advantage, other_values, current):\n",
    "        return np.where(action == current, -advantage * (1 - softmax1(current, values, other_values, current)),\n",
    "                        advantage * softmax1(current, values, other_values, current))\n",
    "\n",
    "    @staticmethod\n",
    "    def h(action, values, advantage, other_values, current):\n",
    "        sm = softmax1(current, values, other_values, current)\n",
    "        return advantage * sm * (1 - sm)\n",
    "\n",
    "    @staticmethod\n",
    "    def __repr__():\n",
    "        return 'pi_loss'\n",
    "\n",
    "    @staticmethod\n",
    "    def __str__():\n",
    "        return 'pi_loss'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "67942365",
   "metadata": {},
   "outputs": [],
   "source": [
    "loss_functions = {\n",
    "    'pi_loss': PiLoss()\n",
    "}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "693287f4",
   "metadata": {},
   "outputs": [],
   "source": [
    "def loss_function(loss):\n",
    "    \"\"\"Provides loss functions from string representation.\n",
    "\n",
    "    :param loss: string identifier of loss function loss function\n",
    "    :return: loss function matching corresponding to input string (or unchanged input if was already loss function)\n",
    "    \"\"\"\n",
    "    if callable(loss):\n",
    "        return loss\n",
    "    else:\n",
    "        return loss_functions[loss]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "ae0af97c",
   "metadata": {},
   "outputs": [],
   "source": [
    "def calc_risk(loss, action, rules, states, reg, advantage, others, current):\n",
    "    weights = np.array([rule.y for rule in rules])\n",
    "    risk = sum(loss(action, rules(states), advantage, others, current)) + reg * sum(weights * weights) / 2\n",
    "    return risk"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "d06dc96b",
   "metadata": {},
   "outputs": [],
   "source": [
    "class FullyCorrectiveA2C:\n",
    "    def __init__(self, loss='pi_loss', reg=1.0, solver='L-BFGS-B'):\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        self.solver = solver\n",
    "\n",
    "    @staticmethod\n",
    "    def get_risk(loss, action, q_mat, reg, advantage, others, current):\n",
    "        def sum_loss(weights):\n",
    "            return sum(loss(action, q_mat.dot(weights), advantage, others, current)) + reg * sum(weights * weights) / 2\n",
    "\n",
    "        return sum_loss\n",
    "\n",
    "    @staticmethod\n",
    "    def get_gradient(g, action, q_mat, reg, advantage, other, current):\n",
    "        def gradient(weights):\n",
    "            grad_vec = g(action, q_mat.dot(weights), advantage, other, current)\n",
    "            return q_mat.T.dot(grad_vec) + reg * weights\n",
    "\n",
    "        return gradient\n",
    "\n",
    "    @staticmethod\n",
    "    def get_hessian(h, action, q_mat, reg, advantage, other, current):\n",
    "        def hessian(weights):\n",
    "            h_vec = h(action, q_mat.dot(weights), advantage, other, current)\n",
    "            return q_mat.T.dot(np.diag(h_vec)).dot(q_mat) + np.diag([reg] * len(weights))\n",
    "\n",
    "        return hessian\n",
    "\n",
    "    def calc_weight(self, data, action, rules, advantage, other, current):\n",
    "        g = self.loss.g\n",
    "        h = self.loss.h\n",
    "        loss = self.loss\n",
    "        y = np.array(action)\n",
    "        q_mat = np.column_stack(\n",
    "            [rules[i].q(data) + np.zeros(len(data)) for i in range(len(rules))])\n",
    "        sum_loss = self.get_risk(loss, y, q_mat, self.reg, advantage, other, current)\n",
    "        gradient = self.get_gradient(g, y, q_mat, self.reg, advantage, other, current)\n",
    "        hessian = self.get_hessian(h, y, q_mat, self.reg, advantage, other, current)\n",
    "        if self.solver == 'GD':  # Gradient descent\n",
    "            w = np.array([r.y for r in rules])\n",
    "            old_w = np.ones_like(w) * (1.0 if len(w) - sum(w) > 1e-5 else 2.0)\n",
    "            i = 0\n",
    "            while norm(old_w - w) > 1e-3 and i < 50:\n",
    "                old_w = np.array(w)\n",
    "                if norm(gradient(w)) == 0:\n",
    "                    break\n",
    "                p = -gradient(w) / norm(gradient(w))\n",
    "                w += GoldenRatioSearch(sum_loss, old_w, p, gradient).run() * p\n",
    "                i += 1\n",
    "        elif self.solver == 'Line':\n",
    "            w = np.array([r.y for r in rules])\n",
    "            if norm(gradient(w)) != 0:\n",
    "                p = -gradient(w) / norm(gradient(w))\n",
    "                distance = GoldenRatioSearch(sum_loss, w, p, gradient).run()\n",
    "                w += distance * p\n",
    "        else:\n",
    "            w = np.array([r.y for r in rules])\n",
    "            w = scipy.optimize.minimize(sum_loss, w, method=self.solver, jac=gradient,  # hess=hessian,\n",
    "                                        options={'disp': False}).x\n",
    "\n",
    "        return w"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "2d0c04a8",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ObjectFunction:\n",
    "    def __init__(self, data, target, predictions, loss, reg, advantage, other_values, current, rules=None):\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        predictions = np.zeros_like(\n",
    "            target) if predictions is None else predictions\n",
    "        g = np.array(self.loss.g(target, predictions, advantage, other_values, current))\n",
    "        h = np.array(self.loss.h(target, predictions, advantage, other_values, current)) + 1e-6\n",
    "        r = g / h\n",
    "        order = np.argsort(r)[::-1]\n",
    "        self.g = g[order]\n",
    "        self.h = h[order]\n",
    "        self.data = data.iloc[order].reset_index(drop=True)\n",
    "        self.target = target.iloc[order].reset_index(drop=True)\n",
    "        self.n = len(target)\n",
    "\n",
    "    def __call__(self, ext):\n",
    "        raise NotImplementedError()\n",
    "\n",
    "    def bound(self, ext):\n",
    "        raise NotImplementedError()\n",
    "\n",
    "    def search(self, method='greedy', verbose=False, **search_params):\n",
    "        from realkd.search import search_methods\n",
    "        ctx = Context.from_df(self.data, **search_params)\n",
    "        if verbose >= 2:\n",
    "            print(\n",
    "                f'Created search context with {len(ctx.attributes)} attributes')\n",
    "        return search_methods[method](ctx, self, self.bound, verbose=verbose, **search_params).run()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "eaec4413",
   "metadata": {},
   "outputs": [],
   "source": [
    "class OrthogonalBoostingObjective(ObjectFunction):\n",
    "    def __init__(self, data, target, advantage, other_values, current, predictions=None, loss=SquaredLoss, reg=1.0,\n",
    "                 rules=None,\n",
    "                 epsilon=1e-4, **kwargs):\n",
    "        super().__init__(data, target, predictions, loss, reg, advantage, other_values, current, rules)\n",
    "        self.rules = [] if rules is None else rules\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        self.epsilon = epsilon\n",
    "        predictions = np.zeros_like(\n",
    "            target) if predictions is None else predictions\n",
    "        g = np.array(self.loss.g(target, predictions, advantage, other_values, current))\n",
    "        self.n = len(target)\n",
    "        r = g\n",
    "        order = np.argsort(r)[::-1]\n",
    "        self.g = g[order]\n",
    "        self.data = data.iloc[order].reset_index(drop=True)\n",
    "        self.target = target.iloc[order].reset_index(drop=True)\n",
    "        if len(rules) != 0:\n",
    "            orth_basis = kwargs['orth_basis']\n",
    "            self.orth_basis = orth_basis[order]\n",
    "            self.g = self.g - self.orth_basis @ self.orth_basis.T @ self.g\n",
    "        else:\n",
    "            self.orth_basis = np.zeros(self.n)\n",
    "\n",
    "    def __call__(self, ext):\n",
    "        if len(ext) == 0:\n",
    "            return -inf\n",
    "        g_q = self.g[ext]\n",
    "        if len(self.rules) == 0:\n",
    "            h_q = self.h[ext]\n",
    "            return abs(g_q.sum()) / np.sqrt(h_q.sum())\n",
    "        length = self.fast_orth_norm(ext)\n",
    "        if length > 1e-4:\n",
    "            obj = abs(g_q.sum()) / (length + self.epsilon)\n",
    "        else:\n",
    "            obj = 0\n",
    "        return obj\n",
    "\n",
    "    def fast_orth_norm(self, ext):\n",
    "        deltas = self.orth_basis[ext]\n",
    "        length = len(ext)\n",
    "        okqi = abs(np.sum(deltas, axis=0))\n",
    "        q_para_norms = (okqi ** 2).sum()\n",
    "        q_orth_norms_sq = np.abs(length - q_para_norms)\n",
    "        return np.sqrt(q_orth_norms_sq)\n",
    "\n",
    "    def fast_para_norms_prefix(self, ext):\n",
    "        deltas = self.orth_basis[ext]\n",
    "        length = len(ext)\n",
    "        okqi = np.cumsum(deltas, axis=0)\n",
    "        q_para_norms = (okqi ** 2).sum(axis=1)\n",
    "        q_orth_norms_sq = np.abs(np.arange(1, length + 1) - q_para_norms)\n",
    "        q_orth_norms = np.sqrt(q_orth_norms_sq)\n",
    "        return q_orth_norms\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "626cceb7",
   "metadata": {},
   "outputs": [],
   "source": [
    "class GeneralRuleBoostingEstimator(BaseEstimator):\n",
    "    def __init__(self, num_rules, objective_function, weight_update_method, loss='squared', reg=1.0,\n",
    "                 search='greedy', max_col_attr=10,\n",
    "                 search_params=None, verbose=False):\n",
    "        if search_params is None:\n",
    "            search_params = {'order': 'bestboundfirst', 'apx': 1.0, 'max_depth': None, 'discretization': qcut,\n",
    "                             'max_col_attr': max_col_attr}\n",
    "        self.num_rules = num_rules\n",
    "        self.num_components = 500\n",
    "        self.objective = objective_function\n",
    "        self.objective_function = objective_function\n",
    "        self.max_col_attr = max_col_attr\n",
    "        self.weight_update_method = weight_update_method\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        self.weight_update_method.loss = loss\n",
    "        self.weight_update_method.reg = reg\n",
    "        self.verbose = verbose\n",
    "        self.search = search\n",
    "        self.rules_ = AdditiveRuleEnsemble([])\n",
    "        self.search_params = search_params\n",
    "        self.history = []\n",
    "        self.time = []\n",
    "\n",
    "    def set_reg(self, reg):\n",
    "        self.reg = reg\n",
    "        self.objective.reg = reg\n",
    "        self.weight_update_method.reg = reg\n",
    "\n",
    "    def fit(self, data, target, advantage, other_values, current, has_origin_rules=False, verbose=False):\n",
    "        if not has_origin_rules:\n",
    "            self.history = []\n",
    "            self.time = []\n",
    "            self.rules_.members = []\n",
    "            orth_basis = np.array([])\n",
    "        else:\n",
    "            q_mat = np.column_stack(\n",
    "                [self.rules_[i].q(data) + np.zeros(len(data)) for i in range(len(self.rules_))])\n",
    "            orth_basis = orthonormalization(q_mat)\n",
    "        num_components = 0\n",
    "        while len(self.rules_) < self.num_rules and num_components < self.num_components:\n",
    "            start_time = datetime.now()\n",
    "            # Search for a rule\n",
    "            scores = self.rules_(data)\n",
    "            obj = self.objective(data, target, advantage, other_values, current, predictions=scores,\n",
    "                                 loss=self.loss, reg=self.reg, rules=self.rules_, orth_basis=orth_basis)\n",
    "            q = obj.search(method=self.search, verbose=verbose,\n",
    "                           **self.search_params)\n",
    "            if hasattr(self.objective, 'opt_weight') and callable(getattr(self.objective, 'opt_weight')):\n",
    "                y = obj.opt_weight(q)\n",
    "            else:\n",
    "                y = 1.0  # np.random.random()\n",
    "            q_vec = q(data)\n",
    "            num_components += (1 + len(q))\n",
    "            if len(orth_basis) == 0:\n",
    "                basis = q_vec / norm(q_vec)\n",
    "                orth_basis = np.array([basis]).T\n",
    "            else:\n",
    "                basis = q_vec - orth_basis.dot(orth_basis.T.dot(q_vec))\n",
    "                basis = basis / (norm(basis) + 1e-6)\n",
    "                orth_basis = np.hstack((orth_basis, np.array([basis]).T))\n",
    "            rule = Rule(q, y)\n",
    "            if self.verbose:\n",
    "                print(rule)\n",
    "            self.rules_.append(rule)\n",
    "            # Calculate weights\n",
    "            weights = self.weight_update_method.calc_weight(\n",
    "                data, target, self.rules_, advantage, other_values, current)\n",
    "            for i in range(len(self.rules_)):\n",
    "                self.rules_[i].y = weights[i]\n",
    "            self.history.append(AdditiveRuleEnsemble(\n",
    "                [Rule(q=rule.q, y=rule.y) for rule in self.rules_.members]))\n",
    "            end_time = datetime.now()\n",
    "            self.time.append(str(end_time - start_time))\n",
    "        return self\n",
    "\n",
    "    def predict(self, data):\n",
    "        loss = loss_function(self.loss)\n",
    "        return loss.preidictions(self.rules_(data))\n",
    "\n",
    "    def decision_function(self, data):\n",
    "        return self.rules_(data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "b50ce787",
   "metadata": {},
   "outputs": [],
   "source": [
    "# class Actor(nn.Module):\n",
    "#     def __init__(self, action_space, node=16):\n",
    "#         super(Actor, self).__init__()\n",
    "#         self.fc1 = nn.Linear(4, node)  \n",
    "# #         self.fc1_ = nn.Linear(node, node)\n",
    "#         self.fc2 = nn.Linear(node, action_space)\n",
    "\n",
    "#     def forward(self, state):\n",
    "#         x = F.relu(self.fc1(state))\n",
    "# #         x = F.relu(self.fc1_(x))\n",
    "#         x = self.fc2(x)\n",
    "#         return x"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "84b0ee0a",
   "metadata": {},
   "outputs": [],
   "source": [
    "def copy_rules(origin_rules):\n",
    "    rules = []\n",
    "    for n in range(len(origin_rules)):\n",
    "        rule = origin_rules[n]\n",
    "        rules.append(Rule(q=rule.q, y=rule.y))\n",
    "    return AdditiveRuleEnsemble(rules)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "bb3fcc8c",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ActorRule():\n",
    "    def __init__(self, action_space=2, num_rules=5):\n",
    "        self.action_space = action_space\n",
    "        self.model = [GeneralRuleBoostingEstimator(num_rules=num_rules, objective_function=OrthogonalBoostingObjective,\n",
    "                                                   weight_update_method=FullyCorrectiveA2C(), loss=PiLoss(),\n",
    "                                                   reg=0.3, search='greedy', max_col_attr=10, verbose=False) for _ in\n",
    "                      range(action_space)]\n",
    "        self.best_model = [\n",
    "            GeneralRuleBoostingEstimator(num_rules=num_rules, objective_function=OrthogonalBoostingObjective,\n",
    "                                         weight_update_method=FullyCorrectiveA2C(), loss=PiLoss(),\n",
    "                                         reg=0.01, search='greedy', max_col_attr=20, verbose=False) for _ in\n",
    "            range(action_space)]\n",
    "\n",
    "    def __call__(self, state):\n",
    "        res = [self.model[i].rules_(state) for i in range(len(self.model))]\n",
    "        return np.array(res)\n",
    "\n",
    "    def predict(self, state):\n",
    "        res = [self.best_model[i].rules_(state) for i in range(len(self.model))]\n",
    "        return np.array(res)\n",
    "\n",
    "\n",
    "def update_rules(estimator: GeneralRuleBoostingEstimator, x, y, adv, other_values, current):\n",
    "    queries_lst = []\n",
    "    queries = {}\n",
    "    original_rules = copy_rules(estimator.rules_)\n",
    "    origin_risk = calc_risk(PiLoss(), y, original_rules, x, estimator.reg, adv, other_values, current)\n",
    "    for i in range(len(estimator.rules_)):\n",
    "        q_str = str(estimator.rules_[i].q)\n",
    "        if q_str not in queries:\n",
    "            queries[q_str] = estimator.rules_[i].y\n",
    "            queries_lst.append(estimator.rules_[i].q)\n",
    "        else:\n",
    "            queries[q_str] += estimator.rules_[i].y\n",
    "    for k in queries:\n",
    "        queries[k] = abs(queries[k])\n",
    "    min_weight_query = min(queries, key=queries.get)\n",
    "    rules = []\n",
    "    for i in range(len(queries_lst)):\n",
    "        q_str = str(queries_lst[i])\n",
    "        if q_str != min_weight_query:\n",
    "            rules.append(Rule(q=queries_lst[i], y=queries[str(queries_lst[i])]))\n",
    "    if len(rules) == 0:\n",
    "        rules = [Rule(q=queries_lst[0], y=queries[str(queries_lst[0])])]\n",
    "    new_rules = AdditiveRuleEnsemble(rules)\n",
    "    weights = FullyCorrectiveA2C(loss_function('pi_loss'), estimator.reg).calc_weight(x, y, new_rules, adv,\n",
    "                                                                                      other_values, current)\n",
    "    for i in range(len(new_rules)):\n",
    "        new_rules[i].y = weights[i]\n",
    "    estimator.rules_ = new_rules\n",
    "    estimator.fit(x, y, adv, other_values, current, has_origin_rules=True)\n",
    "    weights = FullyCorrectiveA2C(loss_function('pi_loss'), estimator.reg).calc_weight(x, y, estimator.rules_, adv,\n",
    "                                                                                      other_values, current)\n",
    "    for i in range(len(estimator.rules_)):\n",
    "        estimator.rules_[i].y = weights[i]\n",
    "    new_risk = calc_risk(PiLoss(), y, estimator.rules_, x, estimator.reg, adv, other_values, current)\n",
    "    if new_risk > origin_risk:\n",
    "        estimator.rules_ = copy_rules(original_rules)\n",
    "        print(\"origin\", origin_risk, 'new', new_risk, 'not updated')\n",
    "        # risk = sum(PiLoss.__call__(y, estimator.rules_[i].y))\n",
    "    return estimator"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "2824981f",
   "metadata": {},
   "outputs": [],
   "source": [
    "class Critic(nn.Module):\n",
    "    def __init__(self, node=16):\n",
    "        super(Critic, self).__init__()\n",
    "        self.fc1 = nn.Linear(4, node)\n",
    "        self.fc2 = nn.Linear(node, 1)\n",
    "\n",
    "    def forward(self, state):\n",
    "        x = F.relu(self.fc1(state))\n",
    "        x = self.fc2(x)\n",
    "        return x"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "6b6e2dd7",
   "metadata": {},
   "outputs": [],
   "source": [
    "gamma = 0.99\n",
    "actor = ActorRule()\n",
    "critic = Critic().to(device)\n",
    "critic_optimizer = optim.AdamW(critic.parameters(), lr=0.001)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "ae072cc5",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ActorNet(nn.Module):\n",
    "    def __init__(self, hidden_dim=16):\n",
    "        super().__init__()\n",
    "\n",
    "        self.hidden = nn.Linear(4, hidden_dim)\n",
    "        self.output = nn.Linear(hidden_dim, 2)\n",
    "\n",
    "    def forward(self, s):\n",
    "        outs = self.hidden(s)\n",
    "        outs = F.relu(outs)\n",
    "        logits = self.output(outs)\n",
    "        return logits\n",
    "\n",
    "\n",
    "actor_func = ActorNet().to(device)\n",
    "value_func = critic"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "c565d5ef",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 0 with rewards 22.0\n",
      "Run episode 1 with rewards 11.0\n",
      "Run episode 2 with rewards 13.0\n",
      "Run episode 3 with rewards 13.0\n",
      "Run episode 4 with rewards 13.0\n",
      "Run episode 5 with rewards 13.0\n",
      "Run episode 6 with rewards 14.0\n",
      "Run episode 7 with rewards 9.0\n",
      "Run episode 8 with rewards 10.0\n",
      "Run episode 9 with rewards 11.0\n",
      "Run episode 10 with rewards 12.0\n",
      "Run episode 11 with rewards 53.0\n",
      "Run episode 12 with rewards 12.0\n",
      "Run episode 13 with rewards 10.0\n",
      "Run episode 14 with rewards 18.0\n",
      "Run episode 15 with rewards 18.0\n",
      "Run episode 16 with rewards 12.0\n",
      "Run episode 17 with rewards 15.0\n",
      "Run episode 18 with rewards 13.0\n",
      "Run episode 19 with rewards 14.0\n",
      "Run episode 20 with rewards 12.0\n",
      "Run episode 21 with rewards 18.0\n",
      "Run episode 22 with rewards 26.0\n",
      "Run episode 23 with rewards 18.0\n",
      "Run episode 24 with rewards 10.0\n",
      "Run episode 25 with rewards 14.0\n",
      "Run episode 26 with rewards 21.0\n",
      "Run episode 27 with rewards 12.0\n",
      "Run episode 28 with rewards 16.0\n",
      "Run episode 29 with rewards 14.0\n",
      "Run episode 30 with rewards 19.0\n",
      "Run episode 31 with rewards 10.0\n",
      "Run episode 32 with rewards 24.0\n",
      "Run episode 33 with rewards 18.0\n",
      "Run episode 34 with rewards 14.0\n",
      "Run episode 35 with rewards 9.0\n",
      "Run episode 36 with rewards 13.0\n",
      "Run episode 37 with rewards 13.0\n",
      "Run episode 38 with rewards 24.0\n",
      "Run episode 39 with rewards 11.0\n",
      "Run episode 40 with rewards 15.0\n",
      "Run episode 41 with rewards 12.0\n",
      "Run episode 42 with rewards 17.0\n",
      "Run episode 43 with rewards 10.0\n",
      "Run episode 44 with rewards 13.0\n",
      "Run episode 45 with rewards 12.0\n",
      "Run episode 46 with rewards 10.0\n",
      "Run episode 47 with rewards 23.0\n",
      "Run episode 48 with rewards 18.0\n",
      "Run episode 49 with rewards 15.0\n",
      "Run episode 50 with rewards 16.0\n",
      "Run episode 51 with rewards 12.0\n",
      "Run episode 52 with rewards 22.0\n",
      "Run episode 53 with rewards 11.0\n",
      "Run episode 54 with rewards 13.0\n",
      "Run episode 55 with rewards 13.0\n",
      "Run episode 56 with rewards 12.0\n",
      "Run episode 57 with rewards 30.0\n",
      "Run episode 58 with rewards 16.0\n",
      "Run episode 59 with rewards 21.0\n",
      "Run episode 60 with rewards 13.0\n",
      "Run episode 61 with rewards 9.0\n",
      "Run episode 62 with rewards 13.0\n",
      "Run episode 63 with rewards 10.0\n",
      "Run episode 64 with rewards 11.0\n",
      "Run episode 65 with rewards 12.0\n",
      "Run episode 66 with rewards 14.0\n",
      "Run episode 67 with rewards 15.0\n",
      "Run episode 68 with rewards 18.0\n",
      "Run episode 69 with rewards 13.0\n",
      "Run episode 70 with rewards 11.0\n",
      "Run episode 71 with rewards 14.0\n",
      "Run episode 72 with rewards 12.0\n",
      "Run episode 73 with rewards 9.0\n",
      "Run episode 74 with rewards 9.0\n",
      "Run episode 75 with rewards 12.0\n",
      "Run episode 76 with rewards 17.0\n",
      "Run episode 77 with rewards 8.0\n",
      "Run episode 78 with rewards 22.0\n",
      "Run episode 79 with rewards 20.0\n"
     ]
    }
   ],
   "source": [
    "opt1 = torch.optim.AdamW(value_func.parameters(), lr=0.001)\n",
    "opt2 = torch.optim.AdamW(actor_func.parameters(), lr=0.001)\n",
    "def pick_sample(s):\n",
    "    with torch.no_grad():\n",
    "        #   --> size : (1, 4)\n",
    "        s_batch = np.expand_dims(s, axis=0)\n",
    "        s_batch = torch.tensor(s_batch, dtype=torch.float).to(device)\n",
    "        # Get logits from state\n",
    "        #   --> size : (1, 2)\n",
    "        logits = actor_func(s_batch)\n",
    "        #   --> size : (2)\n",
    "        logits = logits.squeeze(dim=0)\n",
    "        # From logits to probabilities\n",
    "        probs = F.softmax(logits, dim=-1)\n",
    "        # Pick up action's sample\n",
    "        a = torch.multinomial(probs, num_samples=1)\n",
    "        # Return\n",
    "        return a.tolist()[0]\n",
    "reward_records = []\n",
    "for i in range(80):\n",
    "    #\n",
    "    # Run episode till done\n",
    "    #\n",
    "    done = False\n",
    "    states = []\n",
    "    actions = []\n",
    "    rewards = []\n",
    "    s, _ = env.reset(seed=np.random.randint(0, 1e6))\n",
    "    while not done:\n",
    "        states.append(s.tolist())\n",
    "        a = pick_sample(s)\n",
    "        s, r, term, trunc, _ = env.step(a)\n",
    "        done = term or trunc\n",
    "        actions.append(a)\n",
    "        rewards.append(r)\n",
    "\n",
    "    #\n",
    "    # Get cumulative rewards\n",
    "    #\n",
    "    cum_rewards = np.zeros_like(rewards)\n",
    "    reward_len = len(rewards)\n",
    "    for j in reversed(range(reward_len)):\n",
    "        cum_rewards[j] = rewards[j] + (cum_rewards[j+1]*gamma if j+1 < reward_len else 0)\n",
    "\n",
    "    #\n",
    "    # Train (optimize parameters)\n",
    "    #\n",
    "\n",
    "    # Optimize value loss (Critic)\n",
    "    opt1.zero_grad()\n",
    "    states = torch.tensor(states, dtype=torch.float).to(device)\n",
    "    cum_rewards = torch.tensor(cum_rewards, dtype=torch.float).to(device)\n",
    "    values = value_func(states)\n",
    "    values = values.squeeze(dim=1)\n",
    "    vf_loss = F.mse_loss(\n",
    "        values,\n",
    "        cum_rewards,\n",
    "        reduction=\"none\")\n",
    "    vf_loss.sum().backward()\n",
    "    opt1.step()\n",
    "\n",
    "    # Todo 2; RULE BASED UPDATES\n",
    "    with torch.no_grad():\n",
    "        values = value_func(states).squeeze(dim=1)\n",
    "    opt2.zero_grad()\n",
    "    actions = torch.tensor(actions, dtype=torch.int64).to(device)\n",
    "    advantages = cum_rewards - values\n",
    "#     print(advantages)\n",
    "    logits = actor_func(states)\n",
    "    log_probs = -F.cross_entropy(logits, actions, reduction=\"none\")\n",
    "    pi_loss = -log_probs * advantages\n",
    "    pi_loss.sum().backward()\n",
    "    opt2.step()\n",
    "\n",
    "    # Output total rewards in episode (max 500)\n",
    "    print(\"Run episode {} with rewards {}\".format(i, sum(rewards)))#, end=\"\\r\")\n",
    "    reward_records.append(sum(rewards))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "73589768",
   "metadata": {},
   "outputs": [],
   "source": [
    "def softmax(logits):\n",
    "    exp_logits = np.exp(logits)\n",
    "    sum_logits = np.sum(exp_logits)\n",
    "    return (exp_logits / sum_logits).reshape([-1])\n",
    "\n",
    "def pick_sample(s):\n",
    "    \"\"\"Sample one action index for observation `s` from the global `actor`.\n",
    "\n",
    "    `s` is expanded to a one-row batch, wrapped in a DataFrame with the\n",
    "    `column_names` columns, scored by `actor`, and the scores are turned into\n",
    "    probabilities with `softmax` before drawing a single sample.\n",
    "    \"\"\"\n",
    "    observation = pd.DataFrame(np.expand_dims(s, axis=0), columns=column_names)\n",
    "    with torch.no_grad():\n",
    "        action_probs = torch.tensor(softmax(actor(observation)))\n",
    "        drawn = torch.multinomial(action_probs, num_samples=1)\n",
    "    return drawn.tolist()[0]\n",
    "\n",
    "\n",
    "def train():\n",
    "    \"\"\"Train the critic network and the per-action rule ensembles of `actor`.\n",
    "\n",
    "    Runs up to 1000 episodes on the global `env`. After each episode:\n",
    "\n",
    "    1. the critic is regressed onto the discounted returns,\n",
    "    2. if the episode reward matches or beats the best seen so far (from the\n",
    "       second episode on), the current rules are copied into\n",
    "       `actor.best_model`,\n",
    "    3. every ensemble in `actor.model` is fitted (when it has no rules yet)\n",
    "       or updated through `update_rules`, using the advantages computed from\n",
    "       the freshly updated critic.\n",
    "\n",
    "    Training stops early once the mean of the last five recorded episode\n",
    "    rewards exceeds 475.\n",
    "\n",
    "    Relies on notebook globals: `env`, `actor`, `critic`, `critic_optimizer`,\n",
    "    `gamma`, `device`, `column_names`, `update_rules` and `pick_sample`.\n",
    "    The environment is closed before returning, so `env` has to be re-created\n",
    "    before `train()` can be called again.\n",
    "\n",
    "    Returns:\n",
    "        list: total reward of every episode that was followed by a rule\n",
    "        update (the episode that triggers early stopping is not recorded).\n",
    "    \"\"\"\n",
    "    reward_records = []\n",
    "    best_rewards = 0\n",
    "    for i in range(1000):\n",
    "        # Roll out one episode with the current policy.\n",
    "        done = False\n",
    "        states = []\n",
    "        actions = []\n",
    "        rewards = []\n",
    "        s, _ = env.reset(seed=np.random.randint(0, 1_000_000))\n",
    "        while not done:\n",
    "            states.append(s.tolist())\n",
    "            a = pick_sample(s)\n",
    "            s, r, term, trunc, _ = env.step(a)\n",
    "            done = term or trunc\n",
    "            actions.append(a)\n",
    "            rewards.append(r)\n",
    "        episode_reward = sum(rewards)\n",
    "\n",
    "        # Discounted returns, accumulated backwards. The dtype is forced to\n",
    "        # float so integer rewards cannot truncate the discounted values.\n",
    "        cum_rewards = np.zeros(len(rewards), dtype=float)\n",
    "        running_return = 0.0\n",
    "        for j in reversed(range(len(rewards))):\n",
    "            running_return = rewards[j] + gamma * running_return\n",
    "            cum_rewards[j] = running_return\n",
    "\n",
    "        # Optimize value loss (Critic)\n",
    "        critic_optimizer.zero_grad()\n",
    "        states = torch.tensor(states, dtype=torch.float).to(device)\n",
    "        cum_rewards = torch.tensor(cum_rewards, dtype=torch.float).to(device)\n",
    "        values = critic(states)\n",
    "        values = values.squeeze(dim=1)\n",
    "        vf_loss = F.mse_loss(\n",
    "            values,\n",
    "            cum_rewards,\n",
    "            reduction=\"none\")\n",
    "        vf_loss.sum().backward()\n",
    "        critic_optimizer.step()\n",
    "\n",
    "        print('============', i, '===========')\n",
    "        print(len(actions), 'actions', actions)\n",
    "        print(\"{}\\n--------------\\n{}\\nRun episode {} with rewards {}\".format(\n",
    "            actor.model[0].rules_, actor.model[1].rules_, i, episode_reward))\n",
    "\n",
    "        # Snapshot the rules that produced the best episode so far.\n",
    "        if i > 0 and episode_reward >= best_rewards:\n",
    "            best_rewards = episode_reward\n",
    "            for rr in range(actor.action_space):\n",
    "                ensemble = actor.model[rr].rules_\n",
    "                rules = [Rule(q=ensemble[n].q, y=ensemble[n].y)\n",
    "                         for n in range(len(ensemble))]\n",
    "                actor.best_model[rr].rules_ = AdditiveRuleEnsemble(rules)\n",
    "            print('best')\n",
    "\n",
    "        # Early stopping on the recent average. `reward_records` is still\n",
    "        # empty during the first episode, so guard against averaging an empty\n",
    "        # slice (which only yields NaN plus a RuntimeWarning).\n",
    "        # NOTE(review): the current episode is appended only after the rule\n",
    "        # update below, so this average lags by one episode - confirm intended.\n",
    "        if reward_records and np.average(reward_records[-5:]) > 475.0:\n",
    "            break\n",
    "\n",
    "        # Rule based updates (Actor): advantages from the updated critic.\n",
    "        with torch.no_grad():\n",
    "            values = critic(states).squeeze(dim=1)\n",
    "        advantages = cum_rewards - values\n",
    "        x = pd.DataFrame(states.cpu().detach().numpy(), columns=column_names)\n",
    "        y = pd.Series(np.asarray(actions, dtype=np.int64))\n",
    "        adv = pd.Series(advantages.cpu().detach().numpy())\n",
    "        outputs = actor(x).T\n",
    "        for j in range(len(actor.model)):\n",
    "            m = actor.model[j]\n",
    "            # Scores of every action except j, one row per visited state.\n",
    "            masks = np.ones_like(outputs, dtype=bool)\n",
    "            masks[:, j] = False\n",
    "            other_values = outputs[masks].reshape(-1, outputs.shape[1] - 1)\n",
    "\n",
    "            if len(m.rules_) == 0:\n",
    "                m.fit(x, y, adv, other_values, j)\n",
    "            else:\n",
    "                update_rules(m, x, y, adv, other_values, j)\n",
    "\n",
    "        reward_records.append(episode_reward)\n",
    "    print(\"\\nDone\")\n",
    "    env.close()\n",
    "    return reward_records"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "id": "b411aa5d",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 0 ===========\n",
      "67 actions [1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0]\n",
      "\n",
      "--------------\n",
      "\n",
      "Run episode 0 with rewards 67.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/lib/function_base.py:518: RuntimeWarning: Mean of empty slice.\n",
      "  avg = a.mean(axis, **keepdims_kw)\n",
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/core/_methods.py:190: RuntimeWarning: invalid value encountered in double_scalars\n",
      "  ret = ret.dtype.type(ret / rcount)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 1 ===========\n",
      "85 actions [1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +1.4116 if cp>=0.025326931476593054 & cv>=-0.17492903470993043 & pa<=-0.029433537274599072\n",
      "   -2.5185 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +1.2397 if cp<=0.025326931476593054 & cp>=-0.015411880426108835 & cv>=-0.17492903470993043 & pa>=-0.029433537274599072\n",
      "   +1.2995 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   -3.0085 if pav>=1.2673492431640625\n",
      "--------------\n",
      "   -1.4116 if cp>=0.025326931476593054 & cv>=-0.17492903470993043 & pa<=-0.029433537274599072\n",
      "   +2.5185 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -1.2397 if cp<=0.025326931476593054 & cp>=-0.015411880426108835 & cv>=-0.17492903470993043 & pa>=-0.029433537274599072\n",
      "   -1.2995 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   +3.0085 if pav>=1.2673492431640625\n",
      "Run episode 1 with rewards 85.0\n",
      "best\n",
      "stop here\n",
      "============ 2 ===========\n",
      "64 actions [0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0]\n",
      "   +3.7435 if cp>=0.025326931476593054 & cv>=-0.17492903470993043 & pa<=-0.029433537274599072\n",
      "   -5.0065 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +2.8999 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   +0.0001 if pav>=1.2673492431640625\n",
      "   +6.1295 if cp>=0.0010711406241171065 & cv>=0.04871476367115975 & pa<=-0.0045932557433843516 & pa>=-0.028237101808190345\n",
      "--------------\n",
      "   -3.7433 if cp>=0.025326931476593054 & cv>=-0.17492903470993043 & pa<=-0.029433537274599072\n",
      "   +5.0065 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -2.9000 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   -0.0000 if pav>=1.2673492431640625\n",
      "   -6.1291 if cp>=0.0010711406241171065 & cv>=0.04871476367115975 & pa<=-0.0045932557433843516 & pa>=-0.028237101808190345\n",
      "Run episode 2 with rewards 64.0\n",
      "============ 3 ===========\n",
      "35 actions [1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0]\n",
      "   +2.2100 if cp>=0.025326931476593054 & cv>=-0.17492903470993043 & pa<=-0.029433537274599072\n",
      "   -0.9532 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0000 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   +4.9023 if cp>=0.0010711406241171065 & cv>=0.04871476367115975 & pa<=-0.0045932557433843516 & pa>=-0.028237101808190345\n",
      "   +4.8108 if cv<=-0.1832945942878723 & pa<=-0.02219058610498905 & pa<=-0.03310773223638534 & pa>=-0.08485736101865766\n",
      "--------------\n",
      "   -2.2099 if cp>=0.025326931476593054 & cv>=-0.17492903470993043 & pa<=-0.029433537274599072\n",
      "   +0.9533 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0000 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   -4.9020 if cp>=0.0010711406241171065 & cv>=0.04871476367115975 & pa<=-0.0045932557433843516 & pa>=-0.028237101808190345\n",
      "   -4.8108 if cv<=-0.1832945942878723 & pa<=-0.02219058610498905 & pa<=-0.03310773223638534 & pa>=-0.08485736101865766\n",
      "Run episode 3 with rewards 35.0\n",
      "============ 4 ===========\n",
      "58 actions [1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0]\n",
      "   +0.4252 if cp>=0.025326931476593054 & cv>=-0.17492903470993043 & pa<=-0.029433537274599072\n",
      "   -1.7095 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0000 if cp>=0.0010711406241171065 & cv>=0.04871476367115975 & pa<=-0.0045932557433843516 & pa>=-0.028237101808190345\n",
      "   +0.3843 if cv<=-0.1832945942878723 & pa<=-0.02219058610498905 & pa<=-0.03310773223638534 & pa>=-0.08485736101865766\n",
      "   +4.3153 if cp>=-0.010049265995621672 & pa>=-0.08306656628847121\n",
      "--------------\n",
      "   -0.4251 if cp>=0.025326931476593054 & cv>=-0.17492903470993043 & pa<=-0.029433537274599072\n",
      "   +1.7095 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.0000 if cp>=0.0010711406241171065 & cv>=0.04871476367115975 & pa<=-0.0045932557433843516 & pa>=-0.028237101808190345\n",
      "   -0.3843 if cv<=-0.1832945942878723 & pa<=-0.02219058610498905 & pa<=-0.03310773223638534 & pa>=-0.08485736101865766\n",
      "   -4.3153 if cp>=-0.010049265995621672 & pa>=-0.08306656628847121\n",
      "Run episode 4 with rewards 58.0\n",
      "============ 5 ===========\n",
      "36 actions [1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 1]\n",
      "   +2.5570 if cp>=0.025326931476593054 & cv>=-0.17492903470993043 & pa<=-0.029433537274599072\n",
      "   -3.2253 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.1350 if cv<=-0.1832945942878723 & pa<=-0.02219058610498905 & pa<=-0.03310773223638534 & pa>=-0.08485736101865766\n",
      "   +7.4274 if cp>=-0.010049265995621672 & pa>=-0.08306656628847121\n",
      "   -4.0805 if cp<=0.05880629867315293 & cp>=-0.021017606556415557 & pa>=-0.16076740622520447\n",
      "--------------\n",
      "   -2.5569 if cp>=0.025326931476593054 & cv>=-0.17492903470993043 & pa<=-0.029433537274599072\n",
      "   +3.2255 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.1349 if cv<=-0.1832945942878723 & pa<=-0.02219058610498905 & pa<=-0.03310773223638534 & pa>=-0.08485736101865766\n",
      "   -7.4277 if cp>=-0.010049265995621672 & pa>=-0.08306656628847121\n",
      "   +4.0806 if cp<=0.05880629867315293 & cp>=-0.021017606556415557 & pa>=-0.16076740622520447\n",
      "Run episode 5 with rewards 36.0\n",
      "============ 6 ===========\n",
      "43 actions [1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1]\n",
      "   -0.0000 if cp>=0.025326931476593054 & cv>=-0.17492903470993043 & pa<=-0.029433537274599072\n",
      "   -1.0319 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +2.6385 if cp>=-0.010049265995621672 & pa>=-0.08306656628847121\n",
      "   +0.2677 if cp<=0.05880629867315293 & cp>=-0.021017606556415557 & pa>=-0.16076740622520447\n",
      "   -4.8113 if cv<=-0.21116065979003906 & pa<=0.03307227045297623\n",
      "--------------\n",
      "   +0.0000 if cp>=0.025326931476593054 & cv>=-0.17492903470993043 & pa<=-0.029433537274599072\n",
      "   +1.0321 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -2.6386 if cp>=-0.010049265995621672 & pa>=-0.08306656628847121\n",
      "   -0.2677 if cp<=0.05880629867315293 & cp>=-0.021017606556415557 & pa>=-0.16076740622520447\n",
      "   +4.8113 if cv<=-0.21116065979003906 & pa<=0.03307227045297623\n",
      "Run episode 6 with rewards 43.0\n",
      "============ 7 ===========\n",
      "52 actions [1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1]\n",
      "   -3.1995 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +1.2574 if cp>=-0.010049265995621672 & pa>=-0.08306656628847121\n",
      "   +0.2030 if cp<=0.05880629867315293 & cp>=-0.021017606556415557 & pa>=-0.16076740622520447\n",
      "   -3.7366 if cv<=-0.21116065979003906 & pa<=0.03307227045297623\n",
      "   +7.8879 if cp<=-0.030739640071988105 & cv>=-0.024250079691410065 & pa>=-0.0021809887606650583 & pav>=-0.2843522667884827\n",
      "--------------\n",
      "   +3.1996 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -1.2575 if cp>=-0.010049265995621672 & pa>=-0.08306656628847121\n",
      "   -0.2030 if cp<=0.05880629867315293 & cp>=-0.021017606556415557 & pa>=-0.16076740622520447\n",
      "   +3.7366 if cv<=-0.21116065979003906 & pa<=0.03307227045297623\n",
      "   -7.8878 if cp<=-0.030739640071988105 & cv>=-0.024250079691410065 & pa>=-0.0021809887606650583 & pav>=-0.2843522667884827\n",
      "Run episode 7 with rewards 52.0\n",
      "============ 8 ===========\n",
      "86 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0]\n",
      "   -5.1545 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.1630 if cp>=-0.010049265995621672 & pa>=-0.08306656628847121\n",
      "   -4.9553 if cv<=-0.21116065979003906 & pa<=0.03307227045297623\n",
      "   +0.0000 if cp<=-0.030739640071988105 & cv>=-0.024250079691410065 & pa>=-0.0021809887606650583 & pav>=-0.2843522667884827\n",
      "   +2.0376 if pav>=-0.46547389030456543\n",
      "--------------\n",
      "   +5.1543 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.1631 if cp>=-0.010049265995621672 & pa>=-0.08306656628847121\n",
      "   +4.9556 if cv<=-0.21116065979003906 & pa<=0.03307227045297623\n",
      "   +0.0001 if cp<=-0.030739640071988105 & cv>=-0.024250079691410065 & pa>=-0.0021809887606650583 & pav>=-0.2843522667884827\n",
      "   -2.0375 if pav>=-0.46547389030456543\n",
      "Run episode 8 with rewards 86.0\n",
      "best\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 9 ===========\n",
      "62 actions [0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0]\n",
      "   -7.0843 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -1.3228 if cp>=-0.010049265995621672 & pa>=-0.08306656628847121\n",
      "   -3.3172 if cv<=-0.21116065979003906 & pa<=0.03307227045297623\n",
      "   +0.8167 if pav>=-0.46547389030456543\n",
      "   +4.6968 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "--------------\n",
      "   +7.0843 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +1.3228 if cp>=-0.010049265995621672 & pa>=-0.08306656628847121\n",
      "   +3.3174 if cv<=-0.21116065979003906 & pa<=0.03307227045297623\n",
      "   -0.8167 if pav>=-0.46547389030456543\n",
      "   -4.6967 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "Run episode 9 with rewards 62.0\n",
      "============ 10 ===========\n",
      "11 actions [0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -2.9238 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0002 if cp>=-0.010049265995621672 & pa>=-0.08306656628847121\n",
      "   -3.4823 if cv<=-0.21116065979003906 & pa<=0.03307227045297623\n",
      "   +0.5841 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   +6.8364 if pa>=-0.019380318000912666\n",
      "--------------\n",
      "   +2.9238 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0000 if cp>=-0.010049265995621672 & pa>=-0.08306656628847121\n",
      "   +3.4825 if cv<=-0.21116065979003906 & pa<=0.03307227045297623\n",
      "   -0.5841 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   -6.8364 if pa>=-0.019380318000912666\n",
      "Run episode 10 with rewards 11.0\n",
      "============ 11 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.6240 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.0344 if cv<=-0.21116065979003906 & pa<=0.03307227045297623\n",
      "   +0.1651 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   +0.6240 if pa>=-0.019380318000912666\n",
      "   -3.6949 if cp>=-0.005644688848406076 & cv<=-0.2450009137392044\n",
      "--------------\n",
      "   -0.6240 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0344 if cv<=-0.21116065979003906 & pa<=0.03307227045297623\n",
      "   -0.1651 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   -0.6240 if pa>=-0.019380318000912666\n",
      "   +3.6949 if cp>=-0.005644688848406076 & cv<=-0.2450009137392044\n",
      "Run episode 11 with rewards 8.0\n",
      "============ 12 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.3266 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.3048 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   +1.3266 if pa>=-0.019380318000912666\n",
      "   +0.0000 if cp>=-0.005644688848406076 & cv<=-0.2450009137392044\n",
      "   +0.2451 if cp<=-0.05678064301609992\n",
      "--------------\n",
      "   -1.3266 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.3048 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   -1.3266 if pa>=-0.019380318000912666\n",
      "   +0.0000 if cp>=-0.005644688848406076 & cv<=-0.2450009137392044\n",
      "   -0.2451 if cp<=-0.05678064301609992\n",
      "Run episode 12 with rewards 10.0\n",
      "============ 13 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.0590 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.1612 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   +1.0590 if pa>=-0.019380318000912666\n",
      "   +0.0929 if cp<=-0.05678064301609992\n",
      "   +0.2898 if cp<=-0.03336391001939773\n",
      "--------------\n",
      "   -1.0590 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.1612 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   -1.0590 if pa>=-0.019380318000912666\n",
      "   -0.0929 if cp<=-0.05678064301609992\n",
      "   -0.2899 if cp<=-0.03336391001939773\n",
      "Run episode 13 with rewards 9.0\n",
      "============ 14 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.1591 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.2203 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   +1.1591 if pa>=-0.019380318000912666\n",
      "   +0.2028 if cp<=-0.03336391001939773\n",
      "   +0.2028 if cp<=-0.031896191090345374\n",
      "--------------\n",
      "   -1.1591 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.2203 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   -1.1591 if pa>=-0.019380318000912666\n",
      "   -0.2028 if cp<=-0.03336391001939773\n",
      "   -0.2028 if cp<=-0.031896191090345374\n",
      "Run episode 14 with rewards 9.0\n",
      "origin 0.6849780930645504 new 0.6852694221731955 not updated\n",
      "============ 15 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.1591 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.2203 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   +1.1591 if pa>=-0.019380318000912666\n",
      "   +0.2028 if cp<=-0.03336391001939773\n",
      "   +0.2028 if cp<=-0.031896191090345374\n",
      "--------------\n",
      "   -1.0523 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.2122 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   -1.0523 if pa>=-0.019380318000912666\n",
      "   -0.3018 if cp<=-0.031896191090345374\n",
      "   -0.1754 if cp<=-0.03498250395059585\n",
      "Run episode 15 with rewards 8.0\n",
      "============ 16 ===========\n",
      "10 actions [0, 1, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.0929 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.2156 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   +1.0929 if pa>=-0.019380318000912666\n",
      "   +0.0015 if cp<=-0.03336391001939773\n",
      "   +0.3498 if cp<=0.03269056975841523\n",
      "--------------\n",
      "   -1.0231 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.2015 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   -1.0231 if pa>=-0.019380318000912666\n",
      "   -0.0015 if cp<=-0.031896191090345374\n",
      "   -0.3312 if cp<=0.03269056975841523\n",
      "Run episode 16 with rewards 10.0\n",
      "============ 17 ===========\n",
      "48 actions [0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0]\n",
      "   +0.1865 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.9257 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   +0.1865 if pa>=-0.019380318000912666\n",
      "   +0.1865 if cp<=0.03269056975841523\n",
      "   -4.5536 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "--------------\n",
      "   -0.1367 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.9148 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   -0.1367 if pa>=-0.019380318000912666\n",
      "   -0.1367 if cp<=0.03269056975841523\n",
      "   +4.5606 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "Run episode 17 with rewards 48.0\n",
      "============ 18 ===========\n",
      "104 actions [1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0]\n",
      "   +3.6495 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   -0.0002 if pa>=-0.019380318000912666\n",
      "   +0.1393 if cp<=0.03269056975841523\n",
      "   -2.2188 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   -7.6773 if cp>=0.014864135906100279 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "--------------\n",
      "   +0.5735 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -4.0188 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   -0.0000 if pa>=-0.019380318000912666\n",
      "   +2.0552 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   +7.4731 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "Run episode 18 with rewards 104.0\n",
      "best\n",
      "============ 19 ===========\n",
      "39 actions [1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0]\n",
      "   +2.6825 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   +0.4619 if cp<=0.03269056975841523\n",
      "   -3.7295 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   -3.7817 if cp>=0.014864135906100279 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   +3.9384 if cp>=0.05088155344128609\n",
      "--------------\n",
      "   +0.0199 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -3.2092 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   +3.4528 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   +5.3621 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -3.9384 if cp>=0.05088155344128609\n",
      "Run episode 19 with rewards 39.0\n",
      "============ 20 ===========\n",
      "47 actions [0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0]\n",
      "   +0.9928 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   -6.2888 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   -2.7253 if cp>=0.014864135906100279 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   +5.8944 if cp>=0.05088155344128609\n",
      "   +6.4414 if cp>=0.04705715626478195 & pa<=0.030875412002205848 & pav<=0.06523336023092272\n",
      "--------------\n",
      "   -1.0027 if cv>=-0.1358855664730072 & pa>=-0.06187741458415985\n",
      "   +4.7973 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   +3.5979 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -5.4178 if cp>=0.05088155344128609\n",
      "   -6.2610 if cp>=0.04705715626478195 & pa<=0.030875412002205848 & pav<=0.06523336023092272\n",
      "Run episode 20 with rewards 47.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 21 ===========\n",
      "41 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0]\n",
      "   -3.7760 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   -1.1859 if cp>=0.014864135906100279 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   +1.7375 if cp>=0.05088155344128609\n",
      "   +0.0000 if cp>=0.04705715626478195 & pa<=0.030875412002205848 & pav<=0.06523336023092272\n",
      "   +6.0802 if cv<=0.16269262433052065 & pa<=0.06436489671468736 & pav<=0.049871761351823814\n",
      "--------------\n",
      "   +2.1983 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   +2.6615 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -2.1279 if cp>=0.05088155344128609\n",
      "   +0.0000 if cp>=0.04705715626478195 & pa<=0.030875412002205848 & pav<=0.06523336023092272\n",
      "   -5.4429 if cp<=0.006231134664267317 & pa<=0.06436489671468736 & pav<=0.049871761351823814\n",
      "Run episode 21 with rewards 41.0\n",
      "============ 22 ===========\n",
      "36 actions [0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0]\n",
      "   -2.5256 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   +0.0000 if cp>=0.014864135906100279 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   +0.0000 if cp>=0.05088155344128609\n",
      "   +3.2149 if cv<=0.16269262433052065 & pa<=0.06436489671468736 & pav<=0.049871761351823814\n",
      "   -1.0424 if cp>=-0.06668204814195633\n",
      "--------------\n",
      "   +1.4722 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   -0.4373 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -0.0000 if cp>=0.05088155344128609\n",
      "   -1.4010 if cp<=0.006231134664267317 & pa<=0.06436489671468736 & pav<=0.049871761351823814\n",
      "   +1.0589 if cp>=-0.06668204814195633\n",
      "Run episode 22 with rewards 36.0\n",
      "============ 23 ===========\n",
      "47 actions [0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -0.0000 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   -0.0000 if cp>=0.05088155344128609\n",
      "   +3.6954 if cv<=0.16269262433052065 & pa<=0.06436489671468736 & pav<=0.049871761351823814\n",
      "   +0.3778 if cp>=-0.06668204814195633\n",
      "   -3.9877 if cp>=-0.12027187645435333 & pav>=0.3649852573871616\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   -0.0921 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -2.4815 if cp<=0.006231134664267317 & pa<=0.06436489671468736 & pav<=0.049871761351823814\n",
      "   -0.3507 if cp>=-0.06668204814195633\n",
      "   +3.9859 if cp>=-0.12027187645435333 & pav>=0.3649852573871616\n",
      "Run episode 23 with rewards 47.0\n",
      "============ 24 ===========\n",
      "52 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1]\n",
      "   -0.9781 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   +2.6544 if cv<=0.16269262433052065 & pa<=0.06436489671468736 & pav<=0.049871761351823814\n",
      "   +0.9402 if cp>=-0.06668204814195633\n",
      "   -2.8047 if cp>=-0.12027187645435333 & pav>=0.3649852573871616\n",
      "   -4.7818 if cp<=-0.0031674618832766856 & cp<=-0.061794462800025936 & cv<=0.22162300050258638 & pa<=0.09393199980258946\n",
      "--------------\n",
      "   +3.4284 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -1.1303 if cp<=0.006231134664267317 & pa<=0.06436489671468736 & pav<=0.049871761351823814\n",
      "   -2.6039 if cp>=-0.06668204814195633\n",
      "   +4.2770 if cp>=-0.12027187645435333 & pav>=0.3649852573871616\n",
      "   -1.8496 if cp>=-0.061794462800025936 & cv<=0.02486563660204412 & pav<=0.3116439402103426\n",
      "Run episode 24 with rewards 52.0\n",
      "============ 25 ===========\n",
      "19 actions [0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1]\n",
      "   -3.9367 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   +1.0799 if cv<=0.16269262433052065 & pa<=0.06436489671468736 & pav<=0.049871761351823814\n",
      "   +0.7837 if cp>=-0.12027187645435333 & pav>=0.3649852573871616\n",
      "   -3.9657 if cp<=-0.0031674618832766856 & cp<=-0.061794462800025936 & cv<=0.22162300050258638 & pa<=0.09393199980258946\n",
      "   +2.8870 if cv<=0.3801601111888886 & pav<=0.3630851030349735 & pav>=0.07883234322071077\n",
      "--------------\n",
      "   +3.8954 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -3.9775 if cp>=-0.06668204814195633\n",
      "   +3.4749 if cp>=-0.12027187645435333 & pav>=0.3649852573871616\n",
      "   -4.3626 if cp>=-0.061794462800025936 & cv<=0.02486563660204412 & pav<=0.3116439402103426\n",
      "   +2.3111 if cp<=-0.05617154762148857 & cv>=0.3801601111888886\n",
      "Run episode 25 with rewards 19.0\n",
      "============ 26 ===========\n",
      "34 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   -0.7459 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   +0.4286 if cv<=0.16269262433052065 & pa<=0.06436489671468736 & pav<=0.049871761351823814\n",
      "   +0.0000 if cp<=-0.0031674618832766856 & cp<=-0.061794462800025936 & cv<=0.22162300050258638 & pa<=0.09393199980258946\n",
      "   +3.4375 if cv<=0.3801601111888886 & pav<=0.3630851030349735 & pav>=0.07883234322071077\n",
      "   -3.3127 if pav>=0.6621821045875549\n",
      "--------------\n",
      "   +3.9516 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -4.3889 if cp>=-0.06668204814195633\n",
      "   +1.7093 if cp>=-0.12027187645435333 & pav>=0.3649852573871616\n",
      "   -1.9733 if cp>=-0.061794462800025936 & cv<=0.02486563660204412 & pav<=0.3116439402103426\n",
      "   +3.1384 if pav>=0.6621821045875549\n",
      "Run episode 26 with rewards 34.0\n",
      "============ 27 ===========\n",
      "32 actions [0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1]\n",
      "   +1.3367 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   +0.1419 if cv<=0.16269262433052065 & pa<=0.06436489671468736 & pav<=0.049871761351823814\n",
      "   +3.9484 if cv<=0.3801601111888886 & pav<=0.3630851030349735 & pav>=0.07883234322071077\n",
      "   -4.8615 if pav>=0.6621821045875549\n",
      "   -5.1975 if cp<=-0.04292856231331825 & cv<=-0.42646949291229247 & pav<=0.6685341238975525\n",
      "--------------\n",
      "   +3.7239 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -3.3669 if cp>=-0.06668204814195633\n",
      "   -0.8783 if cp>=-0.061794462800025936 & cv<=0.02486563660204412 & pav<=0.3116439402103426\n",
      "   +3.9288 if pav>=0.6621821045875549\n",
      "   +5.8275 if cp<=-0.01755637452006338 & cp<=-0.04292856231331825 & cv<=-0.20005003511905653 & pav<=0.6685341238975525 & pav>=0.3519272327423096\n",
      "Run episode 27 with rewards 32.0\n",
      "============ 28 ===========\n",
      "54 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1]\n",
      "   +0.6566 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   +1.2488 if cv<=0.3801601111888886 & pav<=0.3630851030349735 & pav>=0.07883234322071077\n",
      "   -4.2016 if pav>=0.6621821045875549\n",
      "   -0.0000 if cp<=-0.04292856231331825 & cv<=-0.42646949291229247 & pav<=0.6685341238975525\n",
      "   +3.7496 if cv>=0.15397329926490785 & pa<=0.10597171783447266\n",
      "--------------\n",
      "   +5.7487 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -5.1122 if cp>=-0.06668204814195633\n",
      "   +5.3855 if pav>=0.6621821045875549\n",
      "   +7.8872 if cp<=-0.01755637452006338 & cp<=-0.04292856231331825 & cv<=-0.20005003511905653 & pav<=0.6685341238975525 & pav>=0.3519272327423096\n",
      "   -3.8309 if cv>=0.15397329926490785 & pa<=0.10597171783447266\n",
      "Run episode 28 with rewards 54.0\n",
      "============ 29 ===========\n",
      "12 actions [1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0]\n",
      "   +0.0000 if cp>=-0.04096805900335312 & cv<=-0.17705223858356472\n",
      "   +3.2110 if cv<=0.3801601111888886 & pav<=0.3630851030349735 & pav>=0.07883234322071077\n",
      "   -0.2171 if pav>=0.6621821045875549\n",
      "   +1.0050 if cv>=0.15397329926490785 & pa<=0.10597171783447266\n",
      "   -2.3629 if cp<=-0.11825198382139206 & pav<=-0.05982564762234682\n",
      "--------------\n",
      "   +7.2510 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -5.4468 if cp>=-0.06668204814195633\n",
      "   +0.9824 if pav>=0.6621821045875549\n",
      "  +10.8743 if cp<=-0.01755637452006338 & cp<=-0.04292856231331825 & cv<=-0.20005003511905653 & pav<=0.6685341238975525 & pav>=0.3519272327423096\n",
      "   -2.2668 if pav>=-0.05982564762234682\n",
      "Run episode 29 with rewards 12.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 30 ===========\n",
      "15 actions [1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1]\n",
      "   +0.0120 if cv<=0.3801601111888886 & pav<=0.3630851030349735 & pav>=0.07883234322071077\n",
      "   -2.1038 if pav>=0.6621821045875549\n",
      "   +0.1259 if cv>=0.15397329926490785 & pa<=0.10597171783447266\n",
      "   +0.0000 if cp<=-0.11825198382139206 & pav<=-0.05982564762234682\n",
      "   -2.9057 if cp>=0.005294948071241379 & pa>=0.002686667535454035\n",
      "--------------\n",
      "   +4.0112 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -3.1112 if cp>=-0.06668204814195633\n",
      "   -0.0000 if cp<=-0.01755637452006338 & cp<=-0.04292856231331825 & cv<=-0.20005003511905653 & pav<=0.6685341238975525 & pav>=0.3519272327423096\n",
      "   +0.4584 if pav>=-0.05982564762234682\n",
      "   -3.4213 if cp>=0.00865623727440834\n",
      "Run episode 30 with rewards 15.0\n",
      "============ 31 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0652 if cv<=0.3801601111888886 & pav<=0.3630851030349735 & pav>=0.07883234322071077\n",
      "   -0.8068 if pav>=0.6621821045875549\n",
      "   +2.4802 if cv>=0.15397329926490785 & pa<=0.10597171783447266\n",
      "   -5.5924 if cp>=0.005294948071241379 & pa>=0.002686667535454035\n",
      "   +2.8030 if cp>=0.00773359667509795 & cv<=-0.31751075983047444 & cv>=-0.6692519307136535\n",
      "--------------\n",
      "   +4.8048 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -4.7542 if cp>=-0.06668204814195633\n",
      "   +0.2333 if pav>=-0.05982564762234682\n",
      "   -0.7824 if cp>=0.00865623727440834\n",
      "   -2.1674 if cp>=0.03786369040608406\n",
      "Run episode 31 with rewards 9.0\n",
      "============ 32 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.7782 if pav>=0.6621821045875549\n",
      "   -0.0000 if cv>=0.15397329926490785 & pa<=0.10597171783447266\n",
      "   -0.0000 if cp>=0.005294948071241379 & pa>=0.002686667535454035\n",
      "   -0.0000 if cp>=0.00773359667509795 & cv<=-0.31751075983047444 & cv>=-0.6692519307136535\n",
      "   +2.5548 if cp>=-0.017135579138994217\n",
      "--------------\n",
      "   -0.2437 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -1.7812 if cp>=-0.06668204814195633\n",
      "   -0.0000 if cp>=0.00865623727440834\n",
      "   -0.0000 if cp>=0.03786369040608406\n",
      "   -2.6847 if cp>=-0.08920289427042008\n",
      "Run episode 32 with rewards 9.0\n",
      "============ 33 ===========\n",
      "9 actions [0, 0, 0, 1, 0, 0, 0, 0, 0]\n",
      "   +0.2025 if pav>=0.6621821045875549\n",
      "   +0.2778 if cp>=0.005294948071241379 & pa>=0.002686667535454035\n",
      "   +0.1207 if cp>=0.00773359667509795 & cv<=-0.31751075983047444 & cv>=-0.6692519307136535\n",
      "   +0.3794 if cp>=-0.017135579138994217\n",
      "   +0.4211 if cp>=-0.045064251869916916\n",
      "--------------\n",
      "   -0.3975 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -0.9631 if cp>=-0.06668204814195633\n",
      "   -0.0000 if cp>=0.03786369040608406\n",
      "   -0.9398 if cp>=-0.08920289427042008\n",
      "   -0.0264 if cp<=0.006803672201931484 & cp>=-0.014044384472072121\n",
      "Run episode 33 with rewards 9.0\n",
      "============ 34 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0]\n",
      "   +0.2623 if pav>=0.6621821045875549\n",
      "   -0.0000 if cp>=0.005294948071241379 & pa>=0.002686667535454035\n",
      "   +1.5789 if cp>=-0.017135579138994217\n",
      "   +0.1692 if cp>=-0.045064251869916916\n",
      "   -3.6536 if cp>=-0.024263936281204216 & cv<=-0.4211744308471678\n",
      "--------------\n",
      "   -0.7449 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   +0.1712 if cp>=-0.06668204814195633\n",
      "   -0.1046 if cp>=-0.08920289427042008\n",
      "   -2.0946 if cp<=0.006803672201931484 & cp>=-0.014044384472072121\n",
      "   -2.2823 if cp<=-0.024263936281204216\n",
      "Run episode 34 with rewards 12.0\n",
      "============ 35 ===========\n",
      "11 actions [0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1]\n",
      "   -2.2706 if pav>=0.6621821045875549\n",
      "   +3.3039 if cp>=-0.017135579138994217\n",
      "   -0.2362 if cp>=-0.045064251869916916\n",
      "   -2.9173 if cp>=-0.024263936281204216 & cv<=-0.4211744308471678\n",
      "   +1.8355 if cp<=-0.006551685370504853 & cp>=-0.03490797542035579\n",
      "--------------\n",
      "   -0.5120 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   +0.0003 if cp>=-0.06668204814195633\n",
      "   -3.0025 if cp<=0.006803672201931484 & cp>=-0.014044384472072121\n",
      "   +0.5003 if cp<=-0.024263936281204216\n",
      "   -1.9875 if cp>=0.037367440015077594\n",
      "Run episode 35 with rewards 11.0\n",
      "============ 36 ===========\n",
      "14 actions [0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1]\n",
      "   -2.4494 if pav>=0.6621821045875549\n",
      "   +2.7890 if cp>=-0.017135579138994217\n",
      "   -2.1564 if cp>=-0.024263936281204216 & cv<=-0.4211744308471678\n",
      "   +1.1332 if cp<=-0.006551685370504853 & cp>=-0.03490797542035579\n",
      "   +1.4181 if cp<=-0.002018781378865232 & cv>=-0.1854899823665619\n",
      "--------------\n",
      "   -1.0347 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   -2.8438 if cp<=0.006803672201931484 & cp>=-0.014044384472072121\n",
      "   -0.4197 if cp<=-0.024263936281204216\n",
      "   +0.0000 if cp>=0.037367440015077594\n",
      "   +0.5113 if cv<=-0.37181591987609863\n",
      "Run episode 36 with rewards 14.0\n",
      "============ 37 ===========\n",
      "13 actions [0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1]\n",
      "   -2.6880 if pav>=0.6621821045875549\n",
      "   +0.0000 if cp>=-0.017135579138994217\n",
      "   +0.0000 if cp>=-0.024263936281204216 & cv<=-0.4211744308471678\n",
      "   +0.0803 if cp<=-0.002018781378865232 & cv>=-0.1854899823665619\n",
      "   +4.7284 if cp>=-0.08581082671880721 & pav<=0.909254789352417\n",
      "--------------\n",
      "   -0.3824 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   +0.0000 if cp<=0.006803672201931484 & cp>=-0.014044384472072121\n",
      "   -2.8945 if cp<=-0.024263936281204216\n",
      "   +0.8842 if cv<=-0.37181591987609863\n",
      "   +2.5878 if cv<=-0.4683873891830444 & pav>=0.909254789352417\n",
      "Run episode 37 with rewards 13.0\n",
      "============ 38 ===========\n",
      "43 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0]\n",
      "   -2.8939 if pav>=0.6621821045875549\n",
      "   +5.0202 if cp>=-0.017135579138994217\n",
      "   +0.2247 if cp<=-0.002018781378865232 & cv>=-0.1854899823665619\n",
      "   +0.4183 if cp>=-0.08581082671880721 & pav<=0.909254789352417\n",
      "   +0.2777 if cp>=-0.00422500977292656\n",
      "--------------\n",
      "   -0.7603 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   +2.3621 if cp<=-0.024263936281204216\n",
      "   -0.6668 if cv<=-0.37181591987609863\n",
      "   +1.1906 if cv<=-0.4683873891830444 & pav>=0.909254789352417\n",
      "   -1.6576 if cp<=-0.07095447331666946 & pav<=0.8885409235954285\n",
      "Run episode 38 with rewards 43.0\n",
      "============ 39 ===========\n",
      "14 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0]\n",
      "   -5.3681 if pav>=0.6621821045875549\n",
      "   +4.3970 if cp>=-0.017135579138994217\n",
      "   +0.6036 if cp>=-0.08581082671880721 & pav<=0.909254789352417\n",
      "   +5.0770 if cp>=-0.00422500977292656\n",
      "   -2.8188 if cp<=0.03477869853377343 & cv>=0.2755682587623599\n",
      "--------------\n",
      "   -1.9857 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   +7.2327 if cp<=-0.024263936281204216\n",
      "   +1.0991 if cv<=-0.4683873891830444 & pav>=0.909254789352417\n",
      "   -5.1674 if cp<=-0.07095447331666946 & pav<=0.8885409235954285\n",
      "   -1.9808 if cp<=-0.023953026533126826\n",
      "Run episode 39 with rewards 14.0\n",
      "============ 40 ===========\n",
      "29 actions [0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0]\n",
      "   -0.6944 if pav>=0.6621821045875549\n",
      "   +0.0928 if cp>=-0.017135579138994217\n",
      "   +4.1009 if cp>=-0.00422500977292656\n",
      "   +0.0000 if cp<=0.03477869853377343 & cv>=0.2755682587623599\n",
      "   -2.4710 if cv<=0.004333408409729601 & pa>=0.18370938003063203\n",
      "--------------\n",
      "   -1.9828 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   +1.2989 if cp<=-0.024263936281204216\n",
      "   -0.4905 if cp<=-0.07095447331666946 & pav<=0.8885409235954285\n",
      "   +1.2989 if cp<=-0.023953026533126826\n",
      "   +1.6922 if pav>=1.5026167631149292\n",
      "Run episode 40 with rewards 29.0\n",
      "============ 41 ===========\n",
      "14 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1]\n",
      "   -1.6875 if pav>=0.6621821045875549\n",
      "   +0.4014 if cp>=-0.017135579138994217\n",
      "   +2.6905 if cp>=-0.00422500977292656\n",
      "   +0.3233 if cv<=0.004333408409729601 & pa>=0.18370938003063203\n",
      "   +3.9927 if cp<=-0.02776297479867935 & pa<=0.17418833673000336 & pav<=0.5101841270923618\n",
      "--------------\n",
      "   -3.3764 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   +1.0983 if cp<=-0.024263936281204216\n",
      "   +1.0983 if cp<=-0.023953026533126826\n",
      "   -0.1543 if pav>=1.5026167631149292\n",
      "   +4.3152 if cp<=-0.02776297479867935 & pa>=0.17418833673000336\n",
      "Run episode 41 with rewards 14.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 42 ===========\n",
      "25 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.3733 if pav>=0.6621821045875549\n",
      "   +2.9968 if cp>=-0.017135579138994217\n",
      "   +2.9968 if cp>=-0.00422500977292656\n",
      "   -0.0000 if cp<=-0.02776297479867935 & pa<=0.17418833673000336 & pav<=0.5101841270923618\n",
      "   -1.9260 if cp>=-0.05849563851952552\n",
      "--------------\n",
      "   -0.0000 if cv>=-0.18116432726383208 & pa>=-0.02832670323550701 & pav>=-0.06850113570690151\n",
      "   +0.8135 if cp<=-0.024263936281204216\n",
      "   +0.8135 if cp<=-0.023953026533126826\n",
      "   +1.1226 if cp<=-0.02776297479867935 & pa>=0.17418833673000336\n",
      "   -1.9571 if cp<=0.028244622796773915 & cv>=-0.8379717230796814\n",
      "Run episode 42 with rewards 25.0\n",
      "============ 43 ===========\n",
      "36 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.6230 if pav>=0.6621821045875549\n",
      "   +6.2149 if cp>=-0.017135579138994217\n",
      "   +2.4846 if cp>=-0.00422500977292656\n",
      "   -3.9791 if cp>=-0.05849563851952552\n",
      "   -0.7483 if cp<=-0.01792926266789436 & pa>=0.05777111351490021\n",
      "--------------\n",
      "   +1.6065 if cp<=-0.024263936281204216\n",
      "   +1.6065 if cp<=-0.023953026533126826\n",
      "   -0.0008 if cp<=-0.02776297479867935 & pa>=0.17418833673000336\n",
      "   -1.2569 if cp<=0.028244622796773915 & cv>=-0.8379717230796814\n",
      "   +2.2846 if cp<=-0.01792926266789436 & cv<=0.45012400150299126\n",
      "Run episode 43 with rewards 36.0\n",
      "============ 44 ===========\n",
      "35 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   +3.0680 if cp>=-0.017135579138994217\n",
      "   +1.5345 if cp>=-0.00422500977292656\n",
      "   +1.0705 if cp>=-0.05849563851952552\n",
      "   -2.9982 if cp<=-0.01792926266789436 & pa>=0.05777111351490021\n",
      "   +0.1785 if cv>=1.5178991556167603\n",
      "--------------\n",
      "   +2.8521 if cp<=-0.024263936281204216\n",
      "   +2.8521 if cp<=-0.023953026533126826\n",
      "   +0.3743 if cp<=0.028244622796773915 & cv>=-0.8379717230796814\n",
      "   +1.1579 if cp<=-0.01792926266789436 & cv<=0.45012400150299126\n",
      "   -1.9211 if cp<=0.024269644170999548\n",
      "Run episode 44 with rewards 35.0\n",
      "============ 45 ===========\n",
      "24 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   +3.2317 if cp>=-0.017135579138994217\n",
      "   +2.3109 if cp>=-0.00422500977292656\n",
      "   +0.1029 if cp>=-0.05849563851952552\n",
      "   -0.7546 if cp<=-0.01792926266789436 & pa>=0.05777111351490021\n",
      "   -1.0577 if cp<=-0.019180504232645 & cp>=-0.052694191038608534 & cv>=0.3886843502521515 & pa>=-0.04617589637637137\n",
      "--------------\n",
      "   +2.9005 if cp<=-0.024263936281204216\n",
      "   +2.9005 if cp<=-0.023953026533126826\n",
      "   +1.0712 if cp<=-0.01792926266789436 & cv<=0.45012400150299126\n",
      "   +0.1133 if cp<=0.024269644170999548\n",
      "   -0.1228 if cv>=-0.002094418217893684\n",
      "Run episode 45 with rewards 24.0\n",
      "============ 46 ===========\n",
      "31 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +3.8252 if cp>=-0.017135579138994217\n",
      "   +1.5457 if cp>=-0.00422500977292656\n",
      "   -0.0000 if cp<=-0.01792926266789436 & pa>=0.05777111351490021\n",
      "   -0.0000 if cp<=-0.019180504232645 & cp>=-0.052694191038608534 & cv>=0.3886843502521515 & pa>=-0.04617589637637137\n",
      "   -2.7608 if cp>=-0.04315799735486505 & pa>=-0.04160828441381453\n",
      "--------------\n",
      "   +1.2685 if cp<=-0.024263936281204216\n",
      "   +1.2685 if cp<=-0.023953026533126826\n",
      "   +3.9731 if cp<=-0.01792926266789436 & cv<=0.45012400150299126\n",
      "   +0.1943 if cv>=-0.002094418217893684\n",
      "   +0.9372 if cp<=-0.01876702792942523 & cv>=0.5776128649711609\n",
      "Run episode 46 with rewards 31.0\n",
      "============ 47 ===========\n",
      "24 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +5.8273 if cp>=-0.017135579138994217\n",
      "   -0.1048 if cp>=-0.00422500977292656\n",
      "   -0.1884 if cp<=-0.019180504232645 & cp>=-0.052694191038608534 & cv>=0.3886843502521515 & pa>=-0.04617589637637137\n",
      "   -2.0192 if cp>=-0.04315799735486505 & pa>=-0.04160828441381453\n",
      "   -5.6385 if cp>=0.01658136583864692 & cv<=0.5845133662223816 & cv>=0.5845133662223816\n",
      "--------------\n",
      "   +1.3497 if cp<=-0.024263936281204216\n",
      "   +1.3497 if cp<=-0.023953026533126826\n",
      "   +3.4204 if cp<=-0.01792926266789436 & cv<=0.45012400150299126\n",
      "   +0.2183 if cp<=-0.01876702792942523 & cv>=0.5776128649711609\n",
      "   -2.6639 if cp<=0.01658136583864692 & cv<=0.003865611972287299\n",
      "Run episode 47 with rewards 24.0\n",
      "============ 48 ===========\n",
      "32 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +5.1429 if cp>=-0.017135579138994217\n",
      "   -0.7154 if cp<=-0.019180504232645 & cp>=-0.052694191038608534 & cv>=0.3886843502521515 & pa>=-0.04617589637637137\n",
      "   -0.8647 if cp>=-0.04315799735486505 & pa>=-0.04160828441381453\n",
      "   +0.0000 if cp>=0.01658136583864692 & cv<=0.5845133662223816 & cv>=0.5845133662223816\n",
      "   -1.1142 if cp>=-0.048256512731313705 & pa<=-0.007012215256690959\n",
      "--------------\n",
      "   +1.2840 if cp<=-0.024263936281204216\n",
      "   +1.2840 if cp<=-0.023953026533126826\n",
      "   +1.8595 if cp<=-0.01792926266789436 & cv<=0.45012400150299126\n",
      "   +0.3184 if cp<=0.01658136583864692 & cv<=0.003865611972287299\n",
      "   +1.0890 if cp<=-0.008799812104552962 & cv>=-0.29624887406826006\n",
      "Run episode 48 with rewards 32.0\n",
      "============ 49 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   +1.1382 if cp>=-0.017135579138994217\n",
      "   -1.3065 if cp<=-0.019180504232645 & cp>=-0.052694191038608534 & cv>=0.3886843502521515 & pa>=-0.04617589637637137\n",
      "   +1.1681 if cp>=-0.04315799735486505 & pa>=-0.04160828441381453\n",
      "   -0.0000 if cp>=-0.048256512731313705 & pa<=-0.007012215256690959\n",
      "   +4.2163 if cp>=-0.027115428820252415\n",
      "--------------\n",
      "   +4.0163 if cp<=-0.024263936281204216\n",
      "   +4.0163 if cp<=-0.023953026533126826\n",
      "   -3.1729 if cp<=-0.01792926266789436 & cv<=0.45012400150299126\n",
      "   +1.1722 if cp<=-0.008799812104552962 & cv>=-0.29624887406826006\n",
      "   -0.6310 if cp<=0.10201223939657213 & pav<=1.1777703523635865\n",
      "Run episode 49 with rewards 10.0\n",
      "============ 50 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +1.1114 if cp>=-0.017135579138994217\n",
      "   -0.0000 if cp<=-0.019180504232645 & cp>=-0.052694191038608534 & cv>=0.3886843502521515 & pa>=-0.04617589637637137\n",
      "   +1.3958 if cp>=-0.04315799735486505 & pa>=-0.04160828441381453\n",
      "   +1.5852 if cp>=-0.027115428820252415\n",
      "   +0.3550 if cp>=0.035830370336771014\n",
      "--------------\n",
      "   +0.8685 if cp<=-0.024263936281204216\n",
      "   +0.8685 if cp<=-0.023953026533126826\n",
      "   +0.8685 if cp<=-0.01792926266789436 & cv<=0.45012400150299126\n",
      "   -0.0000 if cp<=-0.008799812104552962 & cv>=-0.29624887406826006\n",
      "   +0.5911 if cp<=0.035830370336771014\n",
      "Run episode 50 with rewards 8.0\n",
      "============ 51 ===========\n",
      "36 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1]\n",
      "   +1.6460 if cp>=-0.017135579138994217\n",
      "   +1.3247 if cp>=-0.04315799735486505 & pa>=-0.04160828441381453\n",
      "   +1.6460 if cp>=-0.027115428820252415\n",
      "   -0.0000 if cp>=0.035830370336771014\n",
      "   -0.3285 if cp<=-0.027089172601699827\n",
      "--------------\n",
      "   +0.8363 if cp<=-0.024263936281204216\n",
      "   +0.8363 if cp<=-0.023953026533126826\n",
      "   +0.8363 if cp<=-0.01792926266789436 & cv<=0.45012400150299126\n",
      "   -0.3725 if cp<=0.035830370336771014\n",
      "   +0.3395 if cp<=0.015123616531491288\n",
      "Run episode 51 with rewards 36.0\n",
      "============ 52 ===========\n",
      "50 actions [1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +6.9950 if cp>=-0.017135579138994217\n",
      "   -0.5925 if cp>=-0.04315799735486505 & pa>=-0.04160828441381453\n",
      "   -2.1991 if cp>=-0.027115428820252415\n",
      "   -0.1514 if cp<=-0.027089172601699827\n",
      "   -3.0260 if cp<=-0.030504142865538552 & cv<=0.825288712978363\n",
      "--------------\n",
      "   +1.5368 if cp<=-0.024263936281204216\n",
      "   +1.5368 if cp<=-0.023953026533126826\n",
      "   +1.4185 if cp<=-0.01792926266789436 & cv<=0.45012400150299126\n",
      "   +1.6842 if cp<=0.035830370336771014\n",
      "   -3.3899 if cv>=0.825288712978363\n",
      "Run episode 52 with rewards 50.0\n",
      "============ 53 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   +7.8646 if cp>=-0.017135579138994217\n",
      "   -1.5498 if cp>=-0.04315799735486505 & pa>=-0.04160828441381453\n",
      "   -0.6062 if cp>=-0.027115428820252415\n",
      "   -1.0466 if cp<=-0.030504142865538552 & cv<=0.825288712978363\n",
      "   -3.2996 if cp>=-0.009246947243809672 & cv<=0.18535721004009248 & cv>=-0.1981553256511688 & pa>=-0.03180819004774093\n",
      "--------------\n",
      "   +1.2045 if cp<=-0.024263936281204216\n",
      "   +1.2045 if cp<=-0.023953026533126826\n",
      "   +2.4692 if cp<=0.035830370336771014\n",
      "   -2.0431 if cv>=0.825288712978363\n",
      "   -2.6931 if cp<=0.021468844264745768 & cp>=-0.009246947243809672 & cv<=-0.1981553256511688 & pa>=-0.03180819004774093\n",
      "Run episode 53 with rewards 11.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 54 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0]\n",
      "   +2.9804 if cp>=-0.017135579138994217\n",
      "   +2.4971 if cp>=-0.04315799735486505 & pa>=-0.04160828441381453\n",
      "   -0.5309 if cp<=-0.030504142865538552 & cv<=0.825288712978363\n",
      "   -0.0000 if cp>=-0.009246947243809672 & cv<=0.18535721004009248 & cv>=-0.1981553256511688 & pa>=-0.03180819004774093\n",
      "   +0.2828 if cp>=0.04330228641629219\n",
      "--------------\n",
      "   +0.9226 if cp<=-0.023953026533126826\n",
      "   +0.6035 if cp<=0.035830370336771014\n",
      "   +0.0000 if cv>=0.825288712978363\n",
      "   -0.0634 if cp<=0.021468844264745768 & cp>=-0.009246947243809672 & cv<=-0.1981553256511688 & pa>=-0.03180819004774093\n",
      "   -0.3845 if cv>=-1.019973635673523\n",
      "Run episode 54 with rewards 11.0\n",
      "============ 55 ===========\n",
      "43 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   +3.7491 if cp>=-0.017135579138994217\n",
      "   -0.2091 if cp>=-0.04315799735486505 & pa>=-0.04160828441381453\n",
      "   -1.0008 if cp<=-0.030504142865538552 & cv<=0.825288712978363\n",
      "   -0.0000 if cp>=0.04330228641629219\n",
      "   +0.9304 if pa>=0.20640085637569427\n",
      "--------------\n",
      "   +0.5011 if cp<=-0.023953026533126826\n",
      "   +1.9775 if cp<=0.035830370336771014\n",
      "   -0.3457 if cp<=0.021468844264745768 & cp>=-0.009246947243809672 & cv<=-0.1981553256511688 & pa>=-0.03180819004774093\n",
      "   -0.7983 if cv>=-1.019973635673523\n",
      "   +2.1353 if pav>=1.7934449911117554\n",
      "Run episode 55 with rewards 43.0\n",
      "============ 56 ===========\n",
      "45 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.5169 if cp>=-0.017135579138994217\n",
      "   +1.9273 if cp>=-0.04315799735486505 & pa>=-0.04160828441381453\n",
      "   -2.3740 if cp<=-0.030504142865538552 & cv<=0.825288712978363\n",
      "   +0.0000 if pa>=0.20640085637569427\n",
      "   -3.9840 if pav>=1.1559536457061768\n",
      "--------------\n",
      "   +0.3660 if cp<=-0.023953026533126826\n",
      "   +0.9525 if cp<=0.035830370336771014\n",
      "   +0.9525 if cv>=-1.019973635673523\n",
      "   -0.0000 if pav>=1.7934449911117554\n",
      "   -5.2026 if cp>=-0.042810378968715666 & cv>=-0.23563872575759887 & pa<=0.0056100058369338525 & pa>=-0.019244378618895976 & pa>=-0.07797572165727615\n",
      "Run episode 56 with rewards 45.0\n",
      "============ 57 ===========\n",
      "65 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   -0.1813 if cp>=-0.017135579138994217\n",
      "   -1.1890 if cp>=-0.04315799735486505 & pa>=-0.04160828441381453\n",
      "   -3.3061 if cp<=-0.030504142865538552 & cv<=0.825288712978363\n",
      "   -5.8236 if pav>=1.1559536457061768\n",
      "   +6.5135 if cp>=-0.024528086930513372\n",
      "--------------\n",
      "   +6.6892 if cp<=-0.023953026533126826\n",
      "   -2.3552 if cp<=0.035830370336771014\n",
      "   +1.2894 if cv>=-1.019973635673523\n",
      "   -0.4614 if cp>=-0.042810378968715666 & cv>=-0.23563872575759887 & pa<=0.0056100058369338525 & pa>=-0.019244378618895976 & pa>=-0.07797572165727615\n",
      "   +3.6945 if cv<=-0.4063100218772888 & pa<=0.06128802597522737 & pav>=1.0193459749221803\n",
      "Run episode 57 with rewards 65.0\n",
      "============ 58 ===========\n",
      "48 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +0.7142 if cp>=-0.04315799735486505 & pa>=-0.04160828441381453\n",
      "   -0.7049 if cp<=-0.030504142865538552 & cv<=0.825288712978363\n",
      "   -6.3481 if pav>=1.1559536457061768\n",
      "   +5.8379 if cp>=-0.024528086930513372\n",
      "   -1.9370 if pa>=-0.03507629930973053\n",
      "--------------\n",
      "   +3.5725 if cp<=-0.023953026533126826\n",
      "   +0.3065 if cp<=0.035830370336771014\n",
      "   -0.3828 if cv>=-1.019973635673523\n",
      "   +3.8236 if cv<=-0.4063100218772888 & pa<=0.06128802597522737 & pav>=1.0193459749221803\n",
      "   -2.4340 if cp>=-0.0011156381107866754 & cv<=-0.5931102752685546 & pa>=-0.07291205674409866\n",
      "Run episode 58 with rewards 48.0\n",
      "============ 59 ===========\n",
      "27 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +1.2676 if cp>=-0.04315799735486505 & pa>=-0.04160828441381453\n",
      "   -7.0702 if pav>=1.1559536457061768\n",
      "   +5.1348 if cp>=-0.024528086930513372\n",
      "   -1.5773 if pa>=-0.03507629930973053\n",
      "   -1.2451 if pa<=0.15265043973922732 & pa>=0.04764041379094125\n",
      "--------------\n",
      "   +3.8010 if cp<=-0.023953026533126826\n",
      "   -0.3411 if cv>=-1.019973635673523\n",
      "   +1.7254 if cv<=-0.4063100218772888 & pa<=0.06128802597522737 & pav>=1.0193459749221803\n",
      "   +1.6307 if cp>=-0.0011156381107866754 & cv<=-0.5931102752685546 & pa>=-0.07291205674409866\n",
      "   +1.8915 if cp>=-0.021567066386342048 & cv<=-0.5491835236549377 & pa>=0.09688644409179688 & pav>=0.9672824025154114\n",
      "Run episode 59 with rewards 27.0\n",
      "============ 60 ===========\n",
      "38 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.04315799735486505 & pa>=-0.04160828441381453\n",
      "   -0.1308 if pav>=1.1559536457061768\n",
      "   +4.6913 if cp>=-0.024528086930513372\n",
      "   -1.0774 if pa>=-0.03507629930973053\n",
      "   -1.6910 if cp>=-0.05546507090330124 & pa>=-0.06270171254873275\n",
      "--------------\n",
      "   +4.6408 if cp<=-0.023953026533126826\n",
      "   -0.1123 if cv<=-0.4063100218772888 & pa<=0.06128802597522737 & pav>=1.0193459749221803\n",
      "   -0.0000 if cp>=-0.0011156381107866754 & cv<=-0.5931102752685546 & pa>=-0.07291205674409866\n",
      "   -0.0000 if cp>=-0.021567066386342048 & cv<=-0.5491835236549377 & pa>=0.09688644409179688 & pav>=0.9672824025154114\n",
      "   -0.6405 if pa<=-0.06270171254873275\n",
      "Run episode 60 with rewards 38.0\n",
      "============ 61 ===========\n",
      "40 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   +0.2155 if pav>=1.1559536457061768\n",
      "   +4.7126 if cp>=-0.024528086930513372\n",
      "   -1.3697 if pa>=-0.03507629930973053\n",
      "   +0.4924 if cp>=-0.05546507090330124 & pa>=-0.06270171254873275\n",
      "   -6.4680 if cp<=-0.014671675488352773 & cv<=-0.45671402215957635 & pa<=0.03575203716754914\n",
      "--------------\n",
      "   +3.7008 if cp<=-0.023953026533126826\n",
      "   -1.0578 if cv<=-0.4063100218772888 & pa<=0.06128802597522737 & pav>=1.0193459749221803\n",
      "   +0.0000 if cp>=-0.021567066386342048 & cv<=-0.5491835236549377 & pa>=0.09688644409179688 & pav>=0.9672824025154114\n",
      "   -1.1943 if pa<=-0.06270171254873275\n",
      "   +4.8598 if cp<=-0.014671675488352773 & cv<=-0.45671402215957635 & pa<=0.03575203716754914\n",
      "Run episode 61 with rewards 40.0\n",
      "============ 62 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +5.7558 if cp>=-0.024528086930513372\n",
      "   -1.6573 if pa>=-0.03507629930973053\n",
      "   +0.8887 if cp>=-0.05546507090330124 & pa>=-0.06270171254873275\n",
      "   -0.0133 if cp<=-0.014671675488352773 & cv<=-0.45671402215957635 & pa<=0.03575203716754914\n",
      "   -0.4316 if \n",
      "--------------\n",
      "   +4.7803 if cp<=-0.023953026533126826\n",
      "   -0.4921 if cv<=-0.4063100218772888 & pa<=0.06128802597522737 & pav>=1.0193459749221803\n",
      "   -0.9052 if pa<=-0.06270171254873275\n",
      "   +0.0014 if cp<=-0.014671675488352773 & cv<=-0.45671402215957635 & pa<=0.03575203716754914\n",
      "   -0.4768 if cp<=0.00044456378091127687\n",
      "Run episode 62 with rewards 8.0\n",
      "============ 63 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.3937 if cp>=-0.024528086930513372\n",
      "   +0.9129 if pa>=-0.03507629930973053\n",
      "   +0.9131 if cp>=-0.05546507090330124 & pa>=-0.06270171254873275\n",
      "   +0.9129 if \n",
      "   -0.0698 if cp<=0.012518102675676355\n",
      "--------------\n",
      "   +0.3958 if cp<=-0.023953026533126826\n",
      "   -0.0000 if cv<=-0.4063100218772888 & pa<=0.06128802597522737 & pav>=1.0193459749221803\n",
      "   -0.0000 if pa<=-0.06270171254873275\n",
      "   +0.2670 if cp<=0.00044456378091127687\n",
      "   -0.5755 if cp>=-0.029834797978401183\n",
      "Run episode 63 with rewards 10.0\n",
      "============ 64 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8716 if cp>=-0.024528086930513372\n",
      "   +1.3363 if pa>=-0.03507629930973053\n",
      "   +1.2473 if cp>=-0.05546507090330124 & pa>=-0.06270171254873275\n",
      "   +2.1540 if \n",
      "   +0.0457 if cp<=-0.09050427675247193\n",
      "--------------\n",
      "   -0.6493 if cp<=-0.023953026533126826\n",
      "   +0.0000 if pa<=-0.06270171254873275\n",
      "   -1.2225 if cp<=0.00044456378091127687\n",
      "   -0.6638 if cp>=-0.029834797978401183\n",
      "   -0.0217 if cp<=-0.09050427675247193\n",
      "Run episode 64 with rewards 8.0\n",
      "============ 65 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.024528086930513372\n",
      "   +0.9892 if pa>=-0.03507629930973053\n",
      "   +0.8091 if cp>=-0.05546507090330124 & pa>=-0.06270171254873275\n",
      "   +0.9892 if \n",
      "   +0.0432 if cp<=-0.08088618963956833\n",
      "--------------\n",
      "   -0.4002 if cp<=-0.023953026533126826\n",
      "   -0.4002 if cp<=0.00044456378091127687\n",
      "   -0.0000 if cp>=-0.029834797978401183\n",
      "   +0.0081 if cp<=-0.09050427675247193\n",
      "   -0.2243 if cp<=-0.03281810283660889\n",
      "Run episode 65 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 66 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.4710 if pa>=-0.03507629930973053\n",
      "   +1.1824 if cp>=-0.05546507090330124 & pa>=-0.06270171254873275\n",
      "   +1.4710 if \n",
      "   +0.1119 if cp<=-0.08088618963956833\n",
      "   +0.0131 if cp<=-0.1004813328385353\n",
      "--------------\n",
      "   -0.4550 if cp<=-0.023953026533126826\n",
      "   -1.4669 if cp<=0.00044456378091127687\n",
      "   -0.0837 if cp<=-0.09050427675247193\n",
      "   -0.3398 if cp<=-0.03281810283660889\n",
      "   -0.4487 if cp<=-0.016987614147365094 & cp>=-0.06014373525977135\n",
      "Run episode 66 with rewards 10.0\n",
      "============ 67 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.4619 if pa>=-0.03507629930973053\n",
      "   +1.4583 if cp>=-0.05546507090330124 & pa>=-0.06270171254873275\n",
      "   +1.4619 if \n",
      "   -0.0062 if cp<=-0.08088618963956833\n",
      "   +0.2172 if cp<=0.017213637568056588\n",
      "--------------\n",
      "   -0.0416 if cp<=-0.023953026533126826\n",
      "   -0.1612 if cp<=0.00044456378091127687\n",
      "   -0.0416 if cp<=-0.03281810283660889\n",
      "   -0.0755 if cp<=-0.016987614147365094 & cp>=-0.06014373525977135\n",
      "   -0.9162 if \n",
      "Run episode 67 with rewards 10.0\n",
      "============ 68 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.0688 if pa>=-0.03507629930973053\n",
      "   +0.7160 if cp>=-0.05546507090330124 & pa>=-0.06270171254873275\n",
      "   +1.0688 if \n",
      "   +1.0688 if cp<=0.017213637568056588\n",
      "   +0.0089 if cp<=-0.10364686846733093\n",
      "--------------\n",
      "   -0.3328 if cp<=-0.023953026533126826\n",
      "   -0.5292 if cp<=0.00044456378091127687\n",
      "   -0.3580 if cp<=-0.016987614147365094 & cp>=-0.06014373525977135\n",
      "   -0.5292 if \n",
      "   -0.0076 if cp<=-0.10364686846733093\n",
      "Run episode 68 with rewards 10.0\n",
      "============ 69 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.5721 if pa>=-0.03507629930973053\n",
      "   +0.7122 if cp>=-0.05546507090330124 & pa>=-0.06270171254873275\n",
      "   +1.1962 if \n",
      "   +1.1962 if cp<=0.017213637568056588\n",
      "   +0.1712 if cp<=-0.08009615242481231\n",
      "--------------\n",
      "   -0.6542 if cp<=-0.023953026533126826\n",
      "   -0.6542 if cp<=0.00044456378091127687\n",
      "   -0.4899 if cp<=-0.016987614147365094 & cp>=-0.06014373525977135\n",
      "   -0.6542 if \n",
      "   -0.0040 if cp<=-0.11948426961898803\n",
      "Run episode 69 with rewards 9.0\n",
      "============ 70 ===========\n",
      "15 actions [1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +0.7636 if pa>=-0.03507629930973053\n",
      "   +0.5229 if cp>=-0.05546507090330124 & pa>=-0.06270171254873275\n",
      "   +0.7636 if \n",
      "   +0.7636 if cp<=0.017213637568056588\n",
      "   +0.0175 if cp<=-0.09535319209098816\n",
      "--------------\n",
      "   -0.5303 if cp<=-0.023953026533126826\n",
      "   -0.5303 if cp<=0.00044456378091127687\n",
      "   -0.3636 if cp<=-0.016987614147365094 & cp>=-0.06014373525977135\n",
      "   -0.5303 if \n",
      "   -0.0110 if cp<=-0.09535319209098816\n",
      "Run episode 70 with rewards 15.0\n",
      "============ 71 ===========\n",
      "15 actions [1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.0000 if pa>=-0.03507629930973053\n",
      "   -2.2086 if cp>=-0.05546507090330124 & pa>=-0.06270171254873275\n",
      "   +0.7129 if \n",
      "   +0.0000 if cp<=0.017213637568056588\n",
      "   -3.6713 if cp>=0.02455488555133343 & cv<=0.2264780580997467 & cv<=0.41638695597648623\n",
      "--------------\n",
      "   -0.0000 if cp<=-0.023953026533126826\n",
      "   -0.0000 if cp<=0.00044456378091127687\n",
      "   -0.0000 if cp<=-0.016987614147365094 & cp>=-0.06014373525977135\n",
      "   +2.1017 if \n",
      "   -4.0313 if cp<=0.08438727706670762 & cv>=0.41638695597648623\n",
      "Run episode 71 with rewards 15.0\n",
      "============ 72 ===========\n",
      "13 actions [1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -1.1340 if pa>=-0.03507629930973053\n",
      "   -0.5610 if cp>=-0.05546507090330124 & pa>=-0.06270171254873275\n",
      "   -0.0842 if \n",
      "   +0.0000 if cp>=0.02455488555133343 & cv<=0.2264780580997467 & cv<=0.41638695597648623\n",
      "   +2.6348 if cp<=0.012162026017904289 & cv>=0.4613985836505894\n",
      "--------------\n",
      "   +0.7838 if cp<=-0.023953026533126826\n",
      "   -0.4587 if cp<=0.00044456378091127687\n",
      "   +2.8765 if \n",
      "   -6.4339 if cp<=0.08438727706670762 & cv>=0.41638695597648623\n",
      "   -0.4726 if cp>=0.012162026017904289 & cv>=0.4613985836505894\n",
      "Run episode 72 with rewards 13.0\n",
      "============ 73 ===========\n",
      "17 actions [1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0]\n",
      "   -0.5162 if pa>=-0.03507629930973053\n",
      "   -0.0678 if cp>=-0.05546507090330124 & pa>=-0.06270171254873275\n",
      "   -0.4432 if \n",
      "   +1.0525 if cp<=0.012162026017904289 & cv>=0.4613985836505894\n",
      "   -1.1076 if cv<=0.3584016978740692\n",
      "--------------\n",
      "   +0.0089 if cp<=-0.023953026533126826\n",
      "   +1.7337 if \n",
      "   -3.0548 if cp<=0.08438727706670762 & cv>=0.41638695597648623\n",
      "   -1.1865 if cp>=0.012162026017904289 & cv>=0.4613985836505894\n",
      "   +1.6638 if cv<=0.3584016978740692\n",
      "Run episode 73 with rewards 17.0\n",
      "============ 74 ===========\n",
      "20 actions [1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0]\n",
      "   +0.8700 if pa>=-0.03507629930973053\n",
      "   -0.1030 if \n",
      "   +1.7013 if cp<=0.012162026017904289 & cv>=0.4613985836505894\n",
      "   -2.0830 if cv<=0.3584016978740692\n",
      "   -2.2046 if cp>=0.08152554333209992\n",
      "--------------\n",
      "   +0.3542 if \n",
      "   -2.9258 if cp<=0.08438727706670762 & cv>=0.41638695597648623\n",
      "   -1.0236 if cp>=0.012162026017904289 & cv>=0.4613985836505894\n",
      "   +2.3405 if cv<=0.3584016978740692\n",
      "   +2.7971 if cp>=0.08152554333209992\n",
      "Run episode 74 with rewards 20.0\n",
      "============ 75 ===========\n",
      "13 actions [1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1]\n",
      "   +2.3104 if pa>=-0.03507629930973053\n",
      "   +1.0050 if cp<=0.012162026017904289 & cv>=0.4613985836505894\n",
      "   -0.7035 if cv<=0.3584016978740692\n",
      "   +0.0000 if cp>=0.08152554333209992\n",
      "   -4.4202 if cv<=0.37220085859298707\n",
      "--------------\n",
      "   -2.1485 if cp<=0.08438727706670762 & cv>=0.41638695597648623\n",
      "   -0.9678 if cp>=0.012162026017904289 & cv>=0.4613985836505894\n",
      "   +0.7456 if cv<=0.3584016978740692\n",
      "   +0.0000 if cp>=0.08152554333209992\n",
      "   +3.5379 if cv<=0.37220085859298707\n",
      "Run episode 75 with rewards 13.0\n",
      "============ 76 ===========\n",
      "13 actions [1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -0.3425 if pa>=-0.03507629930973053\n",
      "   +0.0000 if cp<=0.012162026017904289 & cv>=0.4613985836505894\n",
      "   -0.4406 if cv<=0.3584016978740692\n",
      "   -2.0901 if cv<=0.37220085859298707\n",
      "   +1.7738 if \n",
      "--------------\n",
      "   -1.2282 if cp<=0.08438727706670762 & cv>=0.41638695597648623\n",
      "   -2.5046 if cp>=0.012162026017904289 & cv>=0.4613985836505894\n",
      "   +1.0564 if cv<=0.3584016978740692\n",
      "   +1.6938 if cv<=0.37220085859298707\n",
      "   -1.2959 if cv<=0.37546820044517515\n",
      "Run episode 76 with rewards 13.0\n",
      "============ 77 ===========\n",
      "28 actions [1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -1.5422 if pa>=-0.03507629930973053\n",
      "   -1.4377 if cv<=0.3584016978740692\n",
      "   -1.4377 if cv<=0.37220085859298707\n",
      "   +1.6401 if \n",
      "   +4.3277 if cp<=-0.019311948493123048 & cp>=-0.03972508609294891 & cv<=0.34599844217300413\n",
      "--------------\n",
      "   -0.5963 if cp<=0.08438727706670762 & cv>=0.41638695597648623\n",
      "   -0.0373 if cp>=0.012162026017904289 & cv>=0.4613985836505894\n",
      "   +1.2452 if cv<=0.37220085859298707\n",
      "   +1.2452 if cv<=0.37546820044517515\n",
      "   -2.2439 if cp>=-0.03972508609294891\n",
      "Run episode 77 with rewards 28.0\n",
      "============ 78 ===========\n",
      "53 actions [1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0]\n",
      "   -0.8298 if pa>=-0.03507629930973053\n",
      "   -2.1716 if cv<=0.3584016978740692\n",
      "   +1.6073 if \n",
      "   +6.0002 if cp<=-0.019311948493123048 & cp>=-0.03972508609294891 & cv<=0.34599844217300413\n",
      "   -3.8335 if cp<=-0.03428530767560005\n",
      "--------------\n",
      "   +2.6226 if cp<=0.08438727706670762 & cv>=0.41638695597648623\n",
      "   +2.1711 if cv<=0.37220085859298707\n",
      "   +1.9661 if cv<=0.37546820044517515\n",
      "   -3.1675 if cp>=-0.03972508609294891\n",
      "   -1.8881 if cp>=-0.03428530767560005\n",
      "Run episode 78 with rewards 53.0\n",
      "============ 79 ===========\n",
      "23 actions [0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.3892 if cv<=0.3584016978740692\n",
      "   -0.6260 if \n",
      "   +3.6924 if cp<=-0.019311948493123048 & cp>=-0.03972508609294891 & cv<=0.34599844217300413\n",
      "   -2.3702 if cp<=-0.03428530767560005\n",
      "   -2.6381 if cp<=0.07462580204010011 & cv<=0.19549628496170043\n",
      "--------------\n",
      "   +3.2675 if cp<=0.08438727706670762 & cv>=0.41638695597648623\n",
      "   +1.5766 if cv<=0.37220085859298707\n",
      "   +1.5767 if cv<=0.37546820044517515\n",
      "   -3.5097 if cp>=-0.03972508609294891\n",
      "   -0.7660 if cv<=0.0010787582723423856\n",
      "Run episode 79 with rewards 23.0\n",
      "============ 80 ===========\n",
      "34 actions [0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1]\n",
      "   +0.0598 if cv<=0.3584016978740692\n",
      "   +3.8311 if cp<=-0.019311948493123048 & cp>=-0.03972508609294891 & cv<=0.34599844217300413\n",
      "   -6.0274 if cp<=-0.03428530767560005\n",
      "   -2.1999 if cp<=0.07462580204010011 & cv<=0.19549628496170043\n",
      "   -5.1922 if pav>=0.5754271745681763\n",
      "--------------\n",
      "   +0.6818 if cp<=0.08438727706670762 & cv>=0.41638695597648623\n",
      "   +0.7372 if cv<=0.37220085859298707\n",
      "   +0.7372 if cv<=0.37546820044517515\n",
      "   -1.1793 if cp>=-0.03972508609294891\n",
      "   +4.1448 if pav>=0.5754271745681763\n",
      "Run episode 80 with rewards 34.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 81 ===========\n",
      "37 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0]\n",
      "   +6.1523 if cp<=-0.019311948493123048 & cp>=-0.03972508609294891 & cv<=0.34599844217300413\n",
      "   -6.2747 if cp<=-0.03428530767560005\n",
      "   -2.5811 if cp<=0.07462580204010011 & cv<=0.19549628496170043\n",
      "   -2.6593 if pav>=0.5754271745681763\n",
      "   +3.2763 if pa>=0.011727696284651756\n",
      "--------------\n",
      "   +1.1906 if cv<=0.37220085859298707\n",
      "   +1.1906 if cv<=0.37546820044517515\n",
      "   -1.6333 if cp>=-0.03972508609294891\n",
      "   +2.6678 if pav>=0.5754271745681763\n",
      "   -3.4328 if cp<=-0.024268984422087664 & cv<=0.23797347545623784\n",
      "Run episode 81 with rewards 37.0\n",
      "============ 82 ===========\n",
      "22 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0]\n",
      "   +2.7543 if cp<=-0.019311948493123048 & cp>=-0.03972508609294891 & cv<=0.34599844217300413\n",
      "   -2.0133 if cp<=-0.03428530767560005\n",
      "   +1.2102 if pav>=0.5754271745681763\n",
      "   +1.9482 if pa>=0.011727696284651756\n",
      "   -5.1421 if cp<=-0.03897182270884514 & pav>=-0.4377006351947784\n",
      "--------------\n",
      "   +2.5164 if cv<=0.37546820044517515\n",
      "   -1.1596 if cp>=-0.03972508609294891\n",
      "   -3.8977 if pav>=0.5754271745681763\n",
      "   -2.2939 if cp<=-0.024268984422087664 & cv<=0.23797347545623784\n",
      "   -5.5812 if cp<=-0.007167091127485037 & cp<=-0.03897182270884514 & cv>=0.42185771465301514\n",
      "Run episode 82 with rewards 22.0\n",
      "============ 83 ===========\n",
      "21 actions [0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0]\n",
      "   +3.1230 if cp<=-0.019311948493123048 & cp>=-0.03972508609294891 & cv<=0.34599844217300413\n",
      "   -3.3014 if cp<=-0.03428530767560005\n",
      "   -0.0527 if pa>=0.011727696284651756\n",
      "   -3.2302 if cp<=-0.03897182270884514 & pav>=-0.4377006351947784\n",
      "   +1.4256 if cp<=0.025132893398404126 & cp>=-0.03532056137919426 & cv>=0.36738150119781493\n",
      "--------------\n",
      "   +0.5012 if cv<=0.37546820044517515\n",
      "   +0.3483 if pav>=0.5754271745681763\n",
      "   -1.7336 if cp<=-0.024268984422087664 & cv<=0.23797347545623784\n",
      "   -4.1279 if cp<=-0.007167091127485037 & cp<=-0.03897182270884514 & cv>=0.42185771465301514\n",
      "   -3.1367 if cp<=0.025132893398404126 & pav<=-0.9723165988922119\n",
      "Run episode 83 with rewards 21.0\n",
      "============ 84 ===========\n",
      "10 actions [1, 1, 1, 0, 1, 1, 1, 1, 1, 0]\n",
      "   +0.0000 if cp<=-0.019311948493123048 & cp>=-0.03972508609294891 & cv<=0.34599844217300413\n",
      "   +0.0000 if cp<=-0.03428530767560005\n",
      "   +0.0000 if cp<=-0.03897182270884514 & pav>=-0.4377006351947784\n",
      "   +3.1518 if cp<=0.025132893398404126 & cp>=-0.03532056137919426 & cv>=0.36738150119781493\n",
      "   +3.2388 if pa>=0.05128761753439903\n",
      "--------------\n",
      "   +1.6028 if cv<=0.37546820044517515\n",
      "   +0.0000 if cp<=-0.024268984422087664 & cv<=0.23797347545623784\n",
      "   +0.0000 if cp<=-0.007167091127485037 & cp<=-0.03897182270884514 & cv>=0.42185771465301514\n",
      "   +0.0000 if cp<=0.025132893398404126 & pav<=-0.9723165988922119\n",
      "   -4.1316 if pa>=0.05128761753439903\n",
      "Run episode 84 with rewards 10.0\n",
      "============ 85 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1]\n",
      "   -0.0000 if cp<=-0.03428530767560005\n",
      "   -0.0000 if cp<=-0.03897182270884514 & pav>=-0.4377006351947784\n",
      "   +2.5899 if cp<=0.025132893398404126 & cp>=-0.03532056137919426 & cv>=0.36738150119781493\n",
      "   -0.0000 if pa>=0.05128761753439903\n",
      "   -2.1843 if cp<=0.07196499407291412\n",
      "--------------\n",
      "   +4.7173 if cv<=0.37546820044517515\n",
      "   +0.0000 if cp<=-0.007167091127485037 & cp<=-0.03897182270884514 & cv>=0.42185771465301514\n",
      "   +0.0000 if cp<=0.025132893398404126 & pav<=-0.9723165988922119\n",
      "   +0.0000 if pa>=0.05128761753439903\n",
      "   +2.4530 if cp<=0.07196499407291412 & cp>=0.029426610469818117 & cv>=0.4899545907974243\n",
      "Run episode 85 with rewards 11.0\n",
      "============ 86 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp<=-0.03428530767560005\n",
      "   -0.0000 if cp<=0.025132893398404126 & cp>=-0.03532056137919426 & cv>=0.36738150119781493\n",
      "   -0.0000 if pa>=0.05128761753439903\n",
      "   -2.4953 if cp<=0.07196499407291412\n",
      "   +1.8281 if cp<=0.08293555676937105 & cv>=0.9657369256019595\n",
      "--------------\n",
      "   +1.5172 if cv<=0.37546820044517515\n",
      "   +0.0000 if cp<=-0.007167091127485037 & cp<=-0.03897182270884514 & cv>=0.42185771465301514\n",
      "   +0.0000 if pa>=0.05128761753439903\n",
      "   +0.5136 if cp<=0.07196499407291412 & cp>=0.029426610469818117 & cv>=0.4899545907974243\n",
      "   +2.0509 if cp>=0.02917221374809742 & cv<=0.9657369256019595\n",
      "Run episode 86 with rewards 8.0\n",
      "============ 87 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2909 if cp<=0.025132893398404126 & cp>=-0.03532056137919426 & cv>=0.36738150119781493\n",
      "   -0.0000 if pa>=0.05128761753439903\n",
      "   -2.0204 if cp<=0.07196499407291412\n",
      "   -0.3444 if cp<=0.08293555676937105 & cv>=0.9657369256019595\n",
      "   -0.8283 if cp<=-0.016420724242925643\n",
      "--------------\n",
      "   +1.1420 if cv<=0.37546820044517515\n",
      "   +0.0000 if pa>=0.05128761753439903\n",
      "   +0.6685 if cp<=0.07196499407291412 & cp>=0.029426610469818117 & cv>=0.4899545907974243\n",
      "   +0.0000 if cp>=0.02917221374809742 & cv<=0.9657369256019595\n",
      "   +1.4806 if cp<=0.025653280317783366 & cp>=-0.025705167278647422\n",
      "Run episode 87 with rewards 10.0\n",
      "============ 88 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   -0.8901 if cp<=0.025132893398404126 & cp>=-0.03532056137919426 & cv>=0.36738150119781493\n",
      "   -1.8930 if cp<=0.07196499407291412\n",
      "   -0.6449 if cp<=0.08293555676937105 & cv>=0.9657369256019595\n",
      "   -0.5480 if cp<=-0.016420724242925643\n",
      "   -0.7889 if cp>=0.06150437146425248\n",
      "--------------\n",
      "   +0.5574 if cv<=0.37546820044517515\n",
      "   +0.3726 if cp<=0.07196499407291412 & cp>=0.029426610469818117 & cv>=0.4899545907974243\n",
      "   +0.0000 if cp>=0.02917221374809742 & cv<=0.9657369256019595\n",
      "   +1.2109 if cp<=0.025653280317783366 & cp>=-0.025705167278647422\n",
      "   +1.0347 if cp>=0.021337078884243972\n",
      "Run episode 88 with rewards 9.0\n",
      "============ 89 ===========\n",
      "14 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   -0.2037 if cp<=0.025132893398404126 & cp>=-0.03532056137919426 & cv>=0.36738150119781493\n",
      "   -2.1459 if cp<=0.07196499407291412\n",
      "   -1.0449 if cp<=0.08293555676937105 & cv>=0.9657369256019595\n",
      "   +0.2769 if cp>=0.06150437146425248\n",
      "   +1.2198 if cv>=1.3850103616714478\n",
      "--------------\n",
      "   +0.9318 if cv<=0.37546820044517515\n",
      "   +1.0432 if cp<=0.07196499407291412 & cp>=0.029426610469818117 & cv>=0.4899545907974243\n",
      "   +1.1536 if cp<=0.025653280317783366 & cp>=-0.025705167278647422\n",
      "   +0.5724 if cp>=0.021337078884243972\n",
      "   -1.4826 if cv>=1.3850103616714478\n",
      "Run episode 89 with rewards 14.0\n",
      "============ 90 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -3.1439 if cp<=0.07196499407291412\n",
      "   -1.0076 if cp<=0.08293555676937105 & cv>=0.9657369256019595\n",
      "   +2.5600 if cp>=0.06150437146425248\n",
      "   +0.0000 if cv>=1.3850103616714478\n",
      "   -1.5261 if cp>=0.12545117288827898\n",
      "--------------\n",
      "   +1.6963 if cv<=0.37546820044517515\n",
      "   +1.6382 if cp<=0.07196499407291412 & cp>=0.029426610469818117 & cv>=0.4899545907974243\n",
      "   +0.0000 if cp<=0.025653280317783366 & cp>=-0.025705167278647422\n",
      "   +0.0000 if cv>=1.3850103616714478\n",
      "   -2.4928 if cp<=0.12545117288827898 & cv>=0.9686972737312317\n",
      "Run episode 90 with rewards 8.0\n",
      "============ 91 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.7412 if cp<=0.07196499407291412\n",
      "   -0.6766 if cp<=0.08293555676937105 & cv>=0.9657369256019595\n",
      "   -0.2176 if cp>=0.06150437146425248\n",
      "   +0.0000 if cp>=0.12545117288827898\n",
      "   -0.5907 if cp<=0.017253958061337473 & cp>=0.007408408727496863\n",
      "--------------\n",
      "   +0.4411 if cv<=0.37546820044517515\n",
      "   +0.4295 if cp<=0.07196499407291412 & cp>=0.029426610469818117 & cv>=0.4899545907974243\n",
      "   +0.0291 if cv>=1.3850103616714478\n",
      "   +0.3555 if cp<=0.12545117288827898 & cv>=0.9686972737312317\n",
      "   +1.0169 if cp<=0.03493259623646738\n",
      "Run episode 91 with rewards 9.0\n",
      "============ 92 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -2.5375 if cp<=0.07196499407291412\n",
      "   -0.6959 if cp<=0.08293555676937105 & cv>=0.9657369256019595\n",
      "   -0.4171 if cp>=0.06150437146425248\n",
      "   -0.2848 if cp<=0.017253958061337473 & cp>=0.007408408727496863\n",
      "   +0.1620 if cp>=0.09996415674686432\n",
      "--------------\n",
      "   +0.5022 if cv<=0.37546820044517515\n",
      "   +0.2305 if cp<=0.07196499407291412 & cp>=0.029426610469818117 & cv>=0.4899545907974243\n",
      "   +0.5310 if cp<=0.12545117288827898 & cv>=0.9686972737312317\n",
      "   +1.3614 if cp<=0.03493259623646738\n",
      "   -0.1683 if cp>=0.09996415674686432\n",
      "Run episode 92 with rewards 8.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 93 ===========\n",
      "14 actions [0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1]\n",
      "   -2.0919 if cp<=0.07196499407291412\n",
      "   -0.0900 if cp<=0.08293555676937105 & cv>=0.9657369256019595\n",
      "   -0.6269 if cp>=0.06150437146425248\n",
      "   +0.0000 if cp<=0.017253958061337473 & cp>=0.007408408727496863\n",
      "   -1.2685 if cp>=0.04030550643801689\n",
      "--------------\n",
      "   +0.6286 if cv<=0.37546820044517515\n",
      "   +0.8533 if cp<=0.07196499407291412 & cp>=0.029426610469818117 & cv>=0.4899545907974243\n",
      "   +0.9200 if cp<=0.12545117288827898 & cv>=0.9686972737312317\n",
      "   +1.0777 if cp<=0.03493259623646738\n",
      "   +0.2420 if cp>=0.11146552860736847\n",
      "Run episode 93 with rewards 14.0\n",
      "============ 94 ===========\n",
      "13 actions [0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +1.0409 if cp<=0.07196499407291412\n",
      "   -1.3543 if cp<=0.08293555676937105 & cv>=0.9657369256019595\n",
      "   -0.5415 if cp>=0.06150437146425248\n",
      "   -0.5414 if cp>=0.04030550643801689\n",
      "   -3.3317 if cv<=0.8927881121635438 & cv>=0.07630051970481874\n",
      "--------------\n",
      "   -1.2181 if cv<=0.37546820044517515\n",
      "   +0.4257 if cp<=0.07196499407291412 & cp>=0.029426610469818117 & cv>=0.4899545907974243\n",
      "   +0.5970 if cp<=0.12545117288827898 & cv>=0.9686972737312317\n",
      "   -0.7282 if cp<=0.03493259623646738\n",
      "   +3.2379 if cp<=-0.043973684310913086\n",
      "Run episode 94 with rewards 13.0\n",
      "============ 95 ===========\n",
      "41 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1]\n",
      "   +1.2670 if cp<=0.07196499407291412\n",
      "   -0.0000 if cp<=0.08293555676937105 & cv>=0.9657369256019595\n",
      "   -0.0000 if cp>=0.06150437146425248\n",
      "   -0.0000 if cv<=0.8927881121635438 & cv>=0.07630051970481874\n",
      "   -3.0855 if cp<=-0.00874435547739266 & cp>=-0.03332340233027934\n",
      "--------------\n",
      "   +0.1880 if cv<=0.37546820044517515\n",
      "   -0.0000 if cp<=0.12545117288827898 & cv>=0.9686972737312317\n",
      "   +0.1880 if cp<=0.03493259623646738\n",
      "   +0.6894 if cp<=-0.043973684310913086\n",
      "   -2.9143 if cp>=-0.00874435547739266\n",
      "Run episode 95 with rewards 41.0\n",
      "============ 96 ===========\n",
      "21 actions [1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1]\n",
      "   +0.9350 if cp<=0.07196499407291412\n",
      "   +0.0000 if cp<=0.08293555676937105 & cv>=0.9657369256019595\n",
      "   +0.7538 if cv<=0.8927881121635438 & cv>=0.07630051970481874\n",
      "   -5.4517 if cp<=-0.00874435547739266 & cp>=-0.03332340233027934\n",
      "   +3.9207 if cp<=-0.07428082823753356 & pav<=-0.1543794870376587\n",
      "--------------\n",
      "   -0.0156 if cv<=0.37546820044517515\n",
      "   -0.7161 if cp<=0.03493259623646738\n",
      "   +1.5713 if cp<=-0.043973684310913086\n",
      "   -4.5286 if cp>=-0.00874435547739266\n",
      "   +1.5266 if cp>=-0.07428082823753356\n",
      "Run episode 96 with rewards 21.0\n",
      "============ 97 ===========\n",
      "10 actions [0, 0, 0, 0, 1, 1, 0, 0, 0, 0]\n",
      "   +2.3012 if cp<=0.07196499407291412\n",
      "   +2.5885 if cv<=0.8927881121635438 & cv>=0.07630051970481874\n",
      "   -4.3260 if cp<=-0.00874435547739266 & cp>=-0.03332340233027934\n",
      "   -0.0000 if cp<=-0.07428082823753356 & pav<=-0.1543794870376587\n",
      "   -2.6971 if cv<=0.21153220534324646 & cv>=0.21153220534324646\n",
      "--------------\n",
      "   -0.6959 if cp<=0.03493259623646738\n",
      "   +1.2467 if cp<=-0.043973684310913086\n",
      "   -2.5385 if cp>=-0.00874435547739266\n",
      "   -0.2162 if cp>=-0.07428082823753356\n",
      "   -5.1363 if cp<=-0.02006866596639156 & pa<=0.001207590801641345\n",
      "Run episode 97 with rewards 10.0\n",
      "============ 98 ===========\n",
      "13 actions [0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   +0.6902 if cp<=0.07196499407291412\n",
      "   +0.0000 if cv<=0.8927881121635438 & cv>=0.07630051970481874\n",
      "   -3.5931 if cp<=-0.00874435547739266 & cp>=-0.03332340233027934\n",
      "   +0.0000 if cv<=0.21153220534324646 & cv>=0.21153220534324646\n",
      "   +1.4652 if cp<=-0.032809289544820784 & cp>=-0.04929647594690323\n",
      "--------------\n",
      "   -0.3974 if cp<=0.03493259623646738\n",
      "   -0.4260 if cp<=-0.043973684310913086\n",
      "   -1.9349 if cp>=-0.00874435547739266\n",
      "   +0.0000 if cp<=-0.02006866596639156 & pa<=0.001207590801641345\n",
      "   +0.7066 if cp>=-0.032809289544820784\n",
      "Run episode 98 with rewards 13.0\n",
      "============ 99 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 1, 0, 0, 0]\n",
      "   +0.5263 if cp<=0.07196499407291412\n",
      "   -2.8367 if cp<=-0.00874435547739266 & cp>=-0.03332340233027934\n",
      "   +0.0000 if cv<=0.21153220534324646 & cv>=0.21153220534324646\n",
      "   -4.0027 if cp<=-0.032809289544820784 & cp>=-0.04929647594690323\n",
      "   +1.4897 if cv>=-0.8253847479820251\n",
      "--------------\n",
      "   -1.3551 if cp<=0.03493259623646738\n",
      "   +0.3151 if cp<=-0.043973684310913086\n",
      "   -2.5575 if cp>=-0.00874435547739266\n",
      "   -1.6702 if cp>=-0.032809289544820784\n",
      "   +3.9530 if cp>=-0.048676740378141396 & cv<=-0.6312472105026246\n",
      "Run episode 99 with rewards 9.0\n",
      "============ 100 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 0, 0]\n",
      "   +0.3512 if cp<=0.07196499407291412\n",
      "   -0.2837 if cp<=-0.00874435547739266 & cp>=-0.03332340233027934\n",
      "   +0.0000 if cp<=-0.032809289544820784 & cp>=-0.04929647594690323\n",
      "   +2.5076 if cv>=-0.8253847479820251\n",
      "   -0.1133 if cp>=-0.05784094110131264\n",
      "--------------\n",
      "   -1.1137 if cp<=0.03493259623646738\n",
      "   -0.9414 if cp>=-0.00874435547739266\n",
      "   -0.4532 if cp>=-0.032809289544820784\n",
      "   +0.4882 if cp>=-0.048676740378141396 & cv<=-0.6312472105026246\n",
      "   -1.6711 if cp<=-0.007442009076476089 & cp>=-0.029108889028429983\n",
      "Run episode 100 with rewards 9.0\n",
      "============ 101 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0]\n",
      "   +0.0755 if cp<=0.07196499407291412\n",
      "   -1.4781 if cp<=-0.00874435547739266 & cp>=-0.03332340233027934\n",
      "   +1.4668 if cv>=-0.8253847479820251\n",
      "   +0.2433 if cp>=-0.05784094110131264\n",
      "   +0.9506 if cp<=-0.01059927102178335 & cv>=-1.054683792591095\n",
      "--------------\n",
      "   -1.0260 if cp<=0.03493259623646738\n",
      "   -0.9375 if cp>=-0.00874435547739266\n",
      "   +0.2762 if cp>=-0.048676740378141396 & cv<=-0.6312472105026246\n",
      "   -1.2173 if cp<=-0.007442009076476089 & cp>=-0.029108889028429983\n",
      "   +1.6478 if cp>=-0.04258006438612938 & cv<=-1.054683792591095\n",
      "Run episode 101 with rewards 11.0\n",
      "============ 102 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -1.5821 if cp<=-0.00874435547739266 & cp>=-0.03332340233027934\n",
      "   +1.4585 if cv>=-0.8253847479820251\n",
      "   +0.1870 if cp>=-0.05784094110131264\n",
      "   +1.2605 if cp<=-0.01059927102178335 & cv>=-1.054683792591095\n",
      "   +0.9300 if cp>=-0.07507374882698059\n",
      "--------------\n",
      "   -1.6771 if cp<=0.03493259623646738\n",
      "   -1.2150 if cp>=-0.00874435547739266\n",
      "   -1.1190 if cp<=-0.007442009076476089 & cp>=-0.029108889028429983\n",
      "   +2.1068 if cp>=-0.04258006438612938 & cv<=-1.054683792591095\n",
      "   +0.2591 if pa>=0.17608387768268585\n",
      "Run episode 102 with rewards 8.0\n",
      "============ 103 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cp<=-0.00874435547739266 & cp>=-0.03332340233027934\n",
      "   +0.8582 if cv>=-0.8253847479820251\n",
      "   +1.1939 if cp<=-0.01059927102178335 & cv>=-1.054683792591095\n",
      "   +0.8582 if cp>=-0.07507374882698059\n",
      "   -0.2814 if pa>=0.18360260128974915\n",
      "--------------\n",
      "   -1.2492 if cp<=0.03493259623646738\n",
      "   +0.0000 if cp>=-0.00874435547739266\n",
      "   +0.0000 if cp<=-0.007442009076476089 & cp>=-0.029108889028429983\n",
      "   +0.0000 if cp>=-0.04258006438612938 & cv<=-1.054683792591095\n",
      "   +0.3303 if pa>=0.18360260128974915\n",
      "Run episode 103 with rewards 8.0\n",
      "============ 104 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.7494 if cv>=-0.8253847479820251\n",
      "   +0.0000 if cp<=-0.01059927102178335 & cv>=-1.054683792591095\n",
      "   +1.9470 if cp>=-0.07507374882698059\n",
      "   +0.0000 if pa>=0.18360260128974915\n",
      "   +0.4533 if cp<=0.036857610195875176\n",
      "--------------\n",
      "   -0.5404 if cp<=0.03493259623646738\n",
      "   -2.0429 if cp>=-0.00874435547739266\n",
      "   -0.2115 if cp>=-0.04258006438612938 & cv<=-1.054683792591095\n",
      "   -0.0000 if pa>=0.18360260128974915\n",
      "   +0.2235 if pa>=0.1800243854522705\n",
      "Run episode 104 with rewards 10.0\n",
      "============ 105 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.4307 if cv>=-0.8253847479820251\n",
      "   +0.3750 if cp<=-0.01059927102178335 & cv>=-1.054683792591095\n",
      "   +1.4234 if cp>=-0.07507374882698059\n",
      "   +1.1582 if cp<=0.036857610195875176\n",
      "   -0.5441 if pa>=0.20821206271648407\n",
      "--------------\n",
      "   -0.8517 if cp<=0.03493259623646738\n",
      "   -0.3167 if cp>=-0.00874435547739266\n",
      "   -0.0000 if cp>=-0.04258006438612938 & cv<=-1.054683792591095\n",
      "   +0.6639 if pa>=0.1800243854522705\n",
      "   -0.5858 if cp>=-0.030966914817690847\n",
      "Run episode 105 with rewards 9.0\n",
      "============ 106 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7763 if cv>=-0.8253847479820251\n",
      "   +1.3302 if cp>=-0.07507374882698059\n",
      "   +1.1022 if cp<=0.036857610195875176\n",
      "   -0.0000 if pa>=0.20821206271648407\n",
      "   -0.4941 if pa>=0.20813114941120148\n",
      "--------------\n",
      "   -0.9409 if cp<=0.03493259623646738\n",
      "   -0.3459 if cp>=-0.00874435547739266\n",
      "   +0.2085 if pa>=0.1800243854522705\n",
      "   -0.5590 if cp>=-0.030966914817690847\n",
      "   -0.4608 if cp>=-0.012142494320869437\n",
      "Run episode 106 with rewards 10.0\n",
      "============ 107 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.6017 if cv>=-0.8253847479820251\n",
      "   +0.7797 if cp>=-0.07507374882698059\n",
      "   +1.3625 if cp<=0.036857610195875176\n",
      "   -0.0000 if pa>=0.20813114941120148\n",
      "   +1.4206 if cp>=-0.14176995158195496\n",
      "--------------\n",
      "   -1.6266 if cp<=0.03493259623646738\n",
      "   +0.0000 if cp>=-0.00874435547739266\n",
      "   +0.0000 if cp>=-0.030966914817690847\n",
      "   +0.0000 if cp>=-0.012142494320869437\n",
      "   -0.8540 if cp<=-0.06979367882013321 & cp>=-0.14176995158195496\n",
      "Run episode 107 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 108 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.1549 if cv>=-0.8253847479820251\n",
      "   +1.4024 if cp>=-0.07507374882698059\n",
      "   +0.3189 if cp<=0.036857610195875176\n",
      "   +1.3725 if cp>=-0.14176995158195496\n",
      "   +0.6032 if cp>=0.03958725780248642\n",
      "--------------\n",
      "   -0.2401 if cp<=0.03493259623646738\n",
      "   -0.9521 if cp>=-0.030966914817690847\n",
      "   -0.8834 if cp>=-0.012142494320869437\n",
      "   +0.0493 if cp<=-0.06979367882013321 & cp>=-0.14176995158195496\n",
      "   -0.1246 if cp<=-0.007028314238414166\n",
      "Run episode 108 with rewards 9.0\n",
      "============ 109 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7191 if cv>=-0.8253847479820251\n",
      "   +0.9919 if cp>=-0.07507374882698059\n",
      "   +0.9919 if cp>=-0.14176995158195496\n",
      "   +0.4704 if cp>=0.03958725780248642\n",
      "   -0.1616 if pa>=0.2093908190727234\n",
      "--------------\n",
      "   -0.2421 if cp<=0.03493259623646738\n",
      "   -0.4349 if cp>=-0.030966914817690847\n",
      "   -0.4349 if cp>=-0.012142494320869437\n",
      "   -0.0629 if cp<=-0.007028314238414166\n",
      "   -0.4460 if \n",
      "Run episode 109 with rewards 10.0\n",
      "============ 110 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7397 if cv>=-0.8253847479820251\n",
      "   +1.4103 if cp>=-0.07507374882698059\n",
      "   +1.3439 if cp>=-0.14176995158195496\n",
      "   +0.0000 if cp>=0.03958725780248642\n",
      "   -0.2648 if pa>=0.18037763237953186\n",
      "--------------\n",
      "   -0.9107 if cp<=0.03493259623646738\n",
      "   -0.5979 if cp>=-0.030966914817690847\n",
      "   -0.4435 if cp>=-0.012142494320869437\n",
      "   -0.9107 if \n",
      "   +0.0060 if cp<=-0.06628662347793579\n",
      "Run episode 110 with rewards 9.0\n",
      "============ 111 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.6231 if cv>=-0.8253847479820251\n",
      "   +0.6231 if cp>=-0.07507374882698059\n",
      "   +1.0626 if cp>=-0.14176995158195496\n",
      "   +0.0000 if pa>=0.18037763237953186\n",
      "   +0.9491 if cp>=-0.11268960684537888\n",
      "--------------\n",
      "   -0.9127 if cp<=0.03493259623646738\n",
      "   +0.0000 if cp>=-0.030966914817690847\n",
      "   +0.0000 if cp>=-0.012142494320869437\n",
      "   -0.9127 if \n",
      "   +0.2807 if pa>=0.17165899276733398\n",
      "Run episode 111 with rewards 9.0\n",
      "============ 112 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.6342 if cv>=-0.8253847479820251\n",
      "   +0.8680 if cp>=-0.07507374882698059\n",
      "   +0.8016 if cp>=-0.14176995158195496\n",
      "   +0.8016 if cp>=-0.11268960684537888\n",
      "   +0.2758 if cp>=0.016430372744798662\n",
      "--------------\n",
      "   -0.6953 if cp<=0.03493259623646738\n",
      "   -0.6111 if cp>=-0.030966914817690847\n",
      "   -0.6953 if \n",
      "   +0.0557 if pa>=0.17165899276733398\n",
      "   +0.0179 if cp<=-0.05123436450958252\n",
      "Run episode 112 with rewards 10.0\n",
      "origin 0.6571397557119494 new 0.6730435896150799 not updated\n",
      "============ 113 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.6342 if cv>=-0.8253847479820251\n",
      "   +0.8680 if cp>=-0.07507374882698059\n",
      "   +0.8016 if cp>=-0.14176995158195496\n",
      "   +0.8016 if cp>=-0.11268960684537888\n",
      "   +0.2758 if cp>=0.016430372744798662\n",
      "--------------\n",
      "   -0.7615 if cp<=0.03493259623646738\n",
      "   -0.6796 if cp>=-0.030966914817690847\n",
      "   -0.7615 if \n",
      "   +0.0920 if pa>=0.17165899276733398\n",
      "   +0.0168 if cp<=-0.05858030319213867\n",
      "Run episode 113 with rewards 9.0\n",
      "origin 0.6472829106221999 new 0.6937556682600338 not updated\n",
      "============ 114 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.6342 if cv>=-0.8253847479820251\n",
      "   +0.8680 if cp>=-0.07507374882698059\n",
      "   +0.8016 if cp>=-0.14176995158195496\n",
      "   +0.8016 if cp>=-0.11268960684537888\n",
      "   +0.2758 if cp>=0.016430372744798662\n",
      "--------------\n",
      "   -0.2635 if cp<=0.03493259623646738\n",
      "   -0.7938 if cp>=-0.030966914817690847\n",
      "   -0.8056 if \n",
      "   +0.0478 if pa>=0.17165899276733398\n",
      "   -0.2504 if cp<=0.0455742858350277 & cp>=0.010792110674083236\n",
      "Run episode 114 with rewards 10.0\n",
      "============ 115 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.5030 if cv>=-0.8253847479820251\n",
      "   +0.9262 if cp>=-0.07507374882698059\n",
      "   +0.7523 if cp>=-0.14176995158195496\n",
      "   +1.0238 if cp>=-0.11268960684537888\n",
      "   +0.3221 if cp<=0.026951509714126586 & cp>=-0.01956425309181213\n",
      "--------------\n",
      "   -0.7281 if cp<=0.03493259623646738\n",
      "   -0.5625 if cp>=-0.030966914817690847\n",
      "   -0.7281 if \n",
      "   -0.3249 if cp<=0.0455742858350277 & cp>=0.010792110674083236\n",
      "   +0.1159 if cp<=-0.06154061257839203\n",
      "Run episode 115 with rewards 9.0\n",
      "============ 116 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.3246 if cv>=-0.8253847479820251\n",
      "   +0.3916 if cp>=-0.07507374882698059\n",
      "   +2.1339 if cp>=-0.14176995158195496\n",
      "   +0.4973 if cp>=-0.11268960684537888\n",
      "   +0.4593 if cp>=-0.08546641319990159\n",
      "--------------\n",
      "   -1.7954 if cp<=0.03493259623646738\n",
      "   -0.0680 if cp>=-0.030966914817690847\n",
      "   -1.7954 if \n",
      "   +0.0000 if cp<=0.0455742858350277 & cp>=0.010792110674083236\n",
      "   -0.1201 if cp>=-0.08546641319990159\n",
      "Run episode 116 with rewards 9.0\n",
      "============ 117 ===========\n",
      "10 actions [0, 0, 0, 1, 0, 0, 0, 0, 0, 1]\n",
      "   +0.4109 if cp>=-0.07507374882698059\n",
      "   +0.4067 if cp>=-0.14176995158195496\n",
      "   +0.4358 if cp>=-0.11268960684537888\n",
      "   +0.4109 if cp>=-0.08546641319990159\n",
      "   +0.2841 if cp>=-0.016958585008978837\n",
      "--------------\n",
      "   -0.4662 if cp<=0.03493259623646738\n",
      "   -0.3721 if cp>=-0.030966914817690847\n",
      "   -0.4662 if \n",
      "   -0.4852 if cp>=-0.08546641319990159\n",
      "   +0.0773 if pa>=0.1698560267686844\n",
      "Run episode 117 with rewards 10.0\n",
      "============ 118 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.1952 if cp>=-0.07507374882698059\n",
      "   +0.9895 if cp>=-0.14176995158195496\n",
      "   +0.9895 if cp>=-0.11268960684537888\n",
      "   -0.1952 if cp>=-0.08546641319990159\n",
      "   -4.5805 if cp>=-0.004374532029032703 & cv<=-0.5309064149856567\n",
      "--------------\n",
      "   -1.0161 if cp<=0.03493259623646738\n",
      "   +0.4194 if cp>=-0.030966914817690847\n",
      "   -1.0161 if \n",
      "   +0.1711 if cp>=-0.08546641319990159\n",
      "   +4.5897 if cp>=-0.004374532029032703 & cv<=-0.5309064149856567\n",
      "Run episode 118 with rewards 8.0\n",
      "============ 119 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8761 if cp>=-0.14176995158195496\n",
      "   +0.9284 if cp>=-0.11268960684537888\n",
      "   +0.8868 if cp>=-0.08546641319990159\n",
      "   -0.0000 if cp>=-0.004374532029032703 & cv<=-0.5309064149856567\n",
      "   +0.2336 if cp<=-0.05532147362828254\n",
      "--------------\n",
      "   -1.2781 if cp<=0.03493259623646738\n",
      "   -0.0000 if cp>=-0.030966914817690847\n",
      "   -1.2781 if \n",
      "   -0.0000 if cp>=-0.004374532029032703 & cv<=-0.5309064149856567\n",
      "   -0.3175 if cp<=-0.05532147362828254\n",
      "Run episode 119 with rewards 8.0\n",
      "============ 120 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7501 if cp>=-0.14176995158195496\n",
      "   +0.7501 if cp>=-0.11268960684537888\n",
      "   +0.7501 if cp>=-0.08546641319990159\n",
      "   -0.0068 if cp<=-0.05532147362828254\n",
      "   +0.0601 if cp<=-0.019670251011848446\n",
      "--------------\n",
      "   -0.8859 if cp<=0.03493259623646738\n",
      "   -0.8859 if \n",
      "   -0.0000 if cp>=-0.004374532029032703 & cv<=-0.5309064149856567\n",
      "   +0.0076 if cp<=-0.05532147362828254\n",
      "   -0.3790 if cp<=0.0056426679715514206\n",
      "Run episode 120 with rewards 8.0\n",
      "============ 121 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8311 if cp>=-0.14176995158195496\n",
      "   +0.8311 if cp>=-0.11268960684537888\n",
      "   +0.8540 if cp>=-0.08546641319990159\n",
      "   +0.1305 if cp<=-0.019670251011848446\n",
      "   -0.0019 if cp<=-0.056292854249477386\n",
      "--------------\n",
      "   -0.8063 if cp<=0.03493259623646738\n",
      "   -0.8063 if \n",
      "   -0.0003 if cp<=-0.05532147362828254\n",
      "   -0.8063 if cp<=0.0056426679715514206\n",
      "   -0.1784 if cp<=-0.017739418707787984 & cp>=-0.033097570389509195\n",
      "Run episode 121 with rewards 9.0\n",
      "============ 122 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7479 if cp>=-0.14176995158195496\n",
      "   +0.7054 if cp>=-0.11268960684537888\n",
      "   +0.5467 if cp>=-0.08546641319990159\n",
      "   +0.6735 if cp<=-0.019670251011848446\n",
      "   +0.2427 if cp>=-0.04726159274578094\n",
      "--------------\n",
      "   -0.7957 if cp<=0.03493259623646738\n",
      "   -0.7957 if \n",
      "   -0.7957 if cp<=0.0056426679715514206\n",
      "   -0.0000 if cp<=-0.017739418707787984 & cp>=-0.033097570389509195\n",
      "   -0.1455 if cp<=-0.0822770059108734\n",
      "Run episode 122 with rewards 9.0\n",
      "============ 123 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7815 if cp>=-0.14176995158195496\n",
      "   +0.8296 if cp>=-0.11268960684537888\n",
      "   +0.8017 if cp>=-0.08546641319990159\n",
      "   +0.1747 if cp<=-0.019670251011848446\n",
      "   +0.3051 if cp>=-0.010166625119745731\n",
      "--------------\n",
      "   -0.8449 if cp<=0.03493259623646738\n",
      "   -0.8449 if \n",
      "   -0.8449 if cp<=0.0056426679715514206\n",
      "   +0.0101 if cp<=-0.0822770059108734\n",
      "   -0.0580 if cp<=-0.041710613295435905\n",
      "Run episode 123 with rewards 9.0\n",
      "============ 124 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8191 if cp>=-0.14176995158195496\n",
      "   +0.8191 if cp>=-0.11268960684537888\n",
      "   +0.8191 if cp>=-0.08546641319990159\n",
      "   +0.7145 if cp>=-0.010166625119745731\n",
      "   +0.0022 if cp<=-0.04181877672672271\n",
      "--------------\n",
      "   -0.9613 if cp<=0.03493259623646738\n",
      "   -0.9613 if \n",
      "   -0.2232 if cp<=0.0056426679715514206\n",
      "   -0.0031 if cp<=-0.041710613295435905\n",
      "   -0.3270 if cp<=0.02841019593179226 & cp>=-0.00824345368891954\n",
      "Run episode 124 with rewards 10.0\n",
      "============ 125 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7532 if cp>=-0.14176995158195496\n",
      "   +0.8401 if cp>=-0.11268960684537888\n",
      "   +0.8092 if cp>=-0.08546641319990159\n",
      "   +0.5830 if cp>=-0.010166625119745731\n",
      "   +0.2252 if cp<=0.005329220870044087\n",
      "--------------\n",
      "   -0.7820 if cp<=0.03493259623646738\n",
      "   -0.7820 if \n",
      "   -0.3248 if cp<=0.0056426679715514206\n",
      "   -0.5182 if cp<=0.02841019593179226 & cp>=-0.00824345368891954\n",
      "   -0.2333 if cp>=0.021521159261465073\n",
      "Run episode 125 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 126 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.9408 if cp>=-0.14176995158195496\n",
      "   +0.9408 if cp>=-0.11268960684537888\n",
      "   +0.9889 if cp>=-0.08546641319990159\n",
      "   +0.8514 if cp>=-0.010166625119745731\n",
      "   -0.0482 if pa>=0.18822601437568665\n",
      "--------------\n",
      "   -0.4526 if cp<=0.03493259623646738\n",
      "   -1.4190 if \n",
      "   -0.1137 if cp<=0.0056426679715514206\n",
      "   -0.1859 if cp<=0.02841019593179226 & cp>=-0.00824345368891954\n",
      "   +0.0285 if cp<=-0.04098551869392395\n",
      "Run episode 126 with rewards 10.0\n",
      "============ 127 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8297 if cp>=-0.14176995158195496\n",
      "   +0.9424 if cp>=-0.11268960684537888\n",
      "   +0.9049 if cp>=-0.08546641319990159\n",
      "   +0.5029 if cp>=-0.010166625119745731\n",
      "   +0.0562 if cp<=-0.034732059389352796\n",
      "--------------\n",
      "   -0.6806 if cp<=0.03493259623646738\n",
      "   -0.6806 if \n",
      "   -0.4374 if cp<=0.0056426679715514206\n",
      "   -0.3630 if cp<=0.02841019593179226 & cp>=-0.00824345368891954\n",
      "   -0.0488 if cp<=-0.034732059389352796\n",
      "Run episode 127 with rewards 8.0\n",
      "============ 128 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7440 if cp>=-0.14176995158195496\n",
      "   +0.7440 if cp>=-0.11268960684537888\n",
      "   +0.7440 if cp>=-0.08546641319990159\n",
      "   +0.6181 if cp>=-0.010166625119745731\n",
      "   +0.4157 if cp>=0.012907126545906077\n",
      "--------------\n",
      "   -0.6485 if cp<=0.03493259623646738\n",
      "   -0.6485 if \n",
      "   -0.1578 if cp<=0.0056426679715514206\n",
      "   -0.5456 if cp<=0.02841019593179226 & cp>=-0.00824345368891954\n",
      "   -0.1029 if cp<=-0.004839609051123257\n",
      "Run episode 128 with rewards 8.0\n",
      "origin 0.5259821562157398 new 0.5651547575079062 not updated\n",
      "============ 129 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7440 if cp>=-0.14176995158195496\n",
      "   +0.7440 if cp>=-0.11268960684537888\n",
      "   +0.7440 if cp>=-0.08546641319990159\n",
      "   +0.6181 if cp>=-0.010166625119745731\n",
      "   +0.4157 if cp>=0.012907126545906077\n",
      "--------------\n",
      "   -0.6355 if cp<=0.03493259623646738\n",
      "   -0.6355 if \n",
      "   -0.1201 if cp<=0.0056426679715514206\n",
      "   -0.5153 if cp<=0.02841019593179226 & cp>=-0.00824345368891954\n",
      "   -0.2257 if cp>=0.02653018832206726\n",
      "Run episode 129 with rewards 9.0\n",
      "============ 130 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8582 if cp>=-0.14176995158195496\n",
      "   +0.8582 if cp>=-0.11268960684537888\n",
      "   +0.9388 if cp>=-0.08546641319990159\n",
      "   +0.6445 if cp>=-0.010166625119745731\n",
      "   -0.0806 if pa>=0.19800804555416107\n",
      "--------------\n",
      "   -0.8540 if cp<=0.03493259623646738\n",
      "   -0.8540 if \n",
      "   -0.4615 if cp<=0.02841019593179226 & cp>=-0.00824345368891954\n",
      "   +0.0000 if cp>=0.02653018832206726\n",
      "   +0.0311 if cp<=-0.05458217784762382\n",
      "Run episode 130 with rewards 8.0\n",
      "============ 131 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.9362 if cp>=-0.14176995158195496\n",
      "   +0.9362 if cp>=-0.11268960684537888\n",
      "   +0.9718 if cp>=-0.08546641319990159\n",
      "   -0.0000 if cp>=-0.010166625119745731\n",
      "   +0.0517 if cp<=-0.05324227958917618\n",
      "--------------\n",
      "   -0.8999 if cp<=0.03493259623646738\n",
      "   -0.8999 if \n",
      "   -0.0000 if cp<=0.02841019593179226 & cp>=-0.00824345368891954\n",
      "   -0.0561 if cp<=-0.05458217784762382\n",
      "   -0.3331 if cp<=-0.028217961639165876 & cp>=-0.05324227958917618\n",
      "Run episode 131 with rewards 9.0\n",
      "============ 132 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8739 if cp>=-0.14176995158195496\n",
      "   +0.9702 if cp>=-0.11268960684537888\n",
      "   +0.9249 if cp>=-0.08546641319990159\n",
      "   +0.0845 if cp<=-0.05324227958917618\n",
      "   +0.3625 if cp>=-0.022439345717430115\n",
      "--------------\n",
      "   -0.8909 if cp<=0.03493259623646738\n",
      "   -0.8909 if \n",
      "   -0.0811 if cp<=-0.05458217784762382\n",
      "   -0.1762 if cp<=-0.028217961639165876 & cp>=-0.05324227958917618\n",
      "   -0.3192 if cp<=-0.022439345717430115 & cp>=-0.05591271743178367\n",
      "Run episode 132 with rewards 9.0\n",
      "============ 133 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8428 if cp>=-0.14176995158195496\n",
      "   +0.9320 if cp>=-0.11268960684537888\n",
      "   +0.8856 if cp>=-0.08546641319990159\n",
      "   +0.3972 if cp>=-0.022439345717430115\n",
      "   +0.1544 if cp<=-0.03246178701519965\n",
      "--------------\n",
      "   -0.8334 if cp<=0.03493259623646738\n",
      "   -0.8334 if \n",
      "   -0.1918 if cp<=-0.028217961639165876 & cp>=-0.05324227958917618\n",
      "   -0.4129 if cp<=-0.022439345717430115 & cp>=-0.05591271743178367\n",
      "   -0.0699 if cp<=-0.052866483479738234\n",
      "Run episode 133 with rewards 10.0\n",
      "============ 134 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.0936 if cp>=-0.14176995158195496\n",
      "   +1.0037 if cp>=-0.11268960684537888\n",
      "   +0.8911 if cp>=-0.08546641319990159\n",
      "   +0.3697 if cp>=-0.022439345717430115\n",
      "   -0.4669 if pa>=0.1679963320493698\n",
      "--------------\n",
      "   -0.9297 if cp<=0.03493259623646738\n",
      "   -0.9297 if \n",
      "   -0.1912 if cp<=-0.028217961639165876 & cp>=-0.05324227958917618\n",
      "   -0.3659 if cp<=-0.022439345717430115 & cp>=-0.05591271743178367\n",
      "   -0.0357 if cp<=-0.0717900276184082\n",
      "Run episode 134 with rewards 9.0\n",
      "origin 0.6866544692721919 new 0.7129937662753825 not updated\n",
      "============ 135 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.0936 if cp>=-0.14176995158195496\n",
      "   +1.0037 if cp>=-0.11268960684537888\n",
      "   +0.8911 if cp>=-0.08546641319990159\n",
      "   +0.3697 if cp>=-0.022439345717430115\n",
      "   -0.4669 if pa>=0.1679963320493698\n",
      "--------------\n",
      "   -0.7430 if cp<=0.03493259623646738\n",
      "   -0.7430 if \n",
      "   -0.0219 if cp<=-0.028217961639165876 & cp>=-0.05324227958917618\n",
      "   -0.0219 if cp<=-0.022439345717430115 & cp>=-0.05591271743178367\n",
      "   -0.3568 if cp<=0.032333555072546004 & cp>=-0.02835443466901779\n",
      "Run episode 135 with rewards 10.0\n",
      "origin 1.0001832042255474 new 1.0405065561851938 not updated\n",
      "============ 136 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +1.0936 if cp>=-0.14176995158195496\n",
      "   +1.0037 if cp>=-0.11268960684537888\n",
      "   +0.8911 if cp>=-0.08546641319990159\n",
      "   +0.3697 if cp>=-0.022439345717430115\n",
      "   -0.4669 if pa>=0.1679963320493698\n",
      "--------------\n",
      "   -0.3501 if cp<=0.03493259623646738\n",
      "   -1.1886 if \n",
      "   -0.0538 if cp<=-0.028217961639165876 & cp>=-0.05324227958917618\n",
      "   -0.2243 if cp<=0.032333555072546004 & cp>=-0.02835443466901779\n",
      "   +0.0748 if cp<=-0.044353237748146056\n",
      "Run episode 136 with rewards 9.0\n",
      "============ 137 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.0392 if cp>=-0.14176995158195496\n",
      "   +2.0392 if cp>=-0.11268960684537888\n",
      "   +0.2407 if cp>=-0.08546641319990159\n",
      "   +1.7985 if pa>=0.1679963320493698\n",
      "   +0.1682 if cp>=0.006088346987962732\n",
      "--------------\n",
      "   -1.8822 if cp<=0.03493259623646738\n",
      "   -1.8822 if \n",
      "   -0.0769 if cp<=0.032333555072546004 & cp>=-0.02835443466901779\n",
      "   -1.7987 if cp<=-0.044353237748146056\n",
      "   -0.0699 if cp>=-0.01729680299758911\n",
      "Run episode 137 with rewards 9.0\n",
      "============ 138 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.4234 if cp>=-0.14176995158195496\n",
      "   +0.4278 if cp>=-0.11268960684537888\n",
      "   +0.4245 if cp>=-0.08546641319990159\n",
      "   -0.0000 if pa>=0.1679963320493698\n",
      "   +0.4083 if cp>=-0.05375895202159881\n",
      "--------------\n",
      "   -0.4527 if cp<=0.03493259623646738\n",
      "   -0.4527 if \n",
      "   -0.2854 if cp<=0.032333555072546004 & cp>=-0.02835443466901779\n",
      "   -0.0083 if cp<=-0.044353237748146056\n",
      "   -0.0083 if cp<=-0.05375895202159881\n",
      "Run episode 138 with rewards 10.0\n",
      "============ 139 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.1860 if cp>=-0.14176995158195496\n",
      "   +1.3416 if cp>=-0.11268960684537888\n",
      "   +1.3416 if cp>=-0.08546641319990159\n",
      "   +1.1268 if cp>=-0.05375895202159881\n",
      "   -1.5276 if pa>=0.1910223662853241\n",
      "--------------\n",
      "   -1.1425 if cp<=0.03493259623646738\n",
      "   -1.1425 if \n",
      "   -0.9398 if cp<=0.032333555072546004 & cp>=-0.02835443466901779\n",
      "   -0.0374 if cp<=-0.044353237748146056\n",
      "   +0.1023 if cp<=-0.06284533441066742\n",
      "Run episode 139 with rewards 10.0\n",
      "============ 140 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1]\n",
      "   +0.7228 if cp>=-0.11268960684537888\n",
      "   +0.7228 if cp>=-0.08546641319990159\n",
      "   +0.5621 if cp>=-0.05375895202159881\n",
      "   -0.0000 if pa>=0.1910223662853241\n",
      "   +0.4407 if cp>=-0.022750954329967498\n",
      "--------------\n",
      "   -0.0377 if cp<=0.03493259623646738\n",
      "   -0.0377 if \n",
      "   -1.0761 if cp<=0.032333555072546004 & cp>=-0.02835443466901779\n",
      "   +1.6338 if cp<=-0.06284533441066742\n",
      "   +2.0888 if pa>=0.18679410219192505\n",
      "Run episode 140 with rewards 11.0\n",
      "============ 141 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 0, 1]\n",
      "   +2.0925 if cp>=-0.11268960684537888\n",
      "   -1.3699 if cp>=-0.08546641319990159\n",
      "   +2.2983 if cp>=-0.05375895202159881\n",
      "   +0.7827 if cp>=-0.022750954329967498\n",
      "   -0.7619 if cp<=-0.1137404590845108 & cv<=-1.0081068277359009\n",
      "--------------\n",
      "   -1.3138 if \n",
      "   -0.9734 if cp<=0.032333555072546004 & cp>=-0.02835443466901779\n",
      "   +0.8803 if cp<=-0.06284533441066742\n",
      "   -0.0369 if pa>=0.18679410219192505\n",
      "   +3.1600 if cv<=-1.0081068277359009\n",
      "Run episode 141 with rewards 9.0\n",
      "============ 142 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 1, 0, 1, 1]\n",
      "   +0.2132 if cp>=-0.11268960684537888\n",
      "   +0.1421 if cp>=-0.08546641319990159\n",
      "   +0.8421 if cp>=-0.05375895202159881\n",
      "   +0.4952 if cp>=-0.022750954329967498\n",
      "   +1.1889 if cv>=-1.0183420658111573\n",
      "--------------\n",
      "   -0.1937 if \n",
      "   -0.8773 if cp<=0.032333555072546004 & cp>=-0.02835443466901779\n",
      "   -1.1838 if cp<=-0.06284533441066742\n",
      "   +1.3573 if cv<=-1.0081068277359009\n",
      "   -0.8725 if pa>=0.18913505971431732\n",
      "Run episode 142 with rewards 10.0\n",
      "============ 143 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1]\n",
      "   -0.3793 if cp>=-0.11268960684537888\n",
      "   +0.1371 if cp>=-0.05375895202159881\n",
      "   +1.3479 if cp>=-0.022750954329967498\n",
      "   +2.3701 if cv>=-1.0183420658111573\n",
      "   +0.4737 if pa>=0.19056789577007294\n",
      "--------------\n",
      "   -1.5343 if cp<=0.032333555072546004 & cp>=-0.02835443466901779\n",
      "   -0.1348 if cp<=-0.06284533441066742\n",
      "   +2.3912 if cv<=-1.0081068277359009\n",
      "   -0.4478 if pa>=0.18913505971431732\n",
      "   -0.7126 if cp<=-0.01863118577748537 & cv>=-1.0044811248779297\n",
      "Run episode 143 with rewards 12.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 144 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0240 if cp>=-0.11268960684537888\n",
      "   +0.9952 if cp>=-0.022750954329967498\n",
      "   +2.4308 if cv>=-1.0183420658111573\n",
      "   +1.1200 if pa>=0.19056789577007294\n",
      "   +2.3050 if cp<=-0.109855717420578 & cv<=-1.1214398860931396\n",
      "--------------\n",
      "   -1.2660 if cp<=0.032333555072546004 & cp>=-0.02835443466901779\n",
      "   +1.4737 if cv<=-1.0081068277359009\n",
      "   -1.2199 if pa>=0.18913505971431732\n",
      "   -1.2543 if cp<=-0.01863118577748537 & cv>=-1.0044811248779297\n",
      "   -2.0781 if cp<=-0.109855717420578 & cv<=-1.1214398860931396\n",
      "Run episode 144 with rewards 10.0\n",
      "============ 145 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.5466 if cp>=-0.022750954329967498\n",
      "   +0.5466 if cv>=-1.0183420658111573\n",
      "   -0.0000 if pa>=0.19056789577007294\n",
      "   -0.0558 if cp<=-0.109855717420578 & cv<=-1.1214398860931396\n",
      "   +3.0953 if \n",
      "--------------\n",
      "   -1.2071 if cp<=0.032333555072546004 & cp>=-0.02835443466901779\n",
      "   -1.3558 if cv<=-1.0081068277359009\n",
      "   +0.0000 if cp<=-0.01863118577748537 & cv>=-1.0044811248779297\n",
      "   +0.0581 if cp<=-0.109855717420578 & cv<=-1.1214398860931396\n",
      "   -1.0996 if cp<=-0.02555277161300182 & cp>=-0.0654942587018013\n",
      "Run episode 145 with rewards 9.0\n",
      "============ 146 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 1, 0]\n",
      "   +0.9460 if cp>=-0.022750954329967498\n",
      "   +1.1938 if cv>=-1.0183420658111573\n",
      "   -0.0000 if cp<=-0.109855717420578 & cv<=-1.1214398860931396\n",
      "   +1.3080 if \n",
      "   -0.1379 if pa>=0.2074715942144394\n",
      "--------------\n",
      "   -0.7291 if cp<=0.032333555072546004 & cp>=-0.02835443466901779\n",
      "   -0.1504 if cv<=-1.0081068277359009\n",
      "   -0.0000 if cp<=-0.109855717420578 & cv<=-1.1214398860931396\n",
      "   -0.3270 if cp<=-0.02555277161300182 & cp>=-0.0654942587018013\n",
      "   +0.0750 if pa>=0.2074715942144394\n",
      "Run episode 146 with rewards 9.0\n",
      "============ 147 ===========\n",
      "11 actions [0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0]\n",
      "   +1.8148 if cp>=-0.022750954329967498\n",
      "   +1.6090 if cv>=-1.0183420658111573\n",
      "   +0.5781 if \n",
      "   -0.0000 if pa>=0.2074715942144394\n",
      "   -0.9875 if pav>=2.1672475337982178\n",
      "--------------\n",
      "   -0.7174 if cp<=0.032333555072546004 & cp>=-0.02835443466901779\n",
      "   +0.9575 if cv<=-1.0081068277359009\n",
      "   +1.3443 if cp<=-0.02555277161300182 & cp>=-0.0654942587018013\n",
      "   +0.0000 if pa>=0.2074715942144394\n",
      "   -0.5937 if \n",
      "Run episode 147 with rewards 11.0\n",
      "============ 148 ===========\n",
      "17 actions [1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1]\n",
      "   +1.0470 if cp>=-0.022750954329967498\n",
      "   +1.3355 if cv>=-1.0183420658111573\n",
      "   +0.9676 if \n",
      "   -0.0000 if pav>=2.1672475337982178\n",
      "   -3.6187 if cp>=-0.05922462418675423 & cv<=-0.8062889575958252\n",
      "--------------\n",
      "   -1.0101 if cp<=0.032333555072546004 & cp>=-0.02835443466901779\n",
      "   +0.6096 if cv<=-1.0081068277359009\n",
      "   +3.2961 if cp<=-0.02555277161300182 & cp>=-0.0654942587018013\n",
      "   +0.3144 if \n",
      "   -2.9519 if cp<=-0.030866166576743116 & cv>=-0.6116338968276978\n",
      "Run episode 148 with rewards 17.0\n",
      "============ 149 ===========\n",
      "22 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0]\n",
      "   -0.0000 if cp>=-0.022750954329967498\n",
      "   +1.2726 if cv>=-1.0183420658111573\n",
      "   +0.8834 if \n",
      "   -0.0000 if cp>=-0.05922462418675423 & cv<=-0.8062889575958252\n",
      "   -3.9592 if cp<=-0.040179960429668427 & cp>=-0.04557589441537857 & pa>=-0.0335906058549881\n",
      "--------------\n",
      "   +0.0000 if cp<=0.032333555072546004 & cp>=-0.02835443466901779\n",
      "   +0.9251 if cv<=-1.0081068277359009\n",
      "   +4.4795 if cp<=-0.02555277161300182 & cp>=-0.0654942587018013\n",
      "   -0.0760 if cp<=-0.030866166576743116 & cv>=-0.6116338968276978\n",
      "   -3.6234 if pa<=-0.0335906058549881\n",
      "Run episode 149 with rewards 22.0\n",
      "============ 150 ===========\n",
      "22 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1]\n",
      "   -1.5390 if cv>=-1.0183420658111573\n",
      "   +2.3101 if \n",
      "   +1.5959 if cp>=-0.05922462418675423 & cv<=-0.8062889575958252\n",
      "   +0.0000 if cp<=-0.040179960429668427 & cp>=-0.04557589441537857 & pa>=-0.0335906058549881\n",
      "   -1.5959 if cv<=-1.1575457572937011\n",
      "--------------\n",
      "   -1.2898 if cv<=-1.0081068277359009\n",
      "   +4.5948 if cp<=-0.02555277161300182 & cp>=-0.0654942587018013\n",
      "   +2.0472 if cp<=-0.030866166576743116 & cv>=-0.6116338968276978\n",
      "   -4.1179 if pa<=-0.0335906058549881\n",
      "   +2.1894 if cp<=-0.10070250928401947 & cv<=-1.1575457572937011\n",
      "Run episode 150 with rewards 22.0\n",
      "============ 151 ===========\n",
      "20 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.1127 if cv>=-1.0183420658111573\n",
      "   +2.1112 if \n",
      "   +2.6388 if cp>=-0.05922462418675423 & cv<=-0.8062889575958252\n",
      "   +0.9985 if cv<=-1.1575457572937011\n",
      "   -2.9617 if cp>=-0.12677187025547026\n",
      "--------------\n",
      "   +2.5410 if cp<=-0.02555277161300182 & cp>=-0.0654942587018013\n",
      "   +4.2823 if cp<=-0.030866166576743116 & cv>=-0.6116338968276978\n",
      "   -3.4612 if pa<=-0.0335906058549881\n",
      "   +1.3508 if cp<=-0.10070250928401947 & cv<=-1.1575457572937011\n",
      "   -3.7515 if cp<=-0.12677187025547026\n",
      "Run episode 151 with rewards 20.0\n",
      "============ 152 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.4590 if cv>=-1.0183420658111573\n",
      "   -0.7663 if \n",
      "   +1.2160 if cp>=-0.05922462418675423 & cv<=-0.8062889575958252\n",
      "   -0.8449 if cp>=-0.12677187025547026\n",
      "   +4.0375 if cv<=-0.9915713787078857 & pa>=-0.04359552040696144\n",
      "--------------\n",
      "   +2.4778 if cp<=-0.02555277161300182 & cp>=-0.0654942587018013\n",
      "   +5.2994 if cp<=-0.030866166576743116 & cv>=-0.6116338968276978\n",
      "   -1.1767 if pa<=-0.0335906058549881\n",
      "   -0.5664 if cp<=-0.12677187025547026\n",
      "   -2.9189 if cv>=-0.9915713787078857\n",
      "Run episode 152 with rewards 8.0\n",
      "============ 153 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7562 if cv>=-1.0183420658111573\n",
      "   +0.3640 if cp>=-0.05922462418675423 & cv<=-0.8062889575958252\n",
      "   +1.0841 if cp>=-0.12677187025547026\n",
      "   +0.3280 if cv<=-0.9915713787078857 & pa>=-0.04359552040696144\n",
      "   -1.2441 if pa>=0.17269212007522583\n",
      "--------------\n",
      "   -0.0232 if cp<=-0.02555277161300182 & cp>=-0.0654942587018013\n",
      "   -0.0000 if cp<=-0.030866166576743116 & cv>=-0.6116338968276978\n",
      "   -0.0000 if pa<=-0.0335906058549881\n",
      "   -2.1865 if cv>=-0.9915713787078857\n",
      "   -1.0340 if cp>=0.013534338399767884\n",
      "Run episode 153 with rewards 10.0\n",
      "============ 154 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 1, 0, 0]\n",
      "   +0.9302 if cv>=-1.0183420658111573\n",
      "   +1.4295 if cp>=-0.05922462418675423 & cv<=-0.8062889575958252\n",
      "   +1.1302 if cp>=-0.12677187025547026\n",
      "   -0.0000 if pa>=0.17269212007522583\n",
      "   -1.1637 if pa>=0.171900674700737\n",
      "--------------\n",
      "   -0.2180 if cp<=-0.02555277161300182 & cp>=-0.0654942587018013\n",
      "   +0.0000 if cp<=-0.030866166576743116 & cv>=-0.6116338968276978\n",
      "   -1.3534 if cv>=-0.9915713787078857\n",
      "   -1.2069 if cp>=0.013534338399767884\n",
      "   -1.1353 if cp<=0.018362705595791343 & cp>=-0.05299719423055649\n",
      "Run episode 154 with rewards 10.0\n",
      "============ 155 ===========\n",
      "9 actions [0, 0, 0, 0, 1, 0, 0, 0, 0]\n",
      "   +1.0459 if cv>=-1.0183420658111573\n",
      "   +0.6678 if cp>=-0.05922462418675423 & cv<=-0.8062889575958252\n",
      "   -0.8413 if cp>=-0.12677187025547026\n",
      "   +0.0000 if pa>=0.171900674700737\n",
      "   +1.9719 if cv>=-1.243846607208252\n",
      "--------------\n",
      "   +0.8293 if cp<=-0.02555277161300182 & cp>=-0.0654942587018013\n",
      "   -1.2321 if cv>=-0.9915713787078857\n",
      "   -0.9323 if cp>=0.013534338399767884\n",
      "   -1.0584 if cp<=0.018362705595791343 & cp>=-0.05299719423055649\n",
      "   +1.3401 if cp>=-0.06916606426239014 & cv<=-1.243846607208252\n",
      "Run episode 155 with rewards 9.0\n",
      "============ 156 ===========\n",
      "11 actions [0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7532 if cv>=-1.0183420658111573\n",
      "   +0.0000 if cp>=-0.05922462418675423 & cv<=-0.8062889575958252\n",
      "   +0.4251 if cp>=-0.12677187025547026\n",
      "   +0.4251 if cv>=-1.243846607208252\n",
      "   -3.9005 if cp>=-0.05924984738230705 & cv<=-0.7543661713600158\n",
      "--------------\n",
      "   +0.2014 if cv>=-0.9915713787078857\n",
      "   -0.0000 if cp>=0.013534338399767884\n",
      "   +2.2212 if cp<=0.018362705595791343 & cp>=-0.05299719423055649\n",
      "   -0.0000 if cp>=-0.06916606426239014 & cv<=-1.243846607208252\n",
      "   -3.4389 if cp>=-0.03700120970606803\n",
      "Run episode 156 with rewards 11.0\n",
      "============ 157 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0]\n",
      "   +0.5953 if cv>=-1.0183420658111573\n",
      "   +1.2322 if cp>=-0.12677187025547026\n",
      "   +0.9558 if cv>=-1.243846607208252\n",
      "   -2.6648 if cp>=-0.05924984738230705 & cv<=-0.7543661713600158\n",
      "   +0.4783 if \n",
      "--------------\n",
      "   -1.2762 if cv>=-0.9915713787078857\n",
      "   +0.7813 if cp<=0.018362705595791343 & cp>=-0.05299719423055649\n",
      "   +0.0000 if cp>=-0.06916606426239014 & cv<=-1.243846607208252\n",
      "   -1.9380 if cp>=-0.03700120970606803\n",
      "   -0.8537 if cp<=-0.09971141070127487 & cp>=-0.09971141070127487\n",
      "Run episode 157 with rewards 12.0\n",
      "============ 158 ===========\n",
      "11 actions [0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0]\n",
      "   +1.4945 if cv>=-1.0183420658111573\n",
      "   -0.2746 if cp>=-0.12677187025547026\n",
      "   -0.2746 if cv>=-1.243846607208252\n",
      "   +1.0975 if cp>=-0.05924984738230705 & cv<=-0.7543661713600158\n",
      "   -4.8462 if cp>=-0.015325212851166715 & cv<=-0.5719308018684387\n",
      "--------------\n",
      "   -0.3598 if cv>=-0.9915713787078857\n",
      "   -0.2018 if cp<=0.018362705595791343 & cp>=-0.05299719423055649\n",
      "   +2.7857 if cp>=-0.03700120970606803\n",
      "   +0.0000 if cp<=-0.09971141070127487 & cp>=-0.09971141070127487\n",
      "   -2.8451 if cv>=-0.5719308018684387\n",
      "Run episode 158 with rewards 11.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 159 ===========\n",
      "10 actions [0, 0, 0, 1, 0, 0, 0, 0, 1, 0]\n",
      "   +0.2975 if cv>=-1.0183420658111573\n",
      "   -0.3935 if cv>=-1.243846607208252\n",
      "   -0.0000 if cp>=-0.05924984738230705 & cv<=-0.7543661713600158\n",
      "   -0.0000 if cp>=-0.015325212851166715 & cv<=-0.5719308018684387\n",
      "   +2.8747 if cp>=-0.02441021427512169\n",
      "--------------\n",
      "   -1.2865 if cv>=-0.9915713787078857\n",
      "   +1.5103 if cp<=0.018362705595791343 & cp>=-0.05299719423055649\n",
      "   +0.1536 if cp>=-0.03700120970606803\n",
      "   -3.2438 if cv>=-0.5719308018684387\n",
      "   +2.8657 if cp>=-0.06275220215320587 & cv<=-0.38378193974494934\n",
      "Run episode 159 with rewards 10.0\n",
      "============ 160 ===========\n",
      "14 actions [0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1]\n",
      "   +0.9139 if cv>=-1.0183420658111573\n",
      "   -0.1299 if cv>=-1.243846607208252\n",
      "   -0.0000 if cp>=-0.015325212851166715 & cv<=-0.5719308018684387\n",
      "   -0.0000 if cp>=-0.02441021427512169\n",
      "   -2.7545 if cp>=-0.052837055176496506 & cv<=-0.46743569374084465\n",
      "--------------\n",
      "   -2.3407 if cv>=-0.9915713787078857\n",
      "   +0.2481 if cp<=0.018362705595791343 & cp>=-0.05299719423055649\n",
      "   -0.9490 if cv>=-0.5719308018684387\n",
      "   +4.2389 if cp>=-0.06275220215320587 & cv<=-0.38378193974494934\n",
      "   +0.6787 if cp<=-0.09375375807285309\n",
      "Run episode 160 with rewards 14.0\n",
      "============ 161 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0]\n",
      "   +0.8825 if cv>=-1.0183420658111573\n",
      "   +0.8825 if cv>=-1.243846607208252\n",
      "   +1.8278 if cp>=-0.02441021427512169\n",
      "   -1.2249 if cp>=-0.052837055176496506 & cv<=-0.46743569374084465\n",
      "   -3.4401 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "--------------\n",
      "   -0.8648 if cv>=-0.9915713787078857\n",
      "   +0.3665 if cv>=-0.5719308018684387\n",
      "   +3.4770 if cp>=-0.06275220215320587 & cv<=-0.38378193974494934\n",
      "   -0.6995 if cp<=-0.09375375807285309\n",
      "   -4.3128 if cv>=-0.41210718750953673\n",
      "Run episode 161 with rewards 12.0\n",
      "============ 162 ===========\n",
      "15 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1]\n",
      "   -0.1747 if cv>=-1.0183420658111573\n",
      "   +0.5468 if cp>=-0.02441021427512169\n",
      "   -0.1610 if cp>=-0.052837055176496506 & cv<=-0.46743569374084465\n",
      "   -2.3250 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   +1.1175 if cp<=-0.08178898990154267\n",
      "--------------\n",
      "   -0.3462 if cv>=-0.9915713787078857\n",
      "   +0.8384 if cp>=-0.06275220215320587 & cv<=-0.38378193974494934\n",
      "   -0.1976 if cp<=-0.09375375807285309\n",
      "   -1.9662 if cv>=-0.41210718750953673\n",
      "   +0.5818 if cp>=-0.08178898990154267\n",
      "Run episode 162 with rewards 15.0\n",
      "============ 163 ===========\n",
      "18 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +1.3807 if cv>=-1.0183420658111573\n",
      "   -0.1497 if cp>=-0.02441021427512169\n",
      "   -3.7206 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   +0.6163 if cp<=-0.08178898990154267\n",
      "   +1.6089 if cp>=-0.020810493826866127 & cv>=-0.35870438218116757\n",
      "--------------\n",
      "   -0.9045 if cv>=-0.9915713787078857\n",
      "   +2.2416 if cp>=-0.06275220215320587 & cv<=-0.38378193974494934\n",
      "   -3.2203 if cv>=-0.41210718750953673\n",
      "   +0.0706 if cp>=-0.08178898990154267\n",
      "   +0.4838 if cp<=-0.020810493826866127 & cv<=-0.5489708065986634\n",
      "Run episode 163 with rewards 18.0\n",
      "============ 164 ===========\n",
      "11 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.7850 if cv>=-1.0183420658111573\n",
      "   -4.1087 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   +3.5572 if cp<=-0.08178898990154267\n",
      "   +0.0000 if cp>=-0.020810493826866127 & cv>=-0.35870438218116757\n",
      "   +0.5461 if cp>=-0.08121584951877593 & cv<=-0.4229486048221588\n",
      "--------------\n",
      "   -0.0425 if cv>=-0.9915713787078857\n",
      "   +1.8760 if cp>=-0.06275220215320587 & cv<=-0.38378193974494934\n",
      "   -3.0277 if cv>=-0.41210718750953673\n",
      "   -3.0479 if cp<=-0.020810493826866127 & cv<=-0.5489708065986634\n",
      "   -1.3592 if cp<=-0.060262212157249445 & cp>=-0.08121584951877593 & cv<=-0.4229486048221588\n",
      "Run episode 164 with rewards 11.0\n",
      "============ 165 ===========\n",
      "16 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0]\n",
      "   +0.7420 if cv>=-1.0183420658111573\n",
      "   -1.9513 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   -0.0000 if cp<=-0.08178898990154267\n",
      "   -1.9513 if cp>=-0.08121584951877593 & cv<=-0.4229486048221588\n",
      "   +0.3354 if cp<=-0.01817573793232441 & cv>=-0.37595853209495544\n",
      "--------------\n",
      "   +0.9878 if cp>=-0.06275220215320587 & cv<=-0.38378193974494934\n",
      "   -2.9975 if cv>=-0.41210718750953673\n",
      "   +0.2413 if cp<=-0.020810493826866127 & cv<=-0.5489708065986634\n",
      "   -0.0000 if cp<=-0.060262212157249445 & cp>=-0.08121584951877593 & cv<=-0.4229486048221588\n",
      "   +0.1765 if cv<=-0.36813226342201233 & cv>=-0.561775803565979\n",
      "Run episode 165 with rewards 16.0\n",
      "============ 166 ===========\n",
      "14 actions [0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0]\n",
      "   +1.8533 if cv>=-1.0183420658111573\n",
      "   -3.3738 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   -0.9999 if cp>=-0.08121584951877593 & cv<=-0.4229486048221588\n",
      "   -0.0000 if cp<=-0.01817573793232441 & cv>=-0.37595853209495544\n",
      "   -1.5424 if pav>=1.4128538370132446\n",
      "--------------\n",
      "   +1.1202 if cp>=-0.06275220215320587 & cv<=-0.38378193974494934\n",
      "   -3.2653 if cv>=-0.41210718750953673\n",
      "   -0.8025 if cp<=-0.020810493826866127 & cv<=-0.5489708065986634\n",
      "   -1.6237 if cv<=-0.36813226342201233 & cv>=-0.561775803565979\n",
      "   +1.5136 if pav>=1.4128538370132446\n",
      "Run episode 166 with rewards 14.0\n",
      "============ 167 ===========\n",
      "16 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0]\n",
      "   +0.2005 if cv>=-1.0183420658111573\n",
      "   -3.7207 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   -0.5111 if cp>=-0.08121584951877593 & cv<=-0.4229486048221588\n",
      "   +0.0000 if pav>=1.4128538370132446\n",
      "   +0.9554 if cp>=-0.010089655965566633 & cv>=-0.2220733106136322\n",
      "--------------\n",
      "   +1.1344 if cp>=-0.06275220215320587 & cv<=-0.38378193974494934\n",
      "   -3.0624 if cv>=-0.41210718750953673\n",
      "   +0.3360 if cv<=-0.36813226342201233 & cv>=-0.561775803565979\n",
      "   +0.0000 if pav>=1.4128538370132446\n",
      "   +0.0612 if cv>=-0.49708273410797116 & pav<=0.9669625639915467\n",
      "Run episode 167 with rewards 16.0\n",
      "============ 168 ===========\n",
      "16 actions [0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0]\n",
      "   -1.0513 if cv>=-1.0183420658111573\n",
      "   -2.5074 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   -2.5074 if cp>=-0.08121584951877593 & cv<=-0.4229486048221588\n",
      "   +0.3959 if cp>=-0.010089655965566633 & cv>=-0.2220733106136322\n",
      "   +3.0973 if cv>=-0.5950794816017151\n",
      "--------------\n",
      "   +0.2583 if cp>=-0.06275220215320587 & cv<=-0.38378193974494934\n",
      "   -1.8586 if cv>=-0.41210718750953673\n",
      "   -1.1607 if cv<=-0.36813226342201233 & cv>=-0.561775803565979\n",
      "   -1.8586 if cv>=-0.49708273410797116 & pav<=0.9669625639915467\n",
      "   +1.7172 if pav>=1.3063709735870361\n",
      "Run episode 168 with rewards 16.0\n",
      "============ 169 ===========\n",
      "13 actions [0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +0.0814 if cv>=-1.0183420658111573\n",
      "   -1.1663 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   -1.1663 if cp>=-0.08121584951877593 & cv<=-0.4229486048221588\n",
      "   +1.5210 if cv>=-0.5950794816017151\n",
      "   -1.1663 if cp>=-0.06942482292652127 & cv<=-0.4362390637397766\n",
      "--------------\n",
      "   -0.2015 if cv>=-0.41210718750953673\n",
      "   -1.5756 if cv<=-0.36813226342201233 & cv>=-0.561775803565979\n",
      "   -1.7771 if cv>=-0.49708273410797116 & pav<=0.9669625639915467\n",
      "   +1.3897 if pav>=1.3063709735870361\n",
      "   -2.3517 if cv>=-0.4362390637397766\n",
      "Run episode 169 with rewards 13.0\n",
      "============ 170 ===========\n",
      "11 actions [0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0]\n",
      "   +0.9030 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   -0.7437 if cp>=-0.08121584951877593 & cv<=-0.4229486048221588\n",
      "   +3.1990 if cv>=-0.5950794816017151\n",
      "   +0.9030 if cp>=-0.06942482292652127 & cv<=-0.4362390637397766\n",
      "   -2.3375 if cv>=-0.7397883892059326\n",
      "--------------\n",
      "   -4.3036 if cv<=-0.36813226342201233 & cv>=-0.561775803565979\n",
      "   -1.3706 if cv>=-0.49708273410797116 & pav<=0.9669625639915467\n",
      "   +1.7768 if pav>=1.3063709735870361\n",
      "   -1.3706 if cv>=-0.4362390637397766\n",
      "   -4.5772 if cp>=-0.07667860239744186 & cv<=-0.7397883892059326 & cv>=-0.7444226741790771\n",
      "Run episode 170 with rewards 11.0\n",
      "============ 171 ===========\n",
      "20 actions [1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1]\n",
      "   -1.0163 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   -1.4473 if cv>=-0.5950794816017151\n",
      "   -1.0163 if cp>=-0.06942482292652127 & cv<=-0.4362390637397766\n",
      "   +0.4666 if cv>=-0.7397883892059326\n",
      "   +1.4471 if cp>=-0.07922516763210297\n",
      "--------------\n",
      "   -1.0779 if cv<=-0.36813226342201233 & cv>=-0.561775803565979\n",
      "   -4.6208 if cv>=-0.49708273410797116 & pav<=0.9669625639915467\n",
      "   +2.4792 if pav>=1.3063709735870361\n",
      "   +0.0000 if cp>=-0.07667860239744186 & cv<=-0.7397883892059326 & cv>=-0.7444226741790771\n",
      "   +2.6687 if cv>=-0.5943180918693542\n",
      "Run episode 171 with rewards 20.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 172 ===========\n",
      "42 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0]\n",
      "   -0.7130 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   -0.6163 if cv>=-0.5950794816017151\n",
      "   -0.7130 if cp>=-0.06942482292652127 & cv<=-0.4362390637397766\n",
      "   -0.6912 if cp>=-0.07922516763210297\n",
      "   +3.3066 if cp>=0.02606125399470329\n",
      "--------------\n",
      "   -5.1632 if cv<=-0.36813226342201233 & cv>=-0.561775803565979\n",
      "   +0.7063 if cv>=-0.49708273410797116 & pav<=0.9669625639915467\n",
      "   +0.0000 if pav>=1.3063709735870361\n",
      "   +1.2490 if cv>=-0.5943180918693542\n",
      "   -4.9310 if cp>=0.02606125399470329 & cv>=-0.34120571613311745\n",
      "Run episode 172 with rewards 42.0\n",
      "============ 173 ===========\n",
      "18 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1]\n",
      "   -1.0705 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   +0.4775 if cp>=-0.06942482292652127 & cv<=-0.4362390637397766\n",
      "   -2.3029 if cp>=-0.07922516763210297\n",
      "   +6.5653 if cp>=0.02606125399470329\n",
      "   -6.0757 if cp>=-0.053343309462070436 & cp>=0.08598316162824635 & cv<=-0.7180232882499695 & cv>=-0.7297283291816712\n",
      "--------------\n",
      "   -4.3906 if cv<=-0.36813226342201233 & cv>=-0.561775803565979\n",
      "   +2.5827 if cv>=-0.49708273410797116 & pav<=0.9669625639915467\n",
      "   -1.8079 if cv>=-0.5943180918693542\n",
      "   -4.5478 if cp>=0.02606125399470329 & cv>=-0.34120571613311745\n",
      "   +0.7128 if \n",
      "Run episode 173 with rewards 18.0\n",
      "============ 174 ===========\n",
      "39 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0]\n",
      "   -1.3355 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   -0.8048 if cp>=-0.07922516763210297\n",
      "   +4.9736 if cp>=0.02606125399470329\n",
      "   +0.0000 if cp>=-0.053343309462070436 & cp>=0.08598316162824635 & cv<=-0.7180232882499695 & cv>=-0.7297283291816712\n",
      "   -1.7937 if cv>=-0.12885482907295207\n",
      "--------------\n",
      "   -3.2825 if cv<=-0.36813226342201233 & cv>=-0.561775803565979\n",
      "   +0.5703 if cv>=-0.49708273410797116 & pav<=0.9669625639915467\n",
      "   -1.0506 if cv>=-0.5943180918693542\n",
      "   -0.7721 if cp>=0.02606125399470329 & cv>=-0.34120571613311745\n",
      "   +2.3300 if cv>=-0.12885482907295207 & cv>=-0.5586721777915955 & pa>=0.034017217159271244\n",
      "Run episode 174 with rewards 39.0\n",
      "============ 175 ===========\n",
      "24 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0]\n",
      "   -3.7872 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   +1.2017 if cp>=-0.07922516763210297\n",
      "   +6.6865 if cp>=0.02606125399470329\n",
      "   -5.1728 if cv>=-0.12885482907295207\n",
      "   -6.3681 if cv<=-0.9260005474090576 & pa<=-0.12495201379060744\n",
      "--------------\n",
      "   -5.9229 if cv<=-0.36813226342201233 & cv>=-0.561775803565979\n",
      "   +0.9896 if cv>=-0.5943180918693542\n",
      "   -3.6134 if cp>=0.02606125399470329 & cv>=-0.34120571613311745\n",
      "   +0.0000 if cv>=-0.12885482907295207 & cv>=-0.5586721777915955 & pa>=0.034017217159271244\n",
      "   +5.3012 if cv<=-0.9260005474090576 & pa<=-0.12495201379060744\n",
      "Run episode 175 with rewards 24.0\n",
      "============ 176 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -1.4982 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   +4.8814 if cp>=0.02606125399470329\n",
      "   -2.9615 if cv>=-0.12885482907295207\n",
      "   -0.0000 if cv<=-0.9260005474090576 & pa<=-0.12495201379060744\n",
      "   +3.0797 if cp>=0.01073979437351228 & cv<=-1.002700078487396\n",
      "--------------\n",
      "   -0.5171 if cv<=-0.36813226342201233 & cv>=-0.561775803565979\n",
      "   +0.5116 if cv>=-0.5943180918693542\n",
      "   -2.5292 if cp>=0.02606125399470329 & cv>=-0.34120571613311745\n",
      "   -0.0000 if cv<=-0.9260005474090576 & pa<=-0.12495201379060744\n",
      "   -3.8723 if cp>=0.01073979437351228 & cv<=-1.002700078487396\n",
      "Run episode 176 with rewards 9.0\n",
      "============ 177 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp>=-0.07248848527669907 & cv<=-0.41210718750953673\n",
      "   +0.7550 if cp>=0.02606125399470329\n",
      "   -2.9181 if cv>=-0.12885482907295207\n",
      "   -0.0000 if cp>=0.01073979437351228 & cv<=-1.002700078487396\n",
      "   +0.9062 if cv>=1.3332217931747437\n",
      "--------------\n",
      "   +0.0000 if cv<=-0.36813226342201233 & cv>=-0.561775803565979\n",
      "   +1.2650 if cv>=-0.5943180918693542\n",
      "   -0.4197 if cp>=0.02606125399470329 & cv>=-0.34120571613311745\n",
      "   +0.0000 if cp>=0.01073979437351228 & cv<=-1.002700078487396\n",
      "   -0.4915 if cv>=1.3332217931747437\n",
      "Run episode 177 with rewards 9.0\n",
      "============ 178 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7645 if cp>=0.02606125399470329\n",
      "   -2.4460 if cv>=-0.12885482907295207\n",
      "   +0.0000 if cp>=0.01073979437351228 & cv<=-1.002700078487396\n",
      "   -0.0397 if cv>=1.3332217931747437\n",
      "   -0.2537 if cp>=0.051494143903255477\n",
      "--------------\n",
      "   +1.1686 if cv>=-0.5943180918693542\n",
      "   +0.6353 if cp>=0.02606125399470329 & cv>=-0.34120571613311745\n",
      "   +0.0000 if cp>=0.01073979437351228 & cv<=-1.002700078487396\n",
      "   +0.0796 if cv>=1.3332217931747437\n",
      "   +0.7891 if cp<=0.051494143903255477\n",
      "Run episode 178 with rewards 10.0\n",
      "============ 179 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1241 if cp>=0.02606125399470329\n",
      "   -1.1241 if cv>=-0.12885482907295207\n",
      "   -0.0135 if cv>=1.3332217931747437\n",
      "   -0.6197 if cp>=0.051494143903255477\n",
      "   -0.3217 if cp<=0.04927158281207085\n",
      "--------------\n",
      "   +0.8141 if cv>=-0.5943180918693542\n",
      "   +0.8141 if cp>=0.02606125399470329 & cv>=-0.34120571613311745\n",
      "   +0.0084 if cv>=1.3332217931747437\n",
      "   +0.4151 if cp<=0.051494143903255477\n",
      "   +0.0962 if cp>=0.08963352590799332\n",
      "Run episode 179 with rewards 9.0\n",
      "============ 180 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0975 if cp>=0.02606125399470329\n",
      "   -1.4725 if cv>=-0.12885482907295207\n",
      "   -0.0738 if cp>=0.051494143903255477\n",
      "   -1.3987 if cp<=0.04927158281207085\n",
      "   -0.5779 if cp<=0.04322010129690171 & cp>=-0.018345948308706284\n",
      "--------------\n",
      "   +1.2702 if cv>=-0.5943180918693542\n",
      "   +0.0665 if cp>=0.02606125399470329 & cv>=-0.34120571613311745\n",
      "   +1.2405 if cp<=0.051494143903255477\n",
      "   +0.0000 if cp>=0.08963352590799332\n",
      "   +0.7682 if cp<=-0.008206608332693575\n",
      "Run episode 180 with rewards 9.0\n",
      "============ 181 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.3242 if cp>=0.02606125399470329\n",
      "   -0.9363 if cv>=-0.12885482907295207\n",
      "   -0.6676 if cp<=0.04927158281207085\n",
      "   -0.6676 if cp<=0.04322010129690171 & cp>=-0.018345948308706284\n",
      "   +0.0592 if cp>=0.10196342319250107\n",
      "--------------\n",
      "   +0.8750 if cv>=-0.5943180918693542\n",
      "   +0.3262 if cp>=0.02606125399470329 & cv>=-0.34120571613311745\n",
      "   +0.7675 if cp<=0.051494143903255477\n",
      "   +0.2419 if cp<=-0.008206608332693575\n",
      "   -0.0464 if cp>=0.10196342319250107\n",
      "Run episode 181 with rewards 11.0\n",
      "============ 182 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7824 if cp>=0.02606125399470329\n",
      "   -1.6307 if cv>=-0.12885482907295207\n",
      "   -0.8831 if cp<=0.04927158281207085\n",
      "   -0.8831 if cp<=0.04322010129690171 & cp>=-0.018345948308706284\n",
      "   -0.1625 if cp>=0.1123085618019104\n",
      "--------------\n",
      "   +1.1937 if cv>=-0.5943180918693542\n",
      "   +0.5374 if cp>=0.02606125399470329 & cv>=-0.34120571613311745\n",
      "   +0.6907 if cp<=0.051494143903255477\n",
      "   +0.0000 if cp<=-0.008206608332693575\n",
      "   +1.1414 if cp<=0.1123085618019104\n",
      "Run episode 182 with rewards 9.0\n",
      "============ 183 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8037 if cp>=0.02606125399470329\n",
      "   -0.8037 if cv>=-0.12885482907295207\n",
      "   -0.2684 if cp<=0.04927158281207085\n",
      "   -0.1814 if cp<=0.04322010129690171 & cp>=-0.018345948308706284\n",
      "   -0.1999 if cp>=0.07783826291561127\n",
      "--------------\n",
      "   +0.7040 if cv>=-0.5943180918693542\n",
      "   +0.7040 if cp>=0.02606125399470329 & cv>=-0.34120571613311745\n",
      "   +0.1609 if cp<=0.051494143903255477\n",
      "   +0.6705 if cp<=0.1123085618019104\n",
      "   -0.0164 if cp>=0.15288345515727997\n",
      "Run episode 183 with rewards 10.0\n",
      "============ 184 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1072 if cp>=0.02606125399470329\n",
      "   -1.1072 if cv>=-0.12885482907295207\n",
      "   -0.3734 if cp<=0.04927158281207085\n",
      "   -0.3532 if cp>=0.07783826291561127\n",
      "   -0.5318 if cp<=0.06451627463102341\n",
      "--------------\n",
      "   +1.0602 if cv>=-0.5943180918693542\n",
      "   +1.0602 if cp>=0.02606125399470329 & cv>=-0.34120571613311745\n",
      "   +0.3935 if cp<=0.051494143903255477\n",
      "   +0.9166 if cp<=0.1123085618019104\n",
      "   +0.0263 if cp>=0.13428235650062562\n",
      "Run episode 184 with rewards 9.0\n",
      "============ 185 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0582 if cp>=0.02606125399470329\n",
      "   -0.7830 if cv>=-0.12885482907295207\n",
      "   -0.7446 if cp<=0.04927158281207085\n",
      "   -0.7446 if cp<=0.06451627463102341\n",
      "   -0.5044 if cp<=-0.00247330507263541\n",
      "--------------\n",
      "   +0.8885 if cv>=-0.5943180918693542\n",
      "   +0.0376 if cp>=0.02606125399470329 & cv>=-0.34120571613311745\n",
      "   +0.8636 if cp<=0.051494143903255477\n",
      "   +0.8885 if cp<=0.1123085618019104\n",
      "   +0.4134 if cp>=-0.01400601640343666\n",
      "Run episode 185 with rewards 8.0\n",
      "============ 186 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7865 if cv>=-0.12885482907295207\n",
      "   -0.5307 if cp<=0.04927158281207085\n",
      "   -0.6863 if cp<=0.06451627463102341\n",
      "   -0.0000 if cp<=-0.00247330507263541\n",
      "   +0.0351 if cp>=0.0929931029677391\n",
      "--------------\n",
      "   +0.7541 if cv>=-0.5943180918693542\n",
      "   +0.5273 if cp<=0.051494143903255477\n",
      "   +0.7541 if cp<=0.1123085618019104\n",
      "   +0.7541 if cp>=-0.01400601640343666\n",
      "   -0.0321 if cp>=0.0929931029677391\n",
      "Run episode 186 with rewards 9.0\n",
      "============ 187 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8656 if cv>=-0.12885482907295207\n",
      "   -0.9028 if cp<=0.04927158281207085\n",
      "   -0.9028 if cp<=0.06451627463102341\n",
      "   +0.0000 if cp>=0.0929931029677391\n",
      "   -0.0866 if cp>=-0.021918121725320813\n",
      "--------------\n",
      "   +0.9016 if cv>=-0.5943180918693542\n",
      "   +0.9612 if cp<=0.051494143903255477\n",
      "   +0.9016 if cp<=0.1123085618019104\n",
      "   +0.1684 if cp>=-0.01400601640343666\n",
      "   -0.0398 if cp>=0.03456699401140214\n",
      "Run episode 187 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 188 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8252 if cv>=-0.12885482907295207\n",
      "   -0.7237 if cp<=0.04927158281207085\n",
      "   -0.7717 if cp<=0.06451627463102341\n",
      "   -0.3347 if cp>=-0.021918121725320813\n",
      "   +0.0532 if cp>=0.11034790426492691\n",
      "--------------\n",
      "   +0.8458 if cv>=-0.5943180918693542\n",
      "   +0.7836 if cp<=0.051494143903255477\n",
      "   +0.8458 if cp<=0.1123085618019104\n",
      "   +0.2789 if cp>=-0.01400601640343666\n",
      "   -0.0631 if cp>=0.11034790426492691\n",
      "Run episode 188 with rewards 9.0\n",
      "============ 189 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7426 if cv>=-0.12885482907295207\n",
      "   -0.5380 if cp<=0.04927158281207085\n",
      "   -0.5380 if cp<=0.06451627463102341\n",
      "   -0.7426 if cp>=-0.021918121725320813\n",
      "   -0.0138 if cp>=0.0745883271098137\n",
      "--------------\n",
      "   +0.6112 if cv>=-0.5943180918693542\n",
      "   +0.4187 if cp<=0.051494143903255477\n",
      "   +0.6944 if cp<=0.1123085618019104\n",
      "   +0.6112 if cp>=-0.01400601640343666\n",
      "   +0.5762 if cp<=0.0745883271098137\n",
      "Run episode 189 with rewards 10.0\n",
      "origin 0.5311664389769887 new 0.5652734854077519 not updated\n",
      "============ 190 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7326 if cv>=-0.12885482907295207\n",
      "   -0.6319 if cp<=0.04927158281207085\n",
      "   -0.6319 if cp<=0.06451627463102341\n",
      "   -0.7326 if cp>=-0.021918121725320813\n",
      "   -0.2127 if cp>=0.0046307619661092765\n",
      "--------------\n",
      "   +0.6112 if cv>=-0.5943180918693542\n",
      "   +0.4187 if cp<=0.051494143903255477\n",
      "   +0.6944 if cp<=0.1123085618019104\n",
      "   +0.6112 if cp>=-0.01400601640343666\n",
      "   +0.5762 if cp<=0.0745883271098137\n",
      "Run episode 190 with rewards 9.0\n",
      "origin 0.4416944469247006 new 0.46942964752712657 not updated\n",
      "============ 191 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.6352 if cv>=-0.12885482907295207\n",
      "   -0.6422 if cp<=0.04927158281207085\n",
      "   -0.6661 if cp<=0.06451627463102341\n",
      "   -0.6352 if cp>=-0.021918121725320813\n",
      "   -0.2561 if cp>=-0.018743649125099182\n",
      "--------------\n",
      "   +0.6112 if cv>=-0.5943180918693542\n",
      "   +0.4187 if cp<=0.051494143903255477\n",
      "   +0.6944 if cp<=0.1123085618019104\n",
      "   +0.6112 if cp>=-0.01400601640343666\n",
      "   +0.5762 if cp<=0.0745883271098137\n",
      "Run episode 191 with rewards 9.0\n",
      "origin 0.3756640671687204 new 0.39319189898821627 not updated\n",
      "origin 0.37687912344407115 new 0.40631511622564875 not updated\n",
      "============ 192 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.6352 if cv>=-0.12885482907295207\n",
      "   -0.6422 if cp<=0.04927158281207085\n",
      "   -0.6661 if cp<=0.06451627463102341\n",
      "   -0.6352 if cp>=-0.021918121725320813\n",
      "   -0.2561 if cp>=-0.018743649125099182\n",
      "--------------\n",
      "   +0.6112 if cv>=-0.5943180918693542\n",
      "   +0.4187 if cp<=0.051494143903255477\n",
      "   +0.6944 if cp<=0.1123085618019104\n",
      "   +0.6112 if cp>=-0.01400601640343666\n",
      "   +0.5762 if cp<=0.0745883271098137\n",
      "Run episode 192 with rewards 9.0\n",
      "origin 0.4114845338258769 new 0.436760650154082 not updated\n",
      "origin 0.4126995901012277 new 0.43863662618168264 not updated\n",
      "============ 193 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.6352 if cv>=-0.12885482907295207\n",
      "   -0.6422 if cp<=0.04927158281207085\n",
      "   -0.6661 if cp<=0.06451627463102341\n",
      "   -0.6352 if cp>=-0.021918121725320813\n",
      "   -0.2561 if cp>=-0.018743649125099182\n",
      "--------------\n",
      "   +0.6112 if cv>=-0.5943180918693542\n",
      "   +0.4187 if cp<=0.051494143903255477\n",
      "   +0.6944 if cp<=0.1123085618019104\n",
      "   +0.6112 if cp>=-0.01400601640343666\n",
      "   +0.5762 if cp<=0.0745883271098137\n",
      "Run episode 193 with rewards 10.0\n",
      "============ 194 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.9631 if cv>=-0.12885482907295207\n",
      "   -0.3550 if cp<=0.04927158281207085\n",
      "   -0.4384 if cp<=0.06451627463102341\n",
      "   -0.9631 if cp>=-0.021918121725320813\n",
      "   -0.0464 if cp>=0.11679955422878266\n",
      "--------------\n",
      "   +0.7765 if cv>=-0.5943180918693542\n",
      "   +0.7423 if cp<=0.1123085618019104\n",
      "   +0.7765 if cp>=-0.01400601640343666\n",
      "   +0.5255 if cp<=0.0745883271098137\n",
      "   +0.4300 if cp>=0.04613241851329804\n",
      "Run episode 194 with rewards 10.0\n",
      "============ 195 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.9100 if cv>=-0.12885482907295207\n",
      "   -0.9061 if cp<=0.04927158281207085\n",
      "   -0.9061 if cp<=0.06451627463102341\n",
      "   -0.2068 if cp>=-0.021918121725320813\n",
      "   -0.3398 if cp<=-0.04161364734172821\n",
      "--------------\n",
      "   +0.9863 if cv>=-0.5943180918693542\n",
      "   +0.9863 if cp<=0.1123085618019104\n",
      "   +0.0723 if cp>=-0.01400601640343666\n",
      "   +1.0066 if cp<=0.0745883271098137\n",
      "   +0.1209 if cp>=-0.025574035197496413\n",
      "Run episode 195 with rewards 10.0\n",
      "============ 196 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2575 if cv>=-0.12885482907295207\n",
      "   -0.4385 if cp<=0.04927158281207085\n",
      "   -0.5503 if cp<=0.06451627463102341\n",
      "   -0.0000 if cp<=-0.04161364734172821\n",
      "   +0.1160 if cp>=0.16497428715229034\n",
      "--------------\n",
      "   +0.8099 if cv>=-0.5943180918693542\n",
      "   +0.7717 if cp<=0.1123085618019104\n",
      "   +0.5025 if cp<=0.0745883271098137\n",
      "   +0.8099 if cp>=-0.025574035197496413\n",
      "   +0.5167 if cp>=0.04538324177265167\n",
      "Run episode 196 with rewards 10.0\n",
      "============ 197 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8141 if cv>=-0.12885482907295207\n",
      "   -0.8103 if cp<=0.04927158281207085\n",
      "   -0.8103 if cp<=0.06451627463102341\n",
      "   +0.0000 if cp>=0.16497428715229034\n",
      "   -0.5945 if cp<=-0.02776113040745258\n",
      "--------------\n",
      "   +1.1585 if cv>=-0.5943180918693542\n",
      "   +1.1585 if cp<=0.1123085618019104\n",
      "   +0.2884 if cp>=-0.025574035197496413\n",
      "   +0.0217 if cp>=0.04538324177265167\n",
      "   +0.4357 if cp<=0.0018955933861434533 & cp>=-0.04493551477789879\n",
      "Run episode 197 with rewards 8.0\n",
      "============ 198 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.6141 if cv>=-0.12885482907295207\n",
      "   -0.6141 if cp<=0.04927158281207085\n",
      "   -0.6141 if cp<=0.06451627463102341\n",
      "   -0.4678 if cp<=-0.02776113040745258\n",
      "   -0.0234 if cp>=0.005625746957957755\n",
      "--------------\n",
      "   +0.6575 if cv>=-0.5943180918693542\n",
      "   +0.6575 if cp<=0.1123085618019104\n",
      "   +0.2059 if cp>=-0.025574035197496413\n",
      "   +0.6186 if cp<=0.0018955933861434533 & cp>=-0.04493551477789879\n",
      "   +0.2407 if cp<=-0.04092939719557762\n",
      "Run episode 198 with rewards 8.0\n",
      "============ 199 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8288 if cv>=-0.12885482907295207\n",
      "   -0.9073 if cp<=0.04927158281207085\n",
      "   -0.9073 if cp<=0.06451627463102341\n",
      "   +0.0000 if cp<=-0.02776113040745258\n",
      "   +0.0785 if cp>=0.0648471787571907\n",
      "--------------\n",
      "   +1.0327 if cv>=-0.5943180918693542\n",
      "   +1.0327 if cp<=0.1123085618019104\n",
      "   +0.7192 if cp<=0.0018955933861434533 & cp>=-0.04493551477789879\n",
      "   -0.0000 if cp<=-0.04092939719557762\n",
      "   +0.0009 if cp>=0.034156351536512385\n",
      "Run episode 199 with rewards 9.0\n",
      "============ 200 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2881 if cv>=-0.12885482907295207\n",
      "   -0.6616 if cp<=0.04927158281207085\n",
      "   -0.8544 if cp<=0.06451627463102341\n",
      "   -0.4337 if cp>=0.0648471787571907\n",
      "   -0.0840 if cp>=0.10070613473653794\n",
      "--------------\n",
      "   +1.1421 if cv>=-0.5943180918693542\n",
      "   +1.0456 if cp<=0.1123085618019104\n",
      "   +0.0000 if cp<=0.0018955933861434533 & cp>=-0.04493551477789879\n",
      "   +0.7449 if cp>=0.034156351536512385\n",
      "   -0.0747 if cp>=0.1427478939294815\n",
      "Run episode 200 with rewards 8.0\n",
      "============ 201 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -0.8868 if cv>=-0.12885482907295207\n",
      "   -0.4553 if cp<=0.04927158281207085\n",
      "   -0.6126 if cp<=0.06451627463102341\n",
      "   -0.2742 if cp>=0.0648471787571907\n",
      "   -0.0078 if cp>=0.0939271003007889\n",
      "--------------\n",
      "   +0.7771 if cv>=-0.5943180918693542\n",
      "   +0.8047 if cp<=0.1123085618019104\n",
      "   +0.7771 if cp>=0.034156351536512385\n",
      "   -0.0000 if cp>=0.1427478939294815\n",
      "   +0.0144 if cp>=0.0939271003007889\n",
      "Run episode 201 with rewards 10.0\n",
      "============ 202 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.0781 if cv>=-0.12885482907295207\n",
      "   -0.6682 if cp<=0.04927158281207085\n",
      "   -0.7406 if cp<=0.06451627463102341\n",
      "   -1.3375 if cp>=0.0648471787571907\n",
      "   -0.0451 if cp<=0.11071850955486298 & cp>=0.06884123012423515\n",
      "--------------\n",
      "   +2.1245 if cv>=-0.5943180918693542\n",
      "   +0.8344 if cp<=0.1123085618019104\n",
      "   +1.4005 if cp>=0.034156351536512385\n",
      "   +1.2965 if cp>=0.0939271003007889\n",
      "   +1.2827 if cp>=0.16511429846286774\n",
      "Run episode 202 with rewards 10.0\n",
      "============ 203 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -0.6909 if cv>=-0.12885482907295207\n",
      "   -0.6039 if cp<=0.04927158281207085\n",
      "   -0.6372 if cp<=0.06451627463102341\n",
      "   -0.0537 if cp>=0.0648471787571907\n",
      "   -0.2705 if cp>=0.0297895397990942\n",
      "--------------\n",
      "   +0.8752 if cv>=-0.5943180918693542\n",
      "   +0.3917 if cp>=0.034156351536512385\n",
      "   +0.0571 if cp>=0.0939271003007889\n",
      "   +0.0000 if cp>=0.16511429846286774\n",
      "   +0.7355 if cp<=0.06991276964545251\n",
      "Run episode 203 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 204 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -0.7896 if cv>=-0.12885482907295207\n",
      "   -0.9880 if cp<=0.04927158281207085\n",
      "   -1.1596 if cp<=0.06451627463102341\n",
      "   -0.0543 if cp>=0.0297895397990942\n",
      "   +1.5912 if cv>=1.361337661743164\n",
      "--------------\n",
      "   +1.1168 if cv>=-0.5943180918693542\n",
      "   +0.0750 if cp>=0.034156351536512385\n",
      "   -0.7991 if cp>=0.0939271003007889\n",
      "   +1.3146 if cp<=0.06991276964545251\n",
      "   -1.3058 if cv>=1.361337661743164\n",
      "Run episode 204 with rewards 8.0\n",
      "============ 205 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.6500 if cv>=-0.12885482907295207\n",
      "   -0.4536 if cp<=0.04927158281207085\n",
      "   -0.5427 if cp<=0.06451627463102341\n",
      "   -0.6846 if cv>=1.361337661743164\n",
      "   -0.2703 if cp<=0.08310824185609819 & cp>=0.05792813003063203\n",
      "--------------\n",
      "   +1.6339 if cv>=-0.5943180918693542\n",
      "   +0.7824 if cp>=0.0939271003007889\n",
      "   +0.3680 if cp<=0.06991276964545251\n",
      "   +0.7824 if cv>=1.361337661743164\n",
      "   +0.6374 if cp<=0.08310824185609819\n",
      "Run episode 205 with rewards 8.0\n",
      "============ 206 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7924 if cv>=-0.12885482907295207\n",
      "   -0.5848 if cp<=0.04927158281207085\n",
      "   -0.6861 if cp<=0.06451627463102341\n",
      "   +0.0161 if cv>=1.361337661743164\n",
      "   -0.3761 if cp<=0.020832819119095805\n",
      "--------------\n",
      "   +0.7467 if cv>=-0.5943180918693542\n",
      "   -0.0414 if cp>=0.0939271003007889\n",
      "   -0.0414 if cv>=1.361337661743164\n",
      "   +0.7882 if cp<=0.08310824185609819\n",
      "   +0.7042 if cp<=0.06299763321876527\n",
      "Run episode 206 with rewards 10.0\n",
      "============ 207 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2055 if cv>=-0.12885482907295207\n",
      "   -0.6320 if cp<=0.04927158281207085\n",
      "   -0.7683 if cp<=0.06451627463102341\n",
      "   -0.5317 if cp<=0.020832819119095805\n",
      "   +0.2267 if cp>=0.13477735221385956\n",
      "--------------\n",
      "   +1.0772 if cv>=-0.5943180918693542\n",
      "   +0.2980 if cv>=1.361337661743164\n",
      "   +1.0141 if cp<=0.08310824185609819\n",
      "   +0.7792 if cp<=0.06299763321876527\n",
      "   -0.1693 if cp>=0.13477735221385956\n",
      "Run episode 207 with rewards 8.0\n",
      "============ 208 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0]\n",
      "   -0.5591 if cv>=-0.12885482907295207\n",
      "   -0.5706 if cp<=0.04927158281207085\n",
      "   -0.5591 if cp<=0.06451627463102341\n",
      "   -0.5437 if cp<=0.020832819119095805\n",
      "   -0.0516 if cp>=-0.002762948721647246\n",
      "--------------\n",
      "   +0.5748 if cv>=-0.5943180918693542\n",
      "   -0.0221 if cv>=1.361337661743164\n",
      "   +0.5748 if cp<=0.08310824185609819\n",
      "   +0.5748 if cp<=0.06299763321876527\n",
      "   +0.3347 if cp<=-0.018991316854953765\n",
      "Run episode 208 with rewards 11.0\n",
      "============ 209 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 0, 1, 1, 1]\n",
      "   -1.9580 if cv>=-0.12885482907295207\n",
      "   -2.3063 if cp<=0.04927158281207085\n",
      "   +2.5877 if cp<=0.06451627463102341\n",
      "   -1.1578 if cp<=0.020832819119095805\n",
      "   +1.5515 if cp<=0.0980374813079834 & cp>=0.056106582283973715\n",
      "--------------\n",
      "   +1.0420 if cv>=-0.5943180918693542\n",
      "   -1.2661 if cp<=0.08310824185609819\n",
      "   -1.4811 if cp<=0.06299763321876527\n",
      "   -0.0000 if cp<=-0.018991316854953765\n",
      "   +3.3943 if cv<=0.9509786367416384\n",
      "Run episode 209 with rewards 10.0\n",
      "============ 210 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   +0.0398 if cv>=-0.12885482907295207\n",
      "   -1.0844 if cp<=0.04927158281207085\n",
      "   -1.7722 if cp<=0.06451627463102341\n",
      "   +1.7008 if cp<=0.0980374813079834 & cp>=0.056106582283973715\n",
      "   -1.4024 if cp<=0.08132929503917695 & cp>=0.05482790023088455\n",
      "--------------\n",
      "   -0.4171 if cv>=-0.5943180918693542\n",
      "   +1.9508 if cp<=0.08310824185609819\n",
      "   +1.5498 if cp<=0.06299763321876527\n",
      "   +2.2406 if cv<=0.9509786367416384\n",
      "   -0.7453 if cp<=0.11877854764461518\n",
      "Run episode 210 with rewards 8.0\n",
      "============ 211 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.5013 if cp<=0.04927158281207085\n",
      "   -0.5579 if cp<=0.06451627463102341\n",
      "   -0.8916 if cp<=0.0980374813079834 & cp>=0.056106582283973715\n",
      "   -0.8916 if cp<=0.08132929503917695 & cp>=0.05482790023088455\n",
      "   -0.9482 if cp>=0.0457787148654461\n",
      "--------------\n",
      "   +1.1773 if cp<=0.08310824185609819\n",
      "   +0.3072 if cp<=0.06299763321876527\n",
      "   +0.2673 if cv<=0.9509786367416384\n",
      "   +1.1773 if cp<=0.11877854764461518\n",
      "   +0.8839 if cp>=0.0457787148654461\n",
      "Run episode 211 with rewards 9.0\n",
      "============ 212 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.3215 if cp<=0.06451627463102341\n",
      "   -0.4084 if cp<=0.0980374813079834 & cp>=0.056106582283973715\n",
      "   -0.0478 if cp<=0.08132929503917695 & cp>=0.05482790023088455\n",
      "   -0.2715 if cp>=0.0457787148654461\n",
      "   +0.4039 if cp>=0.13675861060619354\n",
      "--------------\n",
      "   +1.0069 if cp<=0.08310824185609819\n",
      "   +0.9861 if cp<=0.06299763321876527\n",
      "   +1.2939 if cp<=0.11877854764461518\n",
      "   +0.1125 if cp>=0.0457787148654461\n",
      "   +0.4201 if cp>=0.024920472502708436\n",
      "Run episode 212 with rewards 10.0\n",
      "============ 213 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   -1.3045 if cp<=0.06451627463102341\n",
      "   -0.0935 if cp<=0.0980374813079834 & cp>=0.056106582283973715\n",
      "   +0.0439 if cp>=0.0457787148654461\n",
      "   -0.0000 if cp>=0.13675861060619354\n",
      "   -0.2364 if cp>=-0.015002396889030933\n",
      "--------------\n",
      "   +1.2222 if cp<=0.08310824185609819\n",
      "   +1.0887 if cp<=0.06299763321876527\n",
      "   +0.8601 if cp<=0.11877854764461518\n",
      "   -0.0661 if cp>=0.024920472502708436\n",
      "   +0.6036 if cp<=-0.015002396889030933\n",
      "Run episode 213 with rewards 9.0\n",
      "============ 214 ===========\n",
      "10 actions [1, 1, 1, 1, 0, 1, 1, 1, 1, 1]\n",
      "   -0.5615 if cp<=0.06451627463102341\n",
      "   -0.7968 if cp<=0.0980374813079834 & cp>=0.056106582283973715\n",
      "   -0.6274 if cp>=0.0457787148654461\n",
      "   -0.6274 if cp>=-0.015002396889030933\n",
      "   +1.1899 if cv>=1.3558756113052368\n",
      "--------------\n",
      "   +0.9295 if cp<=0.08310824185609819\n",
      "   +0.5076 if cp<=0.06299763321876527\n",
      "   +2.1825 if cp<=0.11877854764461518\n",
      "   -0.0000 if cp<=-0.015002396889030933\n",
      "   -0.8257 if cv>=1.3558756113052368\n",
      "Run episode 214 with rewards 10.0\n",
      "============ 215 ===========\n",
      "18 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0]\n",
      "   +0.0485 if cp<=0.0980374813079834 & cp>=0.056106582283973715\n",
      "   +0.0485 if cp>=0.0457787148654461\n",
      "   +0.7719 if cp>=-0.015002396889030933\n",
      "   +0.0000 if cv>=1.3558756113052368\n",
      "   +2.6820 if cp<=0.02067835815250874 & cp>=-0.0031857557827606785\n",
      "--------------\n",
      "   -0.0435 if cp<=0.08310824185609819\n",
      "   -0.0435 if cp<=0.06299763321876527\n",
      "   -0.1734 if cp<=0.11877854764461518\n",
      "   -0.0000 if cv>=1.3558756113052368\n",
      "   +3.0502 if cp<=-0.0031857557827606785\n",
      "Run episode 215 with rewards 18.0\n",
      "============ 216 ===========\n",
      "16 actions [0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0]\n",
      "   -0.5790 if cp<=0.0980374813079834 & cp>=0.056106582283973715\n",
      "   +0.8259 if cp>=0.0457787148654461\n",
      "   -1.5422 if cp>=-0.015002396889030933\n",
      "   +4.8124 if cp<=0.02067835815250874 & cp>=-0.0031857557827606785\n",
      "   +1.8579 if cv>=1.3765403032302856\n",
      "--------------\n",
      "   +1.3478 if cp<=0.08310824185609819\n",
      "   +1.3478 if cp<=0.06299763321876527\n",
      "   -0.4495 if cp<=0.11877854764461518\n",
      "   +3.6316 if cp<=-0.0031857557827606785\n",
      "   -2.1250 if cp>=-0.025498259812593457 & cv<=0.16732363104820264\n",
      "Run episode 216 with rewards 16.0\n",
      "============ 217 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +2.0124 if cp>=0.0457787148654461\n",
      "   -3.2302 if cp>=-0.015002396889030933\n",
      "   -0.0000 if cp<=0.02067835815250874 & cp>=-0.0031857557827606785\n",
      "   +1.1559 if cv>=1.3765403032302856\n",
      "   +4.3412 if cp>=0.049455877393484116 & cv<=0.36111724376678467\n",
      "--------------\n",
      "   +1.3324 if cp<=0.08310824185609819\n",
      "   +0.0340 if cp<=0.06299763321876527\n",
      "   +0.0000 if cp<=-0.0031857557827606785\n",
      "   -3.9682 if cp>=-0.025498259812593457 & cv<=0.16732363104820264\n",
      "   +2.4196 if pa>=0.04201820492744447 & pav>=-0.4616793692111964\n",
      "Run episode 217 with rewards 8.0\n",
      "============ 218 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.4777 if cp>=0.0457787148654461\n",
      "   -2.8540 if cp>=-0.015002396889030933\n",
      "   +0.0000 if cv>=1.3765403032302856\n",
      "   +0.0000 if cp>=0.049455877393484116 & cv<=0.36111724376678467\n",
      "   -2.0825 if pav>=0.013356895186007023\n",
      "--------------\n",
      "   +1.1796 if cp<=0.08310824185609819\n",
      "   +0.7006 if cp<=0.06299763321876527\n",
      "   +0.1249 if cp>=-0.025498259812593457 & cv<=0.16732363104820264\n",
      "   +0.0000 if pa>=0.04201820492744447 & pav>=-0.4616793692111964\n",
      "   +1.0816 if cp>=0.04396088793873787\n",
      "Run episode 218 with rewards 9.0\n",
      "============ 219 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   -0.2374 if cp>=0.0457787148654461\n",
      "   -1.5817 if cp>=-0.015002396889030933\n",
      "   +0.0000 if cp>=0.049455877393484116 & cv<=0.36111724376678467\n",
      "   -0.2265 if pav>=0.013356895186007023\n",
      "   -0.9473 if cp<=0.03313287198543549\n",
      "--------------\n",
      "   +0.6778 if cp<=0.08310824185609819\n",
      "   +0.6296 if cp<=0.06299763321876527\n",
      "   +0.0252 if cp>=-0.025498259812593457 & cv<=0.16732363104820264\n",
      "   +0.1071 if cp>=0.04396088793873787\n",
      "   +0.6956 if \n",
      "Run episode 219 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 220 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   +0.6112 if cp>=0.0457787148654461\n",
      "   -1.0578 if cp>=-0.015002396889030933\n",
      "   -0.2669 if pav>=0.013356895186007023\n",
      "   -1.2421 if cp<=0.03313287198543549\n",
      "   +1.2109 if cv>=1.3737422227859497\n",
      "--------------\n",
      "   +1.5944 if cp<=0.08310824185609819\n",
      "   +0.9270 if cp<=0.06299763321876527\n",
      "   -1.1331 if cp>=0.04396088793873787\n",
      "   -0.2061 if \n",
      "   -0.3327 if cp>=0.11457589268684387\n",
      "Run episode 220 with rewards 9.0\n",
      "============ 221 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2635 if cp>=0.0457787148654461\n",
      "   -1.3639 if cp>=-0.015002396889030933\n",
      "   -0.6237 if cp<=0.03313287198543549\n",
      "   -1.2558 if cv>=1.3737422227859497\n",
      "   -1.9094 if \n",
      "--------------\n",
      "   +1.3893 if cp<=0.08310824185609819\n",
      "   +1.3893 if cp<=0.06299763321876527\n",
      "   +0.6456 if cp>=0.04396088793873787\n",
      "   -0.0000 if cp>=0.11457589268684387\n",
      "   +0.4579 if cp<=0.046323141455650335 & cp>=-0.01849757581949234\n",
      "Run episode 221 with rewards 9.0\n",
      "============ 222 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.5057 if cp>=0.0457787148654461\n",
      "   -0.8870 if cp>=-0.015002396889030933\n",
      "   -0.0497 if cv>=1.3737422227859497\n",
      "   -0.8870 if \n",
      "   -0.4101 if cp<=0.06492680907249451\n",
      "--------------\n",
      "   +0.5443 if cp<=0.08310824185609819\n",
      "   +0.4980 if cp<=0.06299763321876527\n",
      "   +0.1412 if cp>=0.04396088793873787\n",
      "   +0.4554 if cp<=0.046323141455650335 & cp>=-0.01849757581949234\n",
      "   +0.0960 if cp<=0.0977122336626053 & cp>=0.06492680907249451\n",
      "Run episode 222 with rewards 9.0\n",
      "============ 223 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   +0.0778 if cp>=0.0457787148654461\n",
      "   -0.2127 if cp>=-0.015002396889030933\n",
      "   -1.3779 if \n",
      "   -1.4913 if cp<=0.06492680907249451\n",
      "   -0.5645 if cp<=-0.024439392238855363\n",
      "--------------\n",
      "   +1.1188 if cp<=0.08310824185609819\n",
      "   +1.1578 if cp<=0.06299763321876527\n",
      "   -0.0221 if cp>=0.04396088793873787\n",
      "   +0.3585 if cp<=0.046323141455650335 & cp>=-0.01849757581949234\n",
      "   +0.9119 if cp<=-0.013717117905616758\n",
      "Run episode 223 with rewards 9.0\n",
      "============ 224 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -0.4458 if cp>=-0.015002396889030933\n",
      "   -0.4458 if \n",
      "   -1.1007 if cp<=0.06492680907249451\n",
      "   -0.0000 if cp<=-0.024439392238855363\n",
      "   +1.3662 if cp>=0.08791697174310685\n",
      "--------------\n",
      "   +1.0375 if cp<=0.08310824185609819\n",
      "   +0.6098 if cp<=0.06299763321876527\n",
      "   +0.5202 if cp<=0.046323141455650335 & cp>=-0.01849757581949234\n",
      "   +0.0000 if cp<=-0.013717117905616758\n",
      "   -1.2801 if cv>=1.3497552871704102\n",
      "Run episode 224 with rewards 8.0\n",
      "============ 225 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 0, 1, 1]\n",
      "   -1.3961 if cp>=-0.015002396889030933\n",
      "   -1.3961 if \n",
      "   -0.3539 if cp<=0.06492680907249451\n",
      "   -0.9876 if cp>=0.08791697174310685\n",
      "   -0.3031 if cp<=0.044920961558818834\n",
      "--------------\n",
      "   +1.0980 if cp<=0.08310824185609819\n",
      "   +0.7885 if cp<=0.06299763321876527\n",
      "   +0.6633 if cp<=0.046323141455650335 & cp>=-0.01849757581949234\n",
      "   +0.5561 if cv>=1.3497552871704102\n",
      "   +0.4209 if cp<=0.02766039408743382\n",
      "Run episode 225 with rewards 9.0\n",
      "============ 226 ===========\n",
      "37 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0]\n",
      "   -0.1328 if cp>=-0.015002396889030933\n",
      "   -0.1328 if \n",
      "   -0.4797 if cp<=0.06492680907249451\n",
      "   +0.9036 if cp>=0.08791697174310685\n",
      "   +3.1130 if cv>=1.0825722217559814\n",
      "--------------\n",
      "   -1.0805 if cp<=0.08310824185609819\n",
      "   -1.4985 if cp<=0.06299763321876527\n",
      "   +2.1927 if cp<=0.046323141455650335 & cp>=-0.01849757581949234\n",
      "   -0.0000 if cv>=1.3497552871704102\n",
      "   +1.1988 if cp<=0.009402625262737276\n",
      "Run episode 226 with rewards 37.0\n",
      "============ 227 ===========\n",
      "19 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1]\n",
      "   +2.4167 if \n",
      "   -2.6046 if cp<=0.06492680907249451\n",
      "   -2.3563 if cp>=0.08791697174310685\n",
      "   +2.5248 if cv>=1.0825722217559814\n",
      "   -3.1477 if cv<=0.7437525868415833 & pa>=0.03145952150225639\n",
      "--------------\n",
      "   -4.4938 if cp<=0.08310824185609819\n",
      "   +0.0244 if cp<=0.06299763321876527\n",
      "   +3.8995 if cp<=0.046323141455650335 & cp>=-0.01849757581949234\n",
      "   +2.8686 if cp<=0.009402625262737276\n",
      "   +2.6250 if pa>=0.03145952150225639\n",
      "Run episode 227 with rewards 19.0\n",
      "============ 228 ===========\n",
      "12 actions [1, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0]\n",
      "   +0.3051 if \n",
      "   -2.8757 if cp<=0.06492680907249451\n",
      "   +0.0000 if cv>=1.0825722217559814\n",
      "   +0.0000 if cv<=0.7437525868415833 & pa>=0.03145952150225639\n",
      "   +4.1580 if cv>=0.9623889923095703\n",
      "--------------\n",
      "   -1.9105 if cp<=0.08310824185609819\n",
      "   +4.2164 if cp<=0.046323141455650335 & cp>=-0.01849757581949234\n",
      "   +1.9111 if cp<=0.009402625262737276\n",
      "   +0.0000 if pa>=0.03145952150225639\n",
      "   -4.5500 if cv>=0.9623889923095703\n",
      "Run episode 228 with rewards 12.0\n",
      "============ 229 ===========\n",
      "12 actions [0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   +0.2870 if \n",
      "   +0.0297 if cp<=0.06492680907249451\n",
      "   +0.0000 if cv<=0.7437525868415833 & pa>=0.03145952150225639\n",
      "   +0.5410 if cv>=0.9623889923095703\n",
      "   -3.5815 if cp<=-0.026150033622980115\n",
      "--------------\n",
      "   -2.6236 if cp<=0.08310824185609819\n",
      "   +3.1329 if cp<=0.046323141455650335 & cp>=-0.01849757581949234\n",
      "   -0.7022 if cp<=0.009402625262737276\n",
      "   -1.1847 if cv>=0.9623889923095703\n",
      "   +3.9254 if cp<=-0.026150033622980115\n",
      "Run episode 229 with rewards 12.0\n",
      "============ 230 ===========\n",
      "18 actions [0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1]\n",
      "   +0.9477 if \n",
      "   +0.9477 if cp<=0.06492680907249451\n",
      "   -0.0000 if cv>=0.9623889923095703\n",
      "   -2.8797 if cp<=-0.026150033622980115\n",
      "   -0.1199 if cp>=0.010723299719393264\n",
      "--------------\n",
      "   -1.6386 if cp<=0.08310824185609819\n",
      "   -1.2068 if cp<=0.046323141455650335 & cp>=-0.01849757581949234\n",
      "   -0.0000 if cv>=0.9623889923095703\n",
      "   +1.0694 if cp<=-0.026150033622980115\n",
      "   +4.8944 if cp>=0.019997090101242065\n",
      "Run episode 230 with rewards 18.0\n",
      "============ 231 ===========\n",
      "16 actions [0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0]\n",
      "   -0.6142 if \n",
      "   +1.5385 if cp<=0.06492680907249451\n",
      "   -0.0000 if cp<=-0.026150033622980115\n",
      "   -0.6142 if cp>=0.010723299719393264\n",
      "   +4.2520 if cp>=0.04840146899223328\n",
      "--------------\n",
      "   -2.0512 if cp<=0.08310824185609819\n",
      "   +4.1506 if cp<=0.046323141455650335 & cp>=-0.01849757581949234\n",
      "   +0.0000 if cp<=-0.026150033622980115\n",
      "   +1.4362 if cp>=0.019997090101242065\n",
      "   +4.3198 if cp>=0.04840146899223328 & cv<=0.5903132915496828 & cv>=0.31735821366310135 & pa<=0.011491686664521694\n",
      "Run episode 231 with rewards 16.0\n",
      "============ 232 ===========\n",
      "14 actions [1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0]\n",
      "   +1.3929 if \n",
      "   -0.2474 if cp<=0.06492680907249451\n",
      "   -1.3982 if cp>=0.010723299719393264\n",
      "   +1.6402 if cp>=0.04840146899223328\n",
      "   +0.3873 if cp<=0.017517412081360838\n",
      "--------------\n",
      "   -0.5662 if cp<=0.08310824185609819\n",
      "   +1.0197 if cp<=0.046323141455650335 & cp>=-0.01849757581949234\n",
      "   +2.0411 if cp>=0.019997090101242065\n",
      "   -0.0000 if cp>=0.04840146899223328 & cv<=0.5903132915496828 & cv>=0.31735821366310135 & pa<=0.011491686664521694\n",
      "   +4.0616 if cv<=0.036152634769678116\n",
      "Run episode 232 with rewards 14.0\n",
      "============ 233 ===========\n",
      "15 actions [1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0]\n",
      "   +1.9358 if \n",
      "   -0.1252 if cp>=0.010723299719393264\n",
      "   -1.3353 if cp>=0.04840146899223328\n",
      "   +2.0609 if cp<=0.017517412081360838\n",
      "   -2.8069 if cv<=0.3471404016017915\n",
      "--------------\n",
      "   +1.8641 if cp<=0.08310824185609819\n",
      "   -0.2040 if cp<=0.046323141455650335 & cp>=-0.01849757581949234\n",
      "   -1.0062 if cp>=0.019997090101242065\n",
      "   +3.3142 if cv<=0.036152634769678116\n",
      "   -3.1836 if cp<=0.0025478094350546597 & cv>=0.10980756580829622\n",
      "Run episode 233 with rewards 15.0\n",
      "============ 234 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 0, 1, 1, 0]\n",
      "   -0.8174 if \n",
      "   +1.2435 if cp>=0.04840146899223328\n",
      "   -0.0000 if cp<=0.017517412081360838\n",
      "   -2.2331 if cv<=0.3471404016017915\n",
      "   -2.7624 if cp<=0.08573301434516907 & cv>=0.23767761886119843 & pav>=-0.6158170223236084\n",
      "--------------\n",
      "   +1.0811 if cp<=0.08310824185609819\n",
      "   -0.6553 if cp>=0.019997090101242065\n",
      "   -0.0000 if cv<=0.036152634769678116\n",
      "   -0.0000 if cp<=0.0025478094350546597 & cv>=0.10980756580829622\n",
      "   +3.3173 if cp<=0.08573301434516907 & pav>=-0.6158170223236084\n",
      "Run episode 234 with rewards 9.0\n",
      "============ 235 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1]\n",
      "   -1.7065 if \n",
      "   -1.0094 if cp>=0.04840146899223328\n",
      "   -0.1005 if cv<=0.3471404016017915\n",
      "   -0.0000 if cp<=0.08573301434516907 & cv>=0.23767761886119843 & pav>=-0.6158170223236084\n",
      "   +2.5214 if cp<=0.02535203844308854 & cp>=-0.002927413972793136\n",
      "--------------\n",
      "   +1.8911 if cp<=0.08310824185609819\n",
      "   +1.0339 if cp>=0.019997090101242065\n",
      "   +0.1287 if cv<=0.036152634769678116\n",
      "   +0.2567 if cp<=0.08573301434516907 & pav>=-0.6158170223236084\n",
      "   -2.4587 if cp<=0.02535203844308854 & cp>=-0.002927413972793136\n",
      "Run episode 235 with rewards 11.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 236 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8201 if \n",
      "   -0.1740 if cp>=0.04840146899223328\n",
      "   -1.0407 if cv<=0.3471404016017915\n",
      "   +2.1167 if cp<=0.02535203844308854 & cp>=-0.002927413972793136\n",
      "   -1.2097 if cp<=-0.0060440110974013805 & cp>=-0.025669584050774574\n",
      "--------------\n",
      "   +0.6354 if cp<=0.08310824185609819\n",
      "   +0.9155 if cp>=0.019997090101242065\n",
      "   +0.7596 if cp<=0.08573301434516907 & pav>=-0.6158170223236084\n",
      "   -1.8429 if cp<=0.02535203844308854 & cp>=-0.002927413972793136\n",
      "   +1.5767 if cp<=-0.0060440110974013805\n",
      "Run episode 236 with rewards 9.0\n",
      "============ 237 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.3394 if \n",
      "   -0.2693 if cv<=0.3471404016017915\n",
      "   +0.0000 if cp<=0.02535203844308854 & cp>=-0.002927413972793136\n",
      "   +0.0000 if cp<=-0.0060440110974013805 & cp>=-0.025669584050774574\n",
      "   -1.2979 if cp<=0.10839999169111253\n",
      "--------------\n",
      "   +2.1159 if cp>=0.019997090101242065\n",
      "   +0.5396 if cp<=0.08573301434516907 & pav>=-0.6158170223236084\n",
      "   -0.0000 if cp<=0.02535203844308854 & cp>=-0.002927413972793136\n",
      "   -0.0000 if cp<=-0.0060440110974013805\n",
      "   +0.9198 if cp<=0.07540008276700974 & cp>=0.03990563005208969\n",
      "Run episode 237 with rewards 9.0\n",
      "============ 238 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 0, 1, 1, 1, 1]\n",
      "   -0.9531 if \n",
      "   -0.3631 if cv<=0.3471404016017915\n",
      "   -0.0000 if cp<=0.02535203844308854 & cp>=-0.002927413972793136\n",
      "   -0.9439 if cp<=0.10839999169111253\n",
      "   +0.0795 if cp>=0.1474989503622055\n",
      "--------------\n",
      "   +1.2389 if cp>=0.019997090101242065\n",
      "   +0.6323 if cp<=0.08573301434516907 & pav>=-0.6158170223236084\n",
      "   -0.0000 if cp<=0.02535203844308854 & cp>=-0.002927413972793136\n",
      "   +0.4836 if cp<=0.07540008276700974 & cp>=0.03990563005208969\n",
      "   -0.1323 if cp>=0.1474989503622055\n",
      "Run episode 238 with rewards 10.0\n",
      "============ 239 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1]\n",
      "   +0.2119 if \n",
      "   -0.7481 if cv<=0.3471404016017915\n",
      "   +0.2119 if cp<=0.10839999169111253\n",
      "   -0.0000 if cp>=0.1474989503622055\n",
      "   -3.3480 if cv<=0.8995623111724854\n",
      "--------------\n",
      "   +0.8559 if cp>=0.019997090101242065\n",
      "   +1.6862 if cp<=0.08573301434516907 & pav>=-0.6158170223236084\n",
      "   +0.3577 if cp<=0.07540008276700974 & cp>=0.03990563005208969\n",
      "   +0.0000 if cp>=0.1474989503622055\n",
      "   -3.0374 if cp<=0.021229229681193836 & cv>=0.8995623111724854\n",
      "Run episode 239 with rewards 11.0\n",
      "============ 240 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8352 if \n",
      "   -0.2481 if cv<=0.3471404016017915\n",
      "   -1.0929 if cp<=0.10839999169111253\n",
      "   -1.6575 if cv<=0.8995623111724854\n",
      "   +1.2972 if cp<=0.031649731099605574 & cv>=1.0008083581924438\n",
      "--------------\n",
      "   +1.5483 if cp>=0.019997090101242065\n",
      "   +0.5279 if cp<=0.08573301434516907 & pav>=-0.6158170223236084\n",
      "   +1.2577 if cp<=0.07540008276700974 & cp>=0.03990563005208969\n",
      "   -1.6902 if cp<=0.021229229681193836 & cv>=0.8995623111724854\n",
      "   +1.1959 if cp<=-0.004477961920201778\n",
      "Run episode 240 with rewards 11.0\n",
      "============ 241 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.4066 if \n",
      "   -1.1863 if cp<=0.10839999169111253\n",
      "   -0.9237 if cv<=0.8995623111724854\n",
      "   +0.0000 if cp<=0.031649731099605574 & cv>=1.0008083581924438\n",
      "   -0.9237 if pa>=0.015332168899476542\n",
      "--------------\n",
      "   +0.6853 if cp>=0.019997090101242065\n",
      "   +0.3416 if cp<=0.07540008276700974 & cp>=0.03990563005208969\n",
      "   +0.0000 if cp<=0.021229229681193836 & cv>=0.8995623111724854\n",
      "   +0.0000 if cp<=-0.004477961920201778\n",
      "   +1.4410 if cp<=0.11326095461845398\n",
      "Run episode 241 with rewards 9.0\n",
      "============ 242 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1730 if \n",
      "   -1.1730 if cp<=0.10839999169111253\n",
      "   -0.9019 if cv<=0.8995623111724854\n",
      "   +0.0000 if pa>=0.015332168899476542\n",
      "   -0.0025 if cp>=0.029253367707133302\n",
      "--------------\n",
      "   +0.1021 if cp>=0.019997090101242065\n",
      "   +0.0069 if cp<=0.07540008276700974 & cp>=0.03990563005208969\n",
      "   +0.2679 if cp<=0.021229229681193836 & cv>=0.8995623111724854\n",
      "   +1.1008 if cp<=0.11326095461845398\n",
      "   +0.3466 if cp<=-0.034166553616523744\n",
      "Run episode 242 with rewards 9.0\n",
      "============ 243 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   -1.2549 if \n",
      "   -1.2549 if cp<=0.10839999169111253\n",
      "   -0.9804 if cv<=0.8995623111724854\n",
      "   -0.2745 if cp>=0.029253367707133302\n",
      "   -0.0049 if cp>=0.06594899371266366\n",
      "--------------\n",
      "   +0.3668 if cp>=0.019997090101242065\n",
      "   -0.0000 if cp<=0.021229229681193836 & cv>=0.8995623111724854\n",
      "   +1.2836 if cp<=0.11326095461845398\n",
      "   -0.0000 if cp<=-0.034166553616523744\n",
      "   +0.0049 if cp>=0.06594899371266366\n",
      "Run episode 243 with rewards 10.0\n",
      "============ 244 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   -0.5195 if \n",
      "   -1.7807 if cp<=0.10839999169111253\n",
      "   -1.0495 if cv<=0.8995623111724854\n",
      "   +0.3741 if cp>=0.029253367707133302\n",
      "   +0.7683 if cv>=1.570242166519165\n",
      "--------------\n",
      "   -0.3468 if cp>=0.019997090101242065\n",
      "   +1.5779 if cp<=0.11326095461845398\n",
      "   +0.0000 if cp<=-0.034166553616523744\n",
      "   -0.8498 if cp>=0.06594899371266366\n",
      "   -1.4292 if cp>=0.09785044938325882\n",
      "Run episode 244 with rewards 10.0\n",
      "============ 245 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2955 if \n",
      "   -1.9205 if cp<=0.10839999169111253\n",
      "   -0.6772 if cv<=0.8995623111724854\n",
      "   +0.0000 if cv>=1.570242166519165\n",
      "   +0.7977 if cv>=1.178801941871643\n",
      "--------------\n",
      "   +0.5177 if cp>=0.019997090101242065\n",
      "   +1.4841 if cp<=0.11326095461845398\n",
      "   -0.2660 if cp>=0.06594899371266366\n",
      "   -0.5778 if cp>=0.09785044938325882\n",
      "   -1.3421 if cv>=1.178801941871643\n",
      "Run episode 245 with rewards 9.0\n",
      "============ 246 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   -1.2532 if \n",
      "   -1.2532 if cp<=0.10839999169111253\n",
      "   -0.8083 if cv<=0.8995623111724854\n",
      "   -0.2774 if cv>=1.178801941871643\n",
      "   +0.0081 if cp>=0.025159078277647504\n",
      "--------------\n",
      "   +0.0067 if cp>=0.019997090101242065\n",
      "   +0.9669 if cp<=0.11326095461845398\n",
      "   +0.0000 if cp>=0.09785044938325882\n",
      "   +0.1635 if cv>=1.178801941871643\n",
      "   +0.2884 if cp<=-0.04248329848051071\n",
      "Run episode 246 with rewards 10.0\n",
      "============ 247 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.4708 if \n",
      "   -2.0041 if cp<=0.10839999169111253\n",
      "   -1.0151 if cv<=0.8995623111724854\n",
      "   +0.7604 if cv>=1.178801941871643\n",
      "   -0.5884 if cp<=0.0604505017399788 & cp>=0.014509056508541108\n",
      "--------------\n",
      "   -0.3357 if cp>=0.019997090101242065\n",
      "   +1.6827 if cp<=0.11326095461845398\n",
      "   -0.9297 if cv>=1.178801941871643\n",
      "   -0.0000 if cp<=-0.04248329848051071\n",
      "   -1.4880 if cp>=0.10217128247022629\n",
      "Run episode 247 with rewards 8.0\n",
      "============ 248 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.3210 if cp<=0.10839999169111253\n",
      "   -1.1817 if cv<=0.8995623111724854\n",
      "   +0.0894 if cv>=1.178801941871643\n",
      "   -0.5346 if cp<=0.0604505017399788 & cp>=0.014509056508541108\n",
      "   +0.3116 if cp>=0.07479312270879745\n",
      "--------------\n",
      "   +0.0911 if cp>=0.019997090101242065\n",
      "   +0.8232 if cp<=0.11326095461845398\n",
      "   -0.0165 if cv>=1.178801941871643\n",
      "   -0.0000 if cp>=0.10217128247022629\n",
      "   +0.4900 if cp<=0.0017849728465080283\n",
      "Run episode 248 with rewards 8.0\n",
      "============ 249 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0]\n",
      "   -1.3319 if cp<=0.10839999169111253\n",
      "   -0.7925 if cv<=0.8995623111724854\n",
      "   -0.6376 if cp<=0.0604505017399788 & cp>=0.014509056508541108\n",
      "   +0.2669 if cp>=0.07479312270879745\n",
      "   -1.0611 if cp<=0.08978134840726854\n",
      "--------------\n",
      "   +0.2381 if cp>=0.019997090101242065\n",
      "   +1.4451 if cp<=0.11326095461845398\n",
      "   -1.2070 if cv>=1.178801941871643\n",
      "   -0.0000 if cp<=0.0017849728465080283\n",
      "   -0.1477 if cp>=0.043974905461072925\n",
      "Run episode 249 with rewards 11.0\n",
      "============ 250 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 0, 1, 0, 0]\n",
      "   -1.4891 if cp<=0.10839999169111253\n",
      "   -0.6338 if cv<=0.8995623111724854\n",
      "   -0.6338 if cp<=0.0604505017399788 & cp>=0.014509056508541108\n",
      "   -0.9284 if cp<=0.08978134840726854\n",
      "   -1.1991 if cp<=0.14460650086402893 & cp>=0.14460650086402893 & cv<=1.1555551290512085\n",
      "--------------\n",
      "   +0.6625 if cp>=0.019997090101242065\n",
      "   +1.1254 if cp<=0.11326095461845398\n",
      "   -2.2578 if cv>=1.178801941871643\n",
      "   +0.3410 if cp>=0.043974905461072925\n",
      "   +1.0646 if cp>=0.14460650086402893\n",
      "Run episode 250 with rewards 10.0\n",
      "============ 251 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 0, 1, 1]\n",
      "   +1.0494 if cp<=0.10839999169111253\n",
      "   -0.8387 if cv<=0.8995623111724854\n",
      "   -1.0126 if cp<=0.08978134840726854\n",
      "   +0.0000 if cp<=0.14460650086402893 & cp>=0.14460650086402893 & cv<=1.1555551290512085\n",
      "   -2.1567 if cv<=1.026763415336609\n",
      "--------------\n",
      "   +0.9990 if cp>=0.019997090101242065\n",
      "   -0.9878 if cp<=0.11326095461845398\n",
      "   -2.5818 if cv>=1.178801941871643\n",
      "   +0.7895 if cp>=0.14460650086402893\n",
      "   +1.2309 if cp<=0.08899649679660798\n",
      "Run episode 251 with rewards 9.0\n",
      "============ 252 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -0.1630 if cp<=0.10839999169111253\n",
      "   -0.8909 if cv<=0.8995623111724854\n",
      "   -1.0890 if cp<=0.08978134840726854\n",
      "   -1.3125 if cv<=1.026763415336609\n",
      "   +1.7684 if cv>=1.0122532963752748\n",
      "--------------\n",
      "   -0.1406 if cp>=0.019997090101242065\n",
      "   +0.6179 if cp<=0.11326095461845398\n",
      "   -0.0000 if cv>=1.178801941871643\n",
      "   +1.1753 if cp<=0.08899649679660798\n",
      "   -1.6073 if cv>=1.0122532963752748\n",
      "Run episode 252 with rewards 8.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 253 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.5309 if cv<=0.8995623111724854\n",
      "   -2.1258 if cp<=0.08978134840726854\n",
      "   -0.5946 if cv<=1.026763415336609\n",
      "   -1.5312 if cv>=1.0122532963752748\n",
      "   -1.4778 if cp>=0.06121201813220978\n",
      "--------------\n",
      "   +1.4919 if cp>=0.019997090101242065\n",
      "   +1.6140 if cp<=0.11326095461845398\n",
      "   +1.6140 if cp<=0.08899649679660798\n",
      "   +1.4919 if cv>=1.0122532963752748\n",
      "   +1.4826 if cp>=0.06121201813220978\n",
      "Run episode 253 with rewards 10.0\n",
      "============ 254 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 0, 1, 0, 1]\n",
      "   -0.8475 if cp<=0.08978134840726854\n",
      "   -0.8397 if cv<=1.026763415336609\n",
      "   +0.0106 if cv>=1.0122532963752748\n",
      "   +0.0175 if cp>=0.06121201813220978\n",
      "   -0.1117 if cp>=0.0056287206709384925\n",
      "--------------\n",
      "   +0.1092 if cp>=0.019997090101242065\n",
      "   +0.8819 if cp<=0.11326095461845398\n",
      "   +0.8527 if cp<=0.08899649679660798\n",
      "   -0.0190 if cv>=1.0122532963752748\n",
      "   +0.2863 if cp<=-0.009264831990003585\n",
      "Run episode 254 with rewards 10.0\n",
      "============ 255 ===========\n",
      "37 actions [1, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0]\n",
      "   -0.2586 if cp<=0.08978134840726854\n",
      "   -2.5212 if cv<=1.026763415336609\n",
      "   -0.2333 if cp>=0.06121201813220978\n",
      "   +1.1304 if cp>=0.0056287206709384925\n",
      "   +2.0172 if cp>=0.036443761736154566\n",
      "--------------\n",
      "   -1.8358 if cp>=0.019997090101242065\n",
      "   +0.4149 if cp<=0.11326095461845398\n",
      "   +1.7911 if cp<=0.08899649679660798\n",
      "   +0.0000 if cp<=-0.009264831990003585\n",
      "   -2.3338 if cp<=0.074497190117836 & cv>=0.9915950536727905\n",
      "Run episode 255 with rewards 37.0\n",
      "============ 256 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   -5.2802 if cp<=0.08978134840726854\n",
      "   +0.5693 if cv<=1.026763415336609\n",
      "   +0.5692 if cp>=0.0056287206709384925\n",
      "   +4.0586 if cp>=0.036443761736154566\n",
      "   -2.2307 if cp>=0.08682473748922348\n",
      "--------------\n",
      "   -4.2596 if cp>=0.019997090101242065\n",
      "   +0.8622 if cp<=0.11326095461845398\n",
      "   +3.7890 if cp<=0.08899649679660798\n",
      "   +0.0000 if cp<=0.074497190117836 & cv>=0.9915950536727905\n",
      "   +4.2211 if cp>=0.03486344441771507 & pa>=-0.059788168966770174 & pav>=-0.256219345331192\n",
      "Run episode 256 with rewards 9.0\n",
      "============ 257 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -1.2821 if cp<=0.08978134840726854\n",
      "   -1.2772 if cv<=1.026763415336609\n",
      "   -0.2095 if cp>=0.036443761736154566\n",
      "   +0.1837 if cp>=0.08682473748922348\n",
      "   -1.3953 if cv<=1.0014243125915527\n",
      "--------------\n",
      "   +0.4957 if cp>=0.019997090101242065\n",
      "   +0.6311 if cp<=0.11326095461845398\n",
      "   +1.8124 if cp<=0.08899649679660798\n",
      "   +0.0000 if cp>=0.03486344441771507 & pa>=-0.059788168966770174 & pav>=-0.256219345331192\n",
      "   +0.0402 if cp<=0.034422870725393295\n",
      "Run episode 257 with rewards 10.0\n",
      "============ 258 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.5728 if cp<=0.08978134840726854\n",
      "   -0.5728 if cv<=1.026763415336609\n",
      "   -2.6787 if cp>=0.036443761736154566\n",
      "   -0.5728 if cv<=1.0014243125915527\n",
      "   -2.1742 if cp>=0.17146804928779602\n",
      "--------------\n",
      "   +2.8968 if cp>=0.019997090101242065\n",
      "   +0.3857 if cp<=0.11326095461845398\n",
      "   +0.0756 if cp<=0.08899649679660798\n",
      "   +0.0000 if cp<=0.034422870725393295\n",
      "   +2.1712 if cp>=0.17146804928779602\n",
      "Run episode 258 with rewards 8.0\n",
      "============ 259 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.5540 if cp<=0.08978134840726854\n",
      "   -1.5504 if cv<=1.026763415336609\n",
      "   +0.0118 if cp>=0.036443761736154566\n",
      "   +0.0000 if cp>=0.17146804928779602\n",
      "   -0.7747 if cp<=-0.026924532651901242\n",
      "--------------\n",
      "   +0.1159 if cp>=0.019997090101242065\n",
      "   +1.0474 if cp<=0.11326095461845398\n",
      "   +1.0474 if cp<=0.08899649679660798\n",
      "   +0.0000 if cp>=0.17146804928779602\n",
      "   +0.8066 if cp<=-0.01038361601531504\n",
      "Run episode 259 with rewards 9.0\n",
      "============ 260 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   -1.1217 if cp<=0.08978134840726854\n",
      "   -0.9372 if cv<=1.026763415336609\n",
      "   +0.0055 if cp>=0.036443761736154566\n",
      "   -0.0000 if cp<=-0.026924532651901242\n",
      "   +0.0688 if cp>=0.0815315693616867\n",
      "--------------\n",
      "   +0.1425 if cp>=0.019997090101242065\n",
      "   +0.7470 if cp<=0.11326095461845398\n",
      "   +0.7470 if cp<=0.08899649679660798\n",
      "   +0.4625 if cp<=-0.01038361601531504\n",
      "   +0.4324 if cp>=-0.01870761103928089\n",
      "Run episode 260 with rewards 10.0\n",
      "============ 261 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -2.0337 if cp<=0.08978134840726854\n",
      "   -0.9588 if cv<=1.026763415336609\n",
      "   +0.6406 if cp>=0.036443761736154566\n",
      "   +1.0521 if cp>=0.0815315693616867\n",
      "   +1.5081 if cp>=0.14960791170597076\n",
      "--------------\n",
      "   +1.6845 if cp<=0.11326095461845398\n",
      "   +1.2814 if cp<=0.08899649679660798\n",
      "   +0.0000 if cp<=-0.01038361601531504\n",
      "   -0.2805 if cp>=-0.01870761103928089\n",
      "   -1.3734 if cp>=0.14960791170597076\n",
      "Run episode 261 with rewards 9.0\n",
      "============ 262 ===========\n",
      "12 actions [1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0]\n",
      "   -1.0747 if cp<=0.08978134840726854\n",
      "   -0.9532 if cv<=1.026763415336609\n",
      "   +0.4164 if cp>=0.0815315693616867\n",
      "   -0.0000 if cp>=0.14960791170597076\n",
      "   +0.8789 if cv>=1.4158145189285278\n",
      "--------------\n",
      "   +0.3351 if cp<=0.11326095461845398\n",
      "   +0.9099 if cp<=0.08899649679660798\n",
      "   +0.7154 if cp>=-0.01870761103928089\n",
      "   -0.0000 if cp>=0.14960791170597076\n",
      "   +0.2618 if cp<=0.04631521627306939 & cp>=0.00978351142257452\n",
      "Run episode 262 with rewards 12.0\n",
      "============ 263 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -0.6735 if cp<=0.08978134840726854\n",
      "   -2.7525 if cv<=1.026763415336609\n",
      "   +2.3956 if cp>=0.0815315693616867\n",
      "   +0.0000 if cv>=1.4158145189285278\n",
      "   +1.0411 if cp>=0.15932092666625977\n",
      "--------------\n",
      "   -0.8542 if cp<=0.11326095461845398\n",
      "   +2.6337 if cp<=0.08899649679660798\n",
      "   +0.0681 if cp>=-0.01870761103928089\n",
      "   +0.6964 if cp<=0.04631521627306939 & cp>=0.00978351142257452\n",
      "   -1.3426 if cv>=1.1370278596878052\n",
      "Run episode 263 with rewards 10.0\n",
      "============ 264 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.9876 if cp<=0.08978134840726854\n",
      "   -0.9395 if cv<=1.026763415336609\n",
      "   -0.7610 if cp>=0.0815315693616867\n",
      "   -0.0000 if cp>=0.15932092666625977\n",
      "   -1.0433 if cp>=0.13602465391159058\n",
      "--------------\n",
      "   +0.7936 if cp<=0.11326095461845398\n",
      "   +1.1342 if cp<=0.08899649679660798\n",
      "   +0.1177 if cp<=0.04631521627306939 & cp>=0.00978351142257452\n",
      "   +0.4760 if cv>=1.1370278596878052\n",
      "   +0.2131 if cp<=-0.007099099829792976\n",
      "Run episode 264 with rewards 10.0\n",
      "============ 265 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1912 if cp<=0.08978134840726854\n",
      "   -1.1912 if cv<=1.026763415336609\n",
      "   -1.2415 if cp>=0.0815315693616867\n",
      "   +0.1720 if cp>=0.13602465391159058\n",
      "   -0.5311 if cp<=0.08426589369773865 & cp>=0.03993632942438126\n",
      "--------------\n",
      "   +1.2360 if cp<=0.11326095461845398\n",
      "   +0.8413 if cp<=0.08899649679660798\n",
      "   +1.0455 if cv>=1.1370278596878052\n",
      "   -0.0000 if cp<=-0.007099099829792976\n",
      "   -0.0565 if cp>=0.12516801953315734\n",
      "Run episode 265 with rewards 8.0\n",
      "============ 266 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1035 if cp<=0.08978134840726854\n",
      "   -1.1017 if cv<=1.026763415336609\n",
      "   -0.0000 if cp>=0.0815315693616867\n",
      "   -0.0018 if cp<=0.08426589369773865 & cp>=0.03993632942438126\n",
      "   -0.2869 if cp>=0.0012259725015610478\n",
      "--------------\n",
      "   +0.9686 if cp<=0.11326095461845398\n",
      "   +0.9686 if cp<=0.08899649679660798\n",
      "   +0.0041 if cv>=1.1370278596878052\n",
      "   +0.0000 if cp>=0.12516801953315734\n",
      "   +0.3938 if cp<=0.042369706928730023 & cp>=-0.007594978809356689\n",
      "Run episode 266 with rewards 9.0\n",
      "============ 267 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2958 if cp<=0.08978134840726854\n",
      "   -1.2056 if cv<=1.026763415336609\n",
      "   +0.0162 if cp<=0.08426589369773865 & cp>=0.03993632942438126\n",
      "   -0.0902 if cp>=0.0012259725015610478\n",
      "   -0.1664 if cp<=0.02987818270921708 & cp>=-0.0028489029093179737\n",
      "--------------\n",
      "   +1.0926 if cp<=0.11326095461845398\n",
      "   +1.0926 if cp<=0.08899649679660798\n",
      "   +0.0616 if cv>=1.1370278596878052\n",
      "   +0.1323 if cp<=0.042369706928730023 & cp>=-0.007594978809356689\n",
      "   +0.4951 if cp<=0.02987818270921708 & cp>=-0.037788526713848115\n",
      "Run episode 267 with rewards 10.0\n",
      "============ 268 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -1.4202 if cp<=0.08978134840726854\n",
      "   -0.8133 if cv<=1.026763415336609\n",
      "   +0.6088 if cp>=0.0012259725015610478\n",
      "   -0.5810 if cp<=0.02987818270921708 & cp>=-0.0028489029093179737\n",
      "   +2.2967 if cp>=0.13737648725509644\n",
      "--------------\n",
      "   +1.1738 if cp<=0.11326095461845398\n",
      "   +0.8927 if cp<=0.08899649679660798\n",
      "   +0.4710 if cp<=0.042369706928730023 & cp>=-0.007594978809356689\n",
      "   +0.3992 if cp<=0.02987818270921708 & cp>=-0.037788526713848115\n",
      "   -2.1574 if cp>=0.13737648725509644\n",
      "Run episode 268 with rewards 9.0\n",
      "============ 269 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.3561 if cp<=0.08978134840726854\n",
      "   -0.3205 if cv<=1.026763415336609\n",
      "   -2.5576 if cp>=0.0012259725015610478\n",
      "   +0.0000 if cp>=0.13737648725509644\n",
      "   -2.1659 if cp>=0.13123147189617157\n",
      "--------------\n",
      "   +1.2766 if cp<=0.11326095461845398\n",
      "   +1.1569 if cp<=0.08899649679660798\n",
      "   +0.5985 if cp<=0.042369706928730023 & cp>=-0.007594978809356689\n",
      "   +0.0000 if cp>=0.13737648725509644\n",
      "   +1.7929 if cp>=0.09133401811122895\n",
      "Run episode 269 with rewards 8.0\n",
      "============ 270 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8204 if cp<=0.08978134840726854\n",
      "   -0.8152 if cv<=1.026763415336609\n",
      "   -0.1275 if cp>=0.0012259725015610478\n",
      "   -0.0000 if cp>=0.13123147189617157\n",
      "   -0.5729 if cp<=-0.0027062825858592964\n",
      "--------------\n",
      "   +1.5507 if cp<=0.11326095461845398\n",
      "   +1.5507 if cp<=0.08899649679660798\n",
      "   +0.2086 if cp<=0.042369706928730023 & cp>=-0.007594978809356689\n",
      "   -0.0000 if cp>=0.09133401811122895\n",
      "   +0.2090 if cp>=-0.0027062825858592964\n",
      "Run episode 270 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 271 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   -0.8801 if cp<=0.08978134840726854\n",
      "   -0.6716 if cv<=1.026763415336609\n",
      "   +0.2233 if cp>=0.0012259725015610478\n",
      "   -0.5954 if cp<=-0.0027062825858592964\n",
      "   -0.1848 if cp<=0.05039232522249222 & cp>=0.009021226270124322\n",
      "--------------\n",
      "   +0.1292 if cp<=0.11326095461845398\n",
      "   +2.3759 if cp<=0.08899649679660798\n",
      "   +0.5995 if cp<=0.042369706928730023 & cp>=-0.007594978809356689\n",
      "   -0.8836 if cp>=-0.0027062825858592964\n",
      "   -1.8342 if cp>=0.05039232522249222\n",
      "Run episode 271 with rewards 9.0\n",
      "============ 272 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   -0.1379 if cp<=0.08978134840726854\n",
      "   -1.9054 if cv<=1.026763415336609\n",
      "   +0.2487 if cp>=0.0012259725015610478\n",
      "   -0.0000 if cp<=-0.0027062825858592964\n",
      "   -0.7912 if cp<=0.05148428604006768\n",
      "--------------\n",
      "   +0.9842 if cp<=0.08899649679660798\n",
      "   +1.3689 if cp<=0.042369706928730023 & cp>=-0.007594978809356689\n",
      "   +0.3865 if cp>=-0.0027062825858592964\n",
      "   -0.9824 if cp>=0.05039232522249222\n",
      "   -1.7252 if cv>=1.1986680030822754\n",
      "Run episode 272 with rewards 11.0\n",
      "============ 273 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 0, 1, 0]\n",
      "   -0.6207 if cp<=0.08978134840726854\n",
      "   -1.3205 if cv<=1.026763415336609\n",
      "   +0.2846 if cp>=0.0012259725015610478\n",
      "   -1.7646 if cp<=0.05148428604006768\n",
      "   +0.7082 if cv>=1.5390312671661377\n",
      "--------------\n",
      "   +1.2768 if cp<=0.08899649679660798\n",
      "   +0.6519 if cp<=0.042369706928730023 & cp>=-0.007594978809356689\n",
      "   -0.8806 if cp>=0.05039232522249222\n",
      "   -1.2567 if cv>=1.1986680030822754\n",
      "   +1.4850 if cp>=0.007453040685504696 & cv<=1.3432111740112305\n",
      "Run episode 273 with rewards 10.0\n",
      "============ 274 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -0.8973 if cp<=0.08978134840726854\n",
      "   -0.6346 if cv<=1.026763415336609\n",
      "   -0.6346 if cp<=0.05148428604006768\n",
      "   +0.0000 if cv>=1.5390312671661377\n",
      "   -0.6644 if cp>=0.0591226302087307 & cv<=1.2045042276382447\n",
      "--------------\n",
      "   +0.9031 if cp<=0.08899649679660798\n",
      "   +0.3480 if cp>=0.05039232522249222\n",
      "   -0.5174 if cv>=1.1986680030822754\n",
      "   +1.2814 if cp>=0.007453040685504696 & cv<=1.3432111740112305\n",
      "   +1.3505 if cp>=0.1445092260837555\n",
      "Run episode 274 with rewards 9.0\n",
      "============ 275 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.3580 if cp<=0.08978134840726854\n",
      "   -0.3365 if cv<=1.026763415336609\n",
      "   -0.3096 if cp<=0.05148428604006768\n",
      "   -0.0215 if cp>=0.0591226302087307 & cv<=1.2045042276382447\n",
      "   -2.5637 if \n",
      "--------------\n",
      "   +1.2208 if cp<=0.08899649679660798\n",
      "   +2.3760 if cv>=1.1986680030822754\n",
      "   +1.2208 if cp>=0.007453040685504696 & cv<=1.3432111740112305\n",
      "   +0.0000 if cp>=0.1445092260837555\n",
      "   +2.2532 if cp>=0.12859104573726654\n",
      "Run episode 275 with rewards 9.0\n",
      "============ 276 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8955 if cp<=0.08978134840726854\n",
      "   -0.8743 if cv<=1.026763415336609\n",
      "   -0.9047 if cp<=0.05148428604006768\n",
      "   -0.8955 if \n",
      "   -0.0882 if cp>=-0.00942128552123903\n",
      "--------------\n",
      "   +0.8712 if cp<=0.08899649679660798\n",
      "   -0.0250 if cv>=1.1986680030822754\n",
      "   +0.0785 if cp>=0.007453040685504696 & cv<=1.3432111740112305\n",
      "   -0.0000 if cp>=0.12859104573726654\n",
      "   +0.5682 if cp<=-0.03202964812517166\n",
      "Run episode 276 with rewards 8.0\n",
      "============ 277 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -0.8771 if cp<=0.08978134840726854\n",
      "   -0.8893 if cv<=1.026763415336609\n",
      "   -0.8893 if cp<=0.05148428604006768\n",
      "   -0.8771 if \n",
      "   -0.3528 if cp>=-0.0049970271997153756\n",
      "--------------\n",
      "   +0.8631 if cp<=0.08899649679660798\n",
      "   -0.0455 if cv>=1.1986680030822754\n",
      "   +0.2203 if cp>=0.007453040685504696 & cv<=1.3432111740112305\n",
      "   -0.0000 if cp<=-0.03202964812517166\n",
      "   -0.1385 if cp>=0.08041248470544815\n",
      "Run episode 277 with rewards 10.0\n",
      "============ 278 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.4907 if cp<=0.08978134840726854\n",
      "   -0.4820 if cv<=1.026763415336609\n",
      "   -0.4895 if cp<=0.05148428604006768\n",
      "   -3.0062 if \n",
      "   -2.5339 if cp>=-0.012145237997174263\n",
      "--------------\n",
      "   +1.1132 if cp<=0.08899649679660798\n",
      "   +2.5327 if cv>=1.1986680030822754\n",
      "   +0.1834 if cp>=0.007453040685504696 & cv<=1.3432111740112305\n",
      "   +2.5226 if cp>=0.08041248470544815\n",
      "   +0.3690 if cp<=-0.026954494416713715\n",
      "Run episode 278 with rewards 10.0\n",
      "============ 279 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1423 if cp<=0.08978134840726854\n",
      "   -1.1310 if cp<=0.05148428604006768\n",
      "   -1.1384 if \n",
      "   -0.2726 if cp>=-0.012145237997174263\n",
      "   -0.0617 if cp>=0.01745939143002034\n",
      "--------------\n",
      "   +0.4503 if cp<=0.08899649679660798\n",
      "   -0.0014 if cv>=1.1986680030822754\n",
      "   -0.0104 if cp>=0.08041248470544815\n",
      "   +0.2159 if cp<=-0.026954494416713715\n",
      "   +0.4173 if cp<=-0.010064481571316718\n",
      "Run episode 279 with rewards 9.0\n",
      "============ 280 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 0, 1, 0, 0]\n",
      "   -1.3562 if cp<=0.08978134840726854\n",
      "   -1.1198 if cp<=0.05148428604006768\n",
      "   -0.8108 if \n",
      "   -0.8108 if cp>=-0.012145237997174263\n",
      "   +0.4723 if cp>=0.06555343046784402\n",
      "--------------\n",
      "   +1.3128 if cp<=0.08899649679660798\n",
      "   -1.7924 if cp>=0.08041248470544815\n",
      "   +0.0000 if cp<=-0.026954494416713715\n",
      "   +0.0000 if cp<=-0.010064481571316718\n",
      "   -1.0535 if cp>=0.014362649992108347\n",
      "Run episode 280 with rewards 10.0\n",
      "============ 281 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 0, 1, 0, 0, 0]\n",
      "   +0.0600 if cp<=0.08978134840726854\n",
      "   -2.9783 if cp<=0.05148428604006768\n",
      "   +0.0878 if \n",
      "   +0.0878 if cp>=-0.012145237997174263\n",
      "   -1.2281 if cp<=0.08084513992071152 & cp>=0.04063143357634545 & cv<=1.0509212970733643\n",
      "--------------\n",
      "   +0.2991 if cp<=0.08899649679660798\n",
      "   -0.2598 if cp>=0.08041248470544815\n",
      "   +0.0000 if cp<=-0.010064481571316718\n",
      "   -1.1507 if cp>=0.014362649992108347\n",
      "   -2.8165 if cp<=0.08084513992071152 & cv>=1.0509212970733643\n",
      "Run episode 281 with rewards 10.0\n",
      "============ 282 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   -3.5047 if cp<=0.05148428604006768\n",
      "   -0.1839 if \n",
      "   -0.1839 if cp>=-0.012145237997174263\n",
      "   +0.1378 if cp<=0.08084513992071152 & cp>=0.04063143357634545 & cv<=1.0509212970733643\n",
      "   -0.8402 if cp>=0.06424813047051431\n",
      "--------------\n",
      "   +1.3162 if cp<=0.08899649679660798\n",
      "   -1.0004 if cp>=0.08041248470544815\n",
      "   -0.6287 if cp>=0.014362649992108347\n",
      "   -0.0000 if cp<=0.08084513992071152 & cv>=1.0509212970733643\n",
      "   -2.8408 if cp<=0.06424813047051431 & cv>=0.8684391736984254\n",
      "Run episode 282 with rewards 9.0\n",
      "============ 283 ===========\n",
      "12 actions [1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   -2.1585 if cp<=0.05148428604006768\n",
      "   -1.0144 if \n",
      "   -0.2458 if cp>=-0.012145237997174263\n",
      "   +0.7500 if cp>=0.06424813047051431\n",
      "   -1.1426 if cp<=0.04456209614872933 & cp>=0.012826960347592842\n",
      "--------------\n",
      "   +0.4937 if cp<=0.08899649679660798\n",
      "   -0.8553 if cp>=0.08041248470544815\n",
      "   -0.9029 if cp>=0.014362649992108347\n",
      "   -0.0476 if cp<=0.06424813047051431 & cv>=0.8684391736984254\n",
      "   -0.4879 if cv>=1.3593555688858032\n",
      "Run episode 283 with rewards 12.0\n",
      "============ 284 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -1.2873 if cp<=0.05148428604006768\n",
      "   -0.4578 if \n",
      "   +0.8295 if cp>=0.06424813047051431\n",
      "   -0.4406 if cp<=0.04456209614872933 & cp>=0.012826960347592842\n",
      "   -2.8922 if cp<=0.0813737437129021\n",
      "--------------\n",
      "   +2.1226 if cp<=0.08899649679660798\n",
      "   -2.2203 if cp>=0.08041248470544815\n",
      "   -0.4762 if cp>=0.014362649992108347\n",
      "   -0.6330 if cv>=1.3593555688858032\n",
      "   +0.0873 if cp<=0.03820151612162591 & cp>=0.013738771900534632\n",
      "Run episode 284 with rewards 10.0\n",
      "============ 285 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.9043 if cp<=0.05148428604006768\n",
      "   -0.9606 if \n",
      "   +0.0653 if cp>=0.06424813047051431\n",
      "   -1.0259 if cp<=0.0813737437129021\n",
      "   +0.3493 if cv>=1.5191487073898315\n",
      "--------------\n",
      "   +0.0741 if cp<=0.08899649679660798\n",
      "   +0.9253 if cp>=0.08041248470544815\n",
      "   +0.9991 if cp>=0.014362649992108347\n",
      "   -0.7289 if cv>=1.3593555688858032\n",
      "   +0.5202 if cp<=-0.004947845777496695\n",
      "Run episode 285 with rewards 10.0\n",
      "============ 286 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7948 if cp<=0.05148428604006768\n",
      "   -1.6480 if \n",
      "   -1.2888 if cp<=0.0813737437129021\n",
      "   +0.1334 if cv>=1.5191487073898315\n",
      "   +0.1999 if cp>=0.17432862520217896\n",
      "--------------\n",
      "   +0.4143 if cp>=0.08041248470544815\n",
      "   +1.8556 if cp>=0.014362649992108347\n",
      "   +0.0723 if cv>=1.3593555688858032\n",
      "   +0.0000 if cp<=-0.004947845777496695\n",
      "   -0.1637 if cp>=0.17432862520217896\n",
      "Run episode 286 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 287 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.3650 if cp<=0.05148428604006768\n",
      "   -1.3670 if \n",
      "   -1.4217 if cp<=0.0813737437129021\n",
      "   +0.0000 if cp>=0.17432862520217896\n",
      "   -0.0511 if cp>=0.00569068053737283\n",
      "--------------\n",
      "   -2.2914 if cp>=0.08041248470544815\n",
      "   -0.8111 if cp>=0.014362649992108347\n",
      "   -1.8602 if cv>=1.3593555688858032\n",
      "   -0.0000 if cp>=0.17432862520217896\n",
      "   +0.4584 if \n",
      "Run episode 287 with rewards 9.0\n",
      "============ 288 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 0, 0, 1]\n",
      "   -2.8041 if cp<=0.05148428604006768\n",
      "   -0.5122 if \n",
      "   -0.5122 if cp<=0.0813737437129021\n",
      "   +0.8133 if cp>=0.00569068053737283\n",
      "   +1.4091 if cp>=0.03517530448734761\n",
      "--------------\n",
      "   -0.0000 if cp>=0.08041248470544815\n",
      "   -0.0258 if cp>=0.014362649992108347\n",
      "   -0.0678 if cv>=1.3593555688858032\n",
      "   +0.6087 if \n",
      "   +0.4586 if cp<=-0.019401456415653228\n",
      "Run episode 288 with rewards 9.0\n",
      "============ 289 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   -1.3116 if cp<=0.05148428604006768\n",
      "   +0.1056 if \n",
      "   +0.1056 if cp>=0.00569068053737283\n",
      "   +0.6600 if cp>=0.03517530448734761\n",
      "   -2.7956 if cv<=1.023813819885254\n",
      "--------------\n",
      "   +0.2711 if cp>=0.014362649992108347\n",
      "   -0.0000 if cv>=1.3593555688858032\n",
      "   +0.2711 if \n",
      "   -0.0000 if cp<=-0.019401456415653228\n",
      "   +2.7151 if cp<=0.1040944203734398 & cv<=1.023813819885254\n",
      "Run episode 289 with rewards 10.0\n",
      "============ 290 ===========\n",
      "11 actions [1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1]\n",
      "   -0.6192 if cp<=0.05148428604006768\n",
      "   -0.9623 if cp>=0.00569068053737283\n",
      "   -0.3780 if cp>=0.03517530448734761\n",
      "   -0.6192 if cv<=1.023813819885254\n",
      "   +1.3768 if cp>=0.09201084673404694\n",
      "--------------\n",
      "   +1.0148 if cp>=0.014362649992108347\n",
      "   +1.3100 if \n",
      "   -0.0000 if cp<=-0.019401456415653228\n",
      "   +0.3743 if cp<=0.1040944203734398 & cv<=1.023813819885254\n",
      "   -1.5307 if cp>=0.09201084673404694\n",
      "Run episode 290 with rewards 11.0\n",
      "============ 291 ===========\n",
      "21 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.8441 if cp<=0.05148428604006768\n",
      "   -1.7222 if cp>=0.00569068053737283\n",
      "   +0.7740 if cv<=1.023813819885254\n",
      "   -0.0000 if cp>=0.09201084673404694\n",
      "   -3.1800 if cv<=0.1519053429365158\n",
      "--------------\n",
      "   +0.8097 if cp>=0.014362649992108347\n",
      "   -0.6496 if \n",
      "   -0.4573 if cp<=0.1040944203734398 & cv<=1.023813819885254\n",
      "   -0.0000 if cp>=0.09201084673404694\n",
      "   +3.1308 if cv<=0.1519053429365158\n",
      "Run episode 291 with rewards 21.0\n",
      "============ 292 ===========\n",
      "60 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +1.3678 if cp<=0.05148428604006768\n",
      "   -0.0000 if cp>=0.00569068053737283\n",
      "   +1.3678 if cv<=1.023813819885254\n",
      "   -4.9855 if cv<=0.1519053429365158\n",
      "   +0.1045 if cp>=-0.018449028953909874\n",
      "--------------\n",
      "   -0.0000 if cp>=0.014362649992108347\n",
      "   -1.1359 if \n",
      "   -1.1359 if cp<=0.1040944203734398 & cv<=1.023813819885254\n",
      "   +4.9762 if cv<=0.1519053429365158\n",
      "   -0.0820 if cp>=-0.018449028953909874\n",
      "Run episode 292 with rewards 60.0\n",
      "============ 293 ===========\n",
      "38 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -0.1344 if cp<=0.05148428604006768\n",
      "   +1.5991 if cv<=1.023813819885254\n",
      "   -6.8137 if cv<=0.1519053429365158\n",
      "   +1.5991 if cp>=-0.018449028953909874\n",
      "   +0.5265 if cp<=0.13107053935527802\n",
      "--------------\n",
      "   -1.6913 if \n",
      "   -0.6072 if cp<=0.1040944203734398 & cv<=1.023813819885254\n",
      "   +6.7329 if cv<=0.1519053429365158\n",
      "   -1.6913 if cp>=-0.018449028953909874\n",
      "   -1.0795 if cv>=0.19578039050102233\n",
      "Run episode 293 with rewards 38.0\n",
      "============ 294 ===========\n",
      "62 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.1688 if cv<=1.023813819885254\n",
      "   -3.4712 if cv<=0.1519053429365158\n",
      "   +0.1688 if cp>=-0.018449028953909874\n",
      "   +0.1688 if cp<=0.13107053935527802\n",
      "   +0.4864 if cv>=0.24919366240501403\n",
      "--------------\n",
      "   +0.1111 if \n",
      "   +2.6308 if cv<=0.1519053429365158\n",
      "   +0.1111 if cp>=-0.018449028953909874\n",
      "   -2.5196 if cv>=0.19578039050102233\n",
      "   -0.3137 if cv>=0.24919366240501403\n",
      "Run episode 294 with rewards 62.0\n",
      "============ 295 ===========\n",
      "96 actions [1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1]\n",
      "   +1.8274 if cv<=1.023813819885254\n",
      "   -4.5182 if cv<=0.1519053429365158\n",
      "   -6.4850 if cp>=-0.018449028953909874\n",
      "   +2.3605 if cv>=0.24919366240501403\n",
      "   +4.4760 if pa<=0.01773676276206971\n",
      "--------------\n",
      "   -0.3894 if \n",
      "   +3.7664 if cv<=0.1519053429365158\n",
      "   -4.1558 if cv>=0.19578039050102233\n",
      "   -2.7309 if cv>=0.24919366240501403\n",
      "   +3.6259 if cp>=-0.015706661529839037 & pav<=-0.17972677946090698\n",
      "Run episode 295 with rewards 96.0\n",
      "============ 296 ===========\n",
      "29 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -4.7874 if cv<=0.1519053429365158\n",
      "   -4.1955 if cp>=-0.018449028953909874\n",
      "   +4.9321 if cv>=0.24919366240501403\n",
      "   +5.5471 if pa<=0.01773676276206971\n",
      "   -3.3824 if cv>=0.03317546844482422 & pav>=-0.09780763089656824\n",
      "--------------\n",
      "   +2.6902 if cv<=0.1519053429365158\n",
      "   -6.0191 if cv>=0.19578039050102233\n",
      "   -4.6732 if cv>=0.24919366240501403\n",
      "   +3.9410 if cp>=-0.015706661529839037 & pav<=-0.17972677946090698\n",
      "   +3.9504 if cv>=0.03317546844482422 & pa>=0.005767002236098054 & pav>=-0.09780763089656824\n",
      "Run episode 296 with rewards 29.0\n",
      "============ 297 ===========\n",
      "23 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -3.7871 if cv<=0.1519053429365158\n",
      "   +1.3355 if cp>=-0.018449028953909874\n",
      "   -0.0000 if cv>=0.24919366240501403\n",
      "   +1.3355 if pa<=0.01773676276206971\n",
      "   -1.6886 if cv<=0.0051872795447707185\n",
      "--------------\n",
      "   -4.0620 if cv>=0.19578039050102233\n",
      "   +0.0000 if cv>=0.24919366240501403\n",
      "   -1.2679 if cp>=-0.015706661529839037 & pav<=-0.17972677946090698\n",
      "   +0.0000 if cv>=0.03317546844482422 & pa>=0.005767002236098054 & pav>=-0.09780763089656824\n",
      "   +1.6986 if \n",
      "Run episode 297 with rewards 23.0\n",
      "============ 298 ===========\n",
      "28 actions [1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -6.3233 if cv<=0.1519053429365158\n",
      "   +1.4462 if cp>=-0.018449028953909874\n",
      "   +1.4462 if pa<=0.01773676276206971\n",
      "   -0.9471 if cv<=0.0051872795447707185\n",
      "   +1.0051 if cv>=0.15732401311397554 & pav<=-0.5833407998085022\n",
      "--------------\n",
      "   -1.1098 if cv>=0.19578039050102233\n",
      "   -1.1098 if cv>=0.24919366240501403\n",
      "   -0.3092 if cp>=-0.015706661529839037 & pav<=-0.17972677946090698\n",
      "   -0.1905 if \n",
      "   +3.7104 if pav>=-0.4054083943367004\n",
      "Run episode 298 with rewards 28.0\n",
      "============ 299 ===========\n",
      "27 actions [1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -5.4543 if cv<=0.1519053429365158\n",
      "   +1.5435 if cp>=-0.018449028953909874\n",
      "   +1.5435 if pa<=0.01773676276206971\n",
      "   +0.4879 if cv>=0.15732401311397554 & pav<=-0.5833407998085022\n",
      "   +3.0743 if cp<=0.03545091077685356 & pav<=-0.3348627388477325 & pav>=-0.4250331342220306\n",
      "--------------\n",
      "   -2.9283 if cv>=0.19578039050102233\n",
      "   -0.0791 if cv>=0.24919366240501403\n",
      "   +0.0736 if cp>=-0.015706661529839037 & pav<=-0.17972677946090698\n",
      "   +1.3743 if pav>=-0.4054083943367004\n",
      "   +1.4750 if cv>=0.021045234426856043 & pav>=-0.3348627388477325\n",
      "Run episode 299 with rewards 27.0\n",
      "============ 300 ===========\n",
      "29 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -4.9827 if cv<=0.1519053429365158\n",
      "   +0.9638 if cp>=-0.018449028953909874\n",
      "   +0.9638 if pa<=0.01773676276206971\n",
      "   -0.0000 if cp<=0.03545091077685356 & pav<=-0.3348627388477325 & pav>=-0.4250331342220306\n",
      "   +3.2228 if cv>=0.08067982178181415 & pav<=-0.33907229900360103\n",
      "--------------\n",
      "   -1.0617 if cv>=0.19578039050102233\n",
      "   -0.7891 if cv>=0.24919366240501403\n",
      "   +1.1171 if pav>=-0.4054083943367004\n",
      "   +2.5491 if cv>=0.021045234426856043 & pav>=-0.3348627388477325\n",
      "   +2.5119 if cp<=0.04202333763241768 & cp>=0.016937226802110673 & pav>=-0.33907229900360103\n",
      "Run episode 300 with rewards 29.0\n",
      "============ 301 ===========\n",
      "22 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -2.1792 if cv<=0.1519053429365158\n",
      "   -1.2980 if cp>=-0.018449028953909874\n",
      "   -0.0906 if pa<=0.01773676276206971\n",
      "   +4.2716 if cv>=0.08067982178181415 & pav<=-0.33907229900360103\n",
      "   +1.3428 if cv>=0.20293758809566498\n",
      "--------------\n",
      "   -1.2070 if cv>=0.19578039050102233\n",
      "   +2.9125 if pav>=-0.4054083943367004\n",
      "   +3.8667 if cv>=0.021045234426856043 & pav>=-0.3348627388477325\n",
      "   +0.0000 if cp<=0.04202333763241768 & cp>=0.016937226802110673 & pav>=-0.33907229900360103\n",
      "   +0.3025 if cv<=0.020081946626305584\n",
      "Run episode 301 with rewards 22.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 302 ===========\n",
      "23 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -1.6361 if cv<=0.1519053429365158\n",
      "   -0.6342 if cp>=-0.018449028953909874\n",
      "   +1.1013 if cv>=0.08067982178181415 & pav<=-0.33907229900360103\n",
      "   +0.3031 if cv>=0.20293758809566498\n",
      "   +4.5797 if cv>=0.18689856827259063 & pav<=-0.35845692157745357\n",
      "--------------\n",
      "   -1.3901 if cv>=0.19578039050102233\n",
      "   +0.8288 if pav>=-0.4054083943367004\n",
      "   +0.1970 if cv>=0.021045234426856043 & pav>=-0.3348627388477325\n",
      "   +0.9428 if cv<=0.020081946626305584\n",
      "   +4.3148 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "Run episode 302 with rewards 23.0\n",
      "============ 303 ===========\n",
      "30 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0]\n",
      "   -1.5216 if cv<=0.1519053429365158\n",
      "   -0.3079 if cp>=-0.018449028953909874\n",
      "   +2.3785 if cv>=0.08067982178181415 & pav<=-0.33907229900360103\n",
      "   +2.3785 if cv>=0.18689856827259063 & pav<=-0.35845692157745357\n",
      "   -0.7665 if cv>=0.04636150747537613\n",
      "--------------\n",
      "   +0.0252 if cv>=0.19578039050102233\n",
      "   +1.6504 if pav>=-0.4054083943367004\n",
      "   -0.0000 if cv<=0.020081946626305584\n",
      "   +2.6548 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "   +1.0656 if cv<=0.2246885895729065 & cv>=0.04636150747537613 & pav>=-0.5229982733726501\n",
      "Run episode 303 with rewards 30.0\n",
      "============ 304 ===========\n",
      "20 actions [1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0]\n",
      "   -0.8574 if cv<=0.1519053429365158\n",
      "   +1.9868 if cv>=0.08067982178181415 & pav<=-0.33907229900360103\n",
      "   +3.3985 if cv>=0.18689856827259063 & pav<=-0.35845692157745357\n",
      "   -0.9007 if cv>=0.04636150747537613\n",
      "   -4.9173 if cp>=0.1711114585399628 & cv<=0.24946441650390627 & pav<=-0.5864616274833679\n",
      "--------------\n",
      "   -0.6949 if cv>=0.19578039050102233\n",
      "   +1.6347 if pav>=-0.4054083943367004\n",
      "   +3.5452 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "   +0.2000 if cv<=0.2246885895729065 & cv>=0.04636150747537613 & pav>=-0.5229982733726501\n",
      "   +4.8559 if cv<=0.24946441650390627 & pav<=-0.5864616274833679\n",
      "Run episode 304 with rewards 20.0\n",
      "============ 305 ===========\n",
      "28 actions [1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0]\n",
      "   +1.1106 if cv>=0.08067982178181415 & pav<=-0.33907229900360103\n",
      "   +1.9998 if cv>=0.18689856827259063 & pav<=-0.35845692157745357\n",
      "   +0.3991 if cv>=0.04636150747537613\n",
      "   -0.0000 if cp>=0.1711114585399628 & cv<=0.24946441650390627 & pav<=-0.5864616274833679\n",
      "   +1.6231 if cp>=-0.010680424235761165 & cv<=0.00487673836760223\n",
      "--------------\n",
      "   +0.6912 if cv>=0.19578039050102233\n",
      "   +2.0559 if pav>=-0.4054083943367004\n",
      "   +2.2763 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "   +4.9550 if cv<=0.24946441650390627 & pav<=-0.5864616274833679\n",
      "   -2.8299 if cp>=-0.010680424235761165 & cv<=0.00487673836760223\n",
      "Run episode 305 with rewards 28.0\n",
      "============ 306 ===========\n",
      "26 actions [1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0]\n",
      "   +2.1958 if cv>=0.08067982178181415 & pav<=-0.33907229900360103\n",
      "   +2.1959 if cv>=0.18689856827259063 & pav<=-0.35845692157745357\n",
      "   +1.1843 if cv>=0.04636150747537613\n",
      "   +0.0601 if cp>=-0.010680424235761165 & cv<=0.00487673836760223\n",
      "   +6.2545 if pa>=0.012658704072237015\n",
      "--------------\n",
      "   +0.8797 if pav>=-0.4054083943367004\n",
      "   +3.4665 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "   +3.4728 if cv<=0.24946441650390627 & pav<=-0.5864616274833679\n",
      "   -0.0611 if cp>=-0.010680424235761165 & cv<=0.00487673836760223\n",
      "   -6.3467 if pa>=0.012658704072237015\n",
      "Run episode 306 with rewards 26.0\n",
      "============ 307 ===========\n",
      "47 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1]\n",
      "   +4.0215 if cv>=0.08067982178181415 & pav<=-0.33907229900360103\n",
      "   +1.8482 if cv>=0.18689856827259063 & pav<=-0.35845692157745357\n",
      "   +0.3753 if cv>=0.04636150747537613\n",
      "   -0.0000 if pa>=0.012658704072237015\n",
      "   +3.3695 if cp>=0.05849012732505798\n",
      "--------------\n",
      "   -0.2517 if pav>=-0.4054083943367004\n",
      "   +5.0699 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "   +0.7384 if cv<=0.24946441650390627 & pav<=-0.5864616274833679\n",
      "   +0.0000 if pa>=0.012658704072237015\n",
      "   +4.2740 if pav>=-0.1207556426525116\n",
      "Run episode 307 with rewards 47.0\n",
      "============ 308 ===========\n",
      "45 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1]\n",
      "   +2.6123 if cv>=0.08067982178181415 & pav<=-0.33907229900360103\n",
      "   +2.1897 if cv>=0.18689856827259063 & pav<=-0.35845692157745357\n",
      "   -0.7039 if cv>=0.04636150747537613\n",
      "   +3.9147 if cp>=0.05849012732505798\n",
      "   -2.5375 if cp>=0.06770181655883789 & pa>=-0.10972143560647965 & pav>=-0.21598087251186365\n",
      "--------------\n",
      "   -0.1921 if pav>=-0.4054083943367004\n",
      "   +5.5263 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "   +1.8947 if cv<=0.24946441650390627 & pav<=-0.5864616274833679\n",
      "   +5.9216 if pav>=-0.1207556426525116\n",
      "   -5.4403 if cp>=0.1187881499528885 & pa<=-0.11743783950805664\n",
      "Run episode 308 with rewards 45.0\n",
      "============ 309 ===========\n",
      "41 actions [1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0]\n",
      "   +1.7923 if cv>=0.08067982178181415 & pav<=-0.33907229900360103\n",
      "   +1.7923 if cv>=0.18689856827259063 & pav<=-0.35845692157745357\n",
      "   +3.2647 if cp>=0.05849012732505798\n",
      "   -1.9967 if cp>=0.06770181655883789 & pa>=-0.10972143560647965 & pav>=-0.21598087251186365\n",
      "   +2.0516 if pav<=-0.36785814762115476\n",
      "--------------\n",
      "   +7.1799 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "   +0.1026 if cv<=0.24946441650390627 & pav<=-0.5864616274833679\n",
      "   +5.9538 if pav>=-0.1207556426525116\n",
      "   -6.2564 if cp>=0.1187881499528885 & pa<=-0.11743783950805664\n",
      "   -4.5412 if cp<=0.11515994966030121 & cp>=0.07602255791425708 & pa<=-0.12145113945007324\n",
      "Run episode 309 with rewards 41.0\n",
      "============ 310 ===========\n",
      "32 actions [1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0]\n",
      "   +1.0745 if cv>=0.18689856827259063 & pav<=-0.35845692157745357\n",
      "   +2.7474 if cp>=0.05849012732505798\n",
      "   +0.0103 if cp>=0.06770181655883789 & pa>=-0.10972143560647965 & pav>=-0.21598087251186365\n",
      "   +3.5515 if pav<=-0.36785814762115476\n",
      "   +3.1100 if cp>=0.05014294013381005 & cv>=-0.40063217282295227 & pa<=-0.08500519394874573 & pav<=-0.18836319446563704\n",
      "--------------\n",
      "   +7.6244 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "   +6.6559 if pav>=-0.1207556426525116\n",
      "   +0.0000 if cp>=0.1187881499528885 & pa<=-0.11743783950805664\n",
      "   +0.0000 if cp<=0.11515994966030121 & cp>=0.07602255791425708 & pa<=-0.12145113945007324\n",
      "   -1.6487 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "Run episode 310 with rewards 32.0\n",
      "============ 311 ===========\n",
      "33 actions [1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0]\n",
      "   +1.9426 if cv>=0.18689856827259063 & pav<=-0.35845692157745357\n",
      "   -0.0000 if cp>=0.05849012732505798\n",
      "   +3.0391 if pav<=-0.36785814762115476\n",
      "   -0.0000 if cp>=0.05014294013381005 & cv>=-0.40063217282295227 & pa<=-0.08500519394874573 & pav<=-0.18836319446563704\n",
      "   -3.0611 if cp>=0.01671094335615635 & cv<=0.008783733844757084 & pa>=-0.1186882436275482\n",
      "--------------\n",
      "   +5.9433 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "   +4.2991 if pav>=-0.1207556426525116\n",
      "   +0.0000 if cp>=0.1187881499528885 & pa<=-0.11743783950805664\n",
      "   -2.9042 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   +3.3371 if cp<=0.026951853558421137 & cp>=-0.011111549660563469 & cv<=0.008783733844757084 & pa<=-0.07782108932733535 & pav<=-0.1129704773426056 & pav>=-0.23996430039405817\n",
      "Run episode 311 with rewards 33.0\n",
      "============ 312 ===========\n",
      "33 actions [1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0]\n",
      "   -1.4253 if cv>=0.18689856827259063 & pav<=-0.35845692157745357\n",
      "   +2.8049 if pav<=-0.36785814762115476\n",
      "   -1.8229 if cp>=0.05014294013381005 & cv>=-0.40063217282295227 & pa<=-0.08500519394874573 & pav<=-0.18836319446563704\n",
      "   -2.2125 if cp>=0.01671094335615635 & cv<=0.008783733844757084 & pa>=-0.1186882436275482\n",
      "   +3.7441 if cp>=0.07280243188142776\n",
      "--------------\n",
      "   +5.1251 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "   +4.1020 if pav>=-0.1207556426525116\n",
      "   -2.2608 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   +0.9651 if cp<=0.026951853558421137 & cp>=-0.011111549660563469 & cv<=0.008783733844757084 & pa<=-0.07782108932733535 & pav<=-0.1129704773426056 & pav>=-0.23996430039405817\n",
      "   +4.2592 if cp>=0.016548550315201284 & pa>=-0.05183913037180899 & pav<=-0.2660750448703766\n",
      "Run episode 312 with rewards 33.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 313 ===========\n",
      "38 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0]\n",
      "   +4.4023 if pav<=-0.36785814762115476\n",
      "   +0.0000 if cp>=0.05014294013381005 & cv>=-0.40063217282295227 & pa<=-0.08500519394874573 & pav<=-0.18836319446563704\n",
      "   +0.0000 if cp>=0.01671094335615635 & cv<=0.008783733844757084 & pa>=-0.1186882436275482\n",
      "   +0.0000 if cp>=0.07280243188142776\n",
      "   -2.0906 if cp>=0.01688995584845543\n",
      "--------------\n",
      "   +7.9124 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "   +4.3587 if pav>=-0.1207556426525116\n",
      "   -2.4012 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   -0.0000 if cp>=0.016548550315201284 & pa>=-0.05183913037180899 & pav<=-0.2660750448703766\n",
      "   -2.6489 if pa>=-0.0943380519747734 & pav<=-0.11136764138936994\n",
      "Run episode 313 with rewards 38.0\n",
      "============ 314 ===========\n",
      "59 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1]\n",
      "   +3.9162 if pav<=-0.36785814762115476\n",
      "   +0.0000 if cp>=0.01671094335615635 & cv<=0.008783733844757084 & pa>=-0.1186882436275482\n",
      "   -0.7632 if cp>=0.07280243188142776\n",
      "   -0.6920 if cp>=0.01688995584845543\n",
      "   +3.6793 if cp>=0.13275983929634094\n",
      "--------------\n",
      "   +5.3660 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "   +1.7098 if pav>=-0.1207556426525116\n",
      "   -2.6340 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   -2.5780 if pa>=-0.0943380519747734 & pav<=-0.11136764138936994\n",
      "   -4.1738 if cp>=0.13275983929634094\n",
      "Run episode 314 with rewards 59.0\n",
      "============ 315 ===========\n",
      "58 actions [1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0]\n",
      "   +3.8466 if pav<=-0.36785814762115476\n",
      "   -1.0583 if cp>=0.07280243188142776\n",
      "   +1.6683 if cp>=0.01688995584845543\n",
      "   -0.0000 if cp>=0.13275983929634094\n",
      "   -4.3676 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "--------------\n",
      "   +2.0692 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "   -5.4858 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   -1.8628 if pa>=-0.0943380519747734 & pav<=-0.11136764138936994\n",
      "   +0.0000 if cp>=0.13275983929634094\n",
      "   +4.6659 if cp>=-0.010085745528340297 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "Run episode 315 with rewards 58.0\n",
      "============ 316 ===========\n",
      "105 actions [1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +5.0039 if pav<=-0.36785814762115476\n",
      "   +0.0000 if cp>=0.07280243188142776\n",
      "   +1.0347 if cp>=0.01688995584845543\n",
      "   -3.4478 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +3.8177 if cp<=-0.050125050544738765 & pa<=-0.15760475695133208 & pav>=0.027507158741355058\n",
      "--------------\n",
      "   +3.1045 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "   -6.5939 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   -2.9668 if pa>=-0.0943380519747734 & pav<=-0.11136764138936994\n",
      "   +4.4582 if cp>=-0.010085745528340297 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   -3.8177 if cp<=-0.050125050544738765 & pa<=-0.15760475695133208 & pav>=0.027507158741355058\n",
      "Run episode 316 with rewards 105.0\n",
      "best\n",
      "============ 317 ===========\n",
      "53 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0]\n",
      "   +4.9671 if pav<=-0.36785814762115476\n",
      "   +1.0380 if cp>=0.01688995584845543\n",
      "   -4.4418 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +1.8417 if cp<=-0.050125050544738765 & pa<=-0.15760475695133208 & pav>=0.027507158741355058\n",
      "   -4.6245 if cp>=0.14984695613384247\n",
      "--------------\n",
      "   +0.2638 if cv>=0.007691760547459126 & pav>=-0.35845692157745357\n",
      "   -4.4207 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   +3.0619 if cp>=-0.010085745528340297 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   -1.8417 if cp<=-0.050125050544738765 & pa<=-0.15760475695133208 & pav>=0.027507158741355058\n",
      "   +4.6216 if cp>=0.14984695613384247\n",
      "Run episode 317 with rewards 53.0\n",
      "============ 318 ===========\n",
      "153 actions [1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0]\n",
      "   +4.9306 if pav<=-0.36785814762115476\n",
      "   -4.8026 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   -0.0000 if cp<=-0.050125050544738765 & pa<=-0.15760475695133208 & pav>=0.027507158741355058\n",
      "   -0.0000 if cp>=0.14984695613384247\n",
      "   +4.2783 if cv>=-0.5460035800933838 & pa<=-0.14712669849395751 & pav>=-0.16282519698143003\n",
      "--------------\n",
      "   -6.1651 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   +5.3862 if cp>=-0.010085745528340297 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   -0.0000 if cp<=-0.050125050544738765 & pa<=-0.15760475695133208 & pav>=0.027507158741355058\n",
      "   -0.0000 if cp>=0.14984695613384247\n",
      "   -3.6787 if cv>=-0.5460035800933838 & pa<=-0.14712669849395751 & pav>=-0.16282519698143003\n",
      "Run episode 318 with rewards 153.0\n",
      "best\n",
      "============ 319 ===========\n",
      "92 actions [1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0]\n",
      "   +7.8193 if pav<=-0.36785814762115476\n",
      "   -4.9610 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +0.0000 if cp>=0.14984695613384247\n",
      "   +1.4410 if cv>=-0.5460035800933838 & pa<=-0.14712669849395751 & pav>=-0.16282519698143003\n",
      "   -0.8944 if cp<=-0.14827337265014628 & cp>=-1.543892741203308 & pa>=-0.04421053752303123 & pav>=-0.34174778461456295\n",
      "--------------\n",
      "   -5.6996 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   +4.0437 if cp>=-0.010085745528340297 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +0.0000 if cp>=0.14984695613384247\n",
      "   -1.1065 if cv>=-0.5460035800933838 & pa<=-0.14712669849395751 & pav>=-0.16282519698143003\n",
      "   +0.8944 if cp<=-0.14827337265014628 & cp>=-1.543892741203308 & pa>=-0.04421053752303123 & pav>=-0.34174778461456295\n",
      "Run episode 319 with rewards 92.0\n",
      "============ 320 ===========\n",
      "81 actions [1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0]\n",
      "   +4.7007 if pav<=-0.36785814762115476\n",
      "   -4.8996 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +3.4255 if cv>=-0.5460035800933838 & pa<=-0.14712669849395751 & pav>=-0.16282519698143003\n",
      "   -0.8054 if cp<=-0.14827337265014628 & cp>=-1.543892741203308 & pa>=-0.04421053752303123 & pav>=-0.34174778461456295\n",
      "   +1.3712 if cp<=-0.002269201446324597 & cp>=-0.09520515352487546 & pav>=-0.4522567927837372\n",
      "--------------\n",
      "   -8.6224 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   +8.3560 if cp>=-0.010085745528340297 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   -2.1783 if cv>=-0.5460035800933838 & pa<=-0.14712669849395751 & pav>=-0.16282519698143003\n",
      "   +0.8054 if cp<=-0.14827337265014628 & cp>=-1.543892741203308 & pa>=-0.04421053752303123 & pav>=-0.34174778461456295\n",
      "   -1.3694 if cp>=-0.09520515352487546 & pav>=-0.4522567927837372\n",
      "Run episode 320 with rewards 81.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 321 ===========\n",
      "34 actions [1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0]\n",
      "   +7.3512 if pav<=-0.36785814762115476\n",
      "   -8.1931 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +1.9202 if cv>=-0.5460035800933838 & pa<=-0.14712669849395751 & pav>=-0.16282519698143003\n",
      "   +3.6165 if cp<=-0.002269201446324597 & cp>=-0.09520515352487546 & pav>=-0.4522567927837372\n",
      "   -1.3298 if cv<=-0.5648040175437927\n",
      "--------------\n",
      "   -1.5163 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   +2.1389 if cp>=-0.010085745528340297 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   -1.5335 if cv>=-0.5460035800933838 & pa<=-0.14712669849395751 & pav>=-0.16282519698143003\n",
      "   -0.7346 if cp>=-0.09520515352487546 & pav>=-0.4522567927837372\n",
      "   +4.1468 if cv<=-0.5648040175437927 & pa>=0.06829707324504852\n",
      "Run episode 321 with rewards 34.0\n",
      "============ 322 ===========\n",
      "43 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0]\n",
      "   +4.6545 if pav<=-0.36785814762115476\n",
      "   -3.6789 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   -0.0000 if cv>=-0.5460035800933838 & pa<=-0.14712669849395751 & pav>=-0.16282519698143003\n",
      "   -0.0000 if cp<=-0.002269201446324597 & cp>=-0.09520515352487546 & pav>=-0.4522567927837372\n",
      "   +4.3827 if pa>=0.0244790967553854\n",
      "--------------\n",
      "   -3.7001 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   +2.8314 if cp>=-0.010085745528340297 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +0.0000 if cv>=-0.5460035800933838 & pa<=-0.14712669849395751 & pav>=-0.16282519698143003\n",
      "   +0.0000 if cv<=-0.5648040175437927 & pa>=0.06829707324504852\n",
      "   -5.5584 if pa>=0.0244790967553854\n",
      "Run episode 322 with rewards 43.0\n",
      "============ 323 ===========\n",
      "52 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0]\n",
      "   +5.7616 if pav<=-0.36785814762115476\n",
      "   -3.8287 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   -1.9674 if cp<=-0.002269201446324597 & cp>=-0.09520515352487546 & pav>=-0.4522567927837372\n",
      "   +0.0000 if pa>=0.0244790967553854\n",
      "   +2.1013 if cp>=0.05010749995708466 & cv<=-0.3382517576217651 & pa<=-0.14806674420833588 & pa>=-0.16267224848270417 & pav>=-0.27804165482521037\n",
      "--------------\n",
      "   -4.3546 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   +4.4743 if cp>=-0.010085745528340297 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +0.0000 if cv<=-0.5648040175437927 & pa>=0.06829707324504852\n",
      "   +0.0000 if pa>=0.0244790967553854\n",
      "   -3.3837 if cp>=0.05010749995708466 & cv<=-0.3382517576217651 & cv>=-0.5427643299102783\n",
      "Run episode 323 with rewards 52.0\n",
      "============ 324 ===========\n",
      "25 actions [1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0]\n",
      "   +6.2188 if pav<=-0.36785814762115476\n",
      "   -3.0735 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   -0.0351 if cp<=-0.002269201446324597 & cp>=-0.09520515352487546 & pav>=-0.4522567927837372\n",
      "   -0.0000 if cp>=0.05010749995708466 & cv<=-0.3382517576217651 & pa<=-0.14806674420833588 & pa>=-0.16267224848270417 & pav>=-0.27804165482521037\n",
      "   -3.2793 if cp>=0.0828644409775734\n",
      "--------------\n",
      "   -3.0920 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   +2.3865 if cp>=-0.010085745528340297 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   -0.3401 if pa>=0.0244790967553854\n",
      "   -3.7394 if cp>=0.05010749995708466 & cv<=-0.3382517576217651 & cv>=-0.5427643299102783\n",
      "   +3.2793 if cp>=0.0828644409775734\n",
      "Run episode 324 with rewards 25.0\n",
      "============ 325 ===========\n",
      "51 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0]\n",
      "   +4.2124 if pav<=-0.36785814762115476\n",
      "   -2.2208 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   -0.0000 if cp<=-0.002269201446324597 & cp>=-0.09520515352487546 & pav>=-0.4522567927837372\n",
      "   -1.7050 if cp>=0.0828644409775734\n",
      "   +5.3675 if cp<=0.05881190598011017 & cv>=0.2146193116903305\n",
      "--------------\n",
      "   -3.9264 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   +2.5870 if cp>=-0.010085745528340297 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +0.0000 if cp>=0.05010749995708466 & cv<=-0.3382517576217651 & cv>=-0.5427643299102783\n",
      "   +3.7432 if cp>=0.0828644409775734\n",
      "   -5.6738 if cp<=0.05881190598011017 & cv>=0.2146193116903305\n",
      "Run episode 325 with rewards 51.0\n",
      "============ 326 ===========\n",
      "15 actions [0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1]\n",
      "   +5.9428 if pav<=-0.36785814762115476\n",
      "   -0.4003 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   -0.0000 if cp>=0.0828644409775734\n",
      "   +1.8302 if cp<=0.05881190598011017 & cv>=0.2146193116903305\n",
      "   -3.9095 if cv<=0.049300000071525574 & pa>=-0.12229782342910765 & pav<=-0.27689608931541443\n",
      "--------------\n",
      "   -7.7307 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   +2.8886 if cp>=-0.010085745528340297 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   -0.0000 if cp>=0.0828644409775734\n",
      "   -2.2442 if cp<=0.05881190598011017 & cv>=0.2146193116903305\n",
      "   +4.9547 if cp>=-0.007593466900289059 & pa<=-0.07239581644535065 & pav<=-0.27689608931541443\n",
      "Run episode 326 with rewards 15.0\n",
      "============ 327 ===========\n",
      "16 actions [0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1]\n",
      "   +0.0000 if pav<=-0.36785814762115476\n",
      "   +0.7325 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +0.0000 if cp<=0.05881190598011017 & cv>=0.2146193116903305\n",
      "   +0.0000 if cv<=0.049300000071525574 & pa>=-0.12229782342910765 & pav<=-0.27689608931541443\n",
      "   +3.3308 if cv>=-0.19738071262836457\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   -0.0000 if cp>=-0.010085745528340297 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   -0.0000 if cp<=0.05881190598011017 & cv>=0.2146193116903305\n",
      "   -0.0000 if cp>=-0.007593466900289059 & pa<=-0.07239581644535065 & pav<=-0.27689608931541443\n",
      "   -3.6219 if cv>=-0.19738071262836457\n",
      "Run episode 327 with rewards 16.0\n",
      "============ 328 ===========\n",
      "18 actions [0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0]\n",
      "   +0.0000 if pav<=-0.36785814762115476\n",
      "   +0.6397 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +0.0000 if cv<=0.049300000071525574 & pa>=-0.12229782342910765 & pav<=-0.27689608931541443\n",
      "   +0.6397 if cv>=-0.19738071262836457\n",
      "   -1.1500 if cp>=-0.045515719801187515 & pav>=0.6889917254447938\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   +0.0000 if cp<=0.05881190598011017 & cv>=0.2146193116903305\n",
      "   +0.0000 if cp>=-0.007593466900289059 & pa<=-0.07239581644535065 & pav<=-0.27689608931541443\n",
      "   -0.7196 if cv>=-0.19738071262836457\n",
      "   +1.1500 if cp>=-0.045515719801187515 & pav>=0.6889917254447938\n",
      "Run episode 328 with rewards 18.0\n",
      "============ 329 ===========\n",
      "16 actions [0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0]\n",
      "   +0.0000 if pav<=-0.36785814762115476\n",
      "   +1.8632 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +1.8632 if cv>=-0.19738071262836457\n",
      "   -1.6945 if cp>=-0.045515719801187515 & pav>=0.6889917254447938\n",
      "   -3.2967 if cp>=-0.018701504170894615 & cv<=-0.10313368476927252\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   +0.0000 if cp>=-0.007593466900289059 & pa<=-0.07239581644535065 & pav<=-0.27689608931541443\n",
      "   -2.7658 if cv>=-0.19738071262836457\n",
      "   +1.6945 if cp>=-0.045515719801187515 & pav>=0.6889917254447938\n",
      "   +3.2967 if cp>=-0.018701504170894615 & cv<=-0.10313368476927252\n",
      "Run episode 329 with rewards 16.0\n",
      "============ 330 ===========\n",
      "17 actions [0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0]\n",
      "   +0.5435 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +0.5435 if cv>=-0.19738071262836457\n",
      "   +0.0000 if cp>=-0.045515719801187515 & pav>=0.6889917254447938\n",
      "   +0.0000 if cp>=-0.018701504170894615 & cv<=-0.10313368476927252\n",
      "   +1.1415 if cv>=-0.20626969635486603\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.0265260711312294 & pa<=-0.07224208116531372 & pav<=-0.18836319446563704\n",
      "   -0.4113 if cv>=-0.19738071262836457\n",
      "   -0.0000 if cp>=-0.045515719801187515 & pav>=0.6889917254447938\n",
      "   -0.0000 if cp>=-0.018701504170894615 & cv<=-0.10313368476927252\n",
      "   -1.1371 if cv>=-0.20626969635486603\n",
      "Run episode 330 with rewards 17.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 331 ===========\n",
      "14 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0]\n",
      "   +0.6951 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +0.6951 if cv>=-0.19738071262836457\n",
      "   -1.7496 if cp>=-0.018701504170894615 & cv<=-0.10313368476927252\n",
      "   +0.6951 if cv>=-0.20626969635486603\n",
      "   +1.4411 if cv>=-0.3392065048217773 & pav<=0.6531276464462281\n",
      "--------------\n",
      "   -0.3497 if cv>=-0.19738071262836457\n",
      "   +2.2983 if cp>=-0.045515719801187515 & pav>=0.6889917254447938\n",
      "   +2.9224 if cp>=-0.018701504170894615 & cv<=-0.10313368476927252\n",
      "   -0.3497 if cv>=-0.20626969635486603\n",
      "   -2.8369 if cv>=-0.21936514973640442\n",
      "Run episode 331 with rewards 14.0\n",
      "============ 332 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0]\n",
      "   +0.4533 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +0.5747 if cv>=-0.19738071262836457\n",
      "   +0.0000 if cp>=-0.018701504170894615 & cv<=-0.10313368476927252\n",
      "   +0.5747 if cv>=-0.3392065048217773 & pav<=0.6531276464462281\n",
      "   +3.0217 if cp>=-0.08876736760139464 & cv<=-0.18450306355953217 & cv>=-0.6471563220024109\n",
      "--------------\n",
      "   -0.5160 if cv>=-0.19738071262836457\n",
      "   -0.0000 if cp>=-0.045515719801187515 & pav>=0.6889917254447938\n",
      "   -0.0000 if cp>=-0.018701504170894615 & cv<=-0.10313368476927252\n",
      "   -0.5160 if cv>=-0.21936514973640442\n",
      "   -0.7447 if cv>=-0.3730471909046173\n",
      "Run episode 332 with rewards 12.0\n",
      "============ 333 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 1, 0, 0, 1, 1]\n",
      "   +0.2473 if cv<=0.1876722902059555 & cv>=-0.17802864313125608 & pa>=-0.14913274645805358 & pav>=-0.4390673696994781\n",
      "   +0.2473 if cv>=-0.19738071262836457\n",
      "   +0.2473 if cv>=-0.3392065048217773 & pav<=0.6531276464462281\n",
      "   +0.7958 if cp>=-0.08876736760139464 & cv<=-0.18450306355953217 & cv>=-0.6471563220024109\n",
      "   +3.0590 if cv>=-0.8589064717292785\n",
      "--------------\n",
      "   -0.3305 if cv>=-0.19738071262836457\n",
      "   +1.2282 if cp>=-0.018701504170894615 & cv<=-0.10313368476927252\n",
      "   -0.3305 if cv>=-0.21936514973640442\n",
      "   -0.4365 if cv>=-0.3730471909046173\n",
      "   -3.3534 if cp>=-0.03794348612427711 & cv>=-0.8589064717292785\n",
      "Run episode 333 with rewards 10.0\n",
      "============ 334 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0]\n",
      "   +0.0302 if cv>=-0.19738071262836457\n",
      "   +0.0634 if cv>=-0.3392065048217773 & pav<=0.6531276464462281\n",
      "   +0.1544 if cp>=-0.08876736760139464 & cv<=-0.18450306355953217 & cv>=-0.6471563220024109\n",
      "   +2.3018 if cv>=-0.8589064717292785\n",
      "   -1.7074 if cp>=-0.07290158569812774 & cv<=-0.8819729208946228\n",
      "--------------\n",
      "   -0.1820 if cv>=-0.19738071262836457\n",
      "   +0.0000 if cp>=-0.018701504170894615 & cv<=-0.10313368476927252\n",
      "   -0.3269 if cv>=-0.3730471909046173\n",
      "   -0.7344 if cp>=-0.03794348612427711 & cv>=-0.8589064717292785\n",
      "   +1.7074 if cp>=-0.07290158569812774 & cv<=-0.8819729208946228\n",
      "Run episode 334 with rewards 12.0\n",
      "============ 335 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 1, 1, 0, 1, 0]\n",
      "   +0.4717 if cv>=-0.3392065048217773 & pav<=0.6531276464462281\n",
      "   +0.7704 if cp>=-0.08876736760139464 & cv<=-0.18450306355953217 & cv>=-0.6471563220024109\n",
      "   +2.9154 if cv>=-0.8589064717292785\n",
      "   -0.6108 if cp>=-0.07290158569812774 & cv<=-0.8819729208946228\n",
      "   -1.6702 if cv<=-0.7808522701263427\n",
      "--------------\n",
      "   -0.4121 if cv>=-0.19738071262836457\n",
      "   -0.4121 if cv>=-0.3730471909046173\n",
      "   -1.7739 if cp>=-0.03794348612427711 & cv>=-0.8589064717292785\n",
      "   +1.4157 if cp>=-0.07290158569812774 & cv<=-0.8819729208946228\n",
      "   +1.4656 if pa>=0.18415261805057526\n",
      "Run episode 335 with rewards 10.0\n",
      "============ 336 ===========\n",
      "13 actions [0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1]\n",
      "   +1.2816 if cp>=-0.08876736760139464 & cv<=-0.18450306355953217 & cv>=-0.6471563220024109\n",
      "   +1.1723 if cv>=-0.8589064717292785\n",
      "   -0.6024 if cp>=-0.07290158569812774 & cv<=-0.8819729208946228\n",
      "   -0.8432 if cv<=-0.7808522701263427\n",
      "   -1.8551 if cp<=-0.0607950821518898 & cv<=-0.6743402004241943\n",
      "--------------\n",
      "   -0.2497 if cv>=-0.3730471909046173\n",
      "   -1.4385 if cp>=-0.03794348612427711 & cv>=-0.8589064717292785\n",
      "   +0.5944 if cp>=-0.07290158569812774 & cv<=-0.8819729208946228\n",
      "   +0.0477 if pa>=0.18415261805057526\n",
      "   +2.2573 if cp<=-0.0607950821518898 & cp>=-0.0907419815659523 & cv<=-0.6743402004241943\n",
      "Run episode 336 with rewards 13.0\n",
      "============ 337 ===========\n",
      "14 actions [0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1]\n",
      "   +1.1005 if cp>=-0.08876736760139464 & cv<=-0.18450306355953217 & cv>=-0.6471563220024109\n",
      "   +2.0994 if cv>=-0.8589064717292785\n",
      "   -1.9966 if cv<=-0.7808522701263427\n",
      "   -2.1009 if cp<=-0.0607950821518898 & cv<=-0.6743402004241943\n",
      "   +1.5260 if cp<=-0.08722304105758666 & cp>=-0.12294302582740783\n",
      "--------------\n",
      "   -1.0275 if cv>=-0.3730471909046173\n",
      "   -2.1462 if cp>=-0.03794348612427711 & cv>=-0.8589064717292785\n",
      "   +1.2724 if cp>=-0.07290158569812774 & cv<=-0.8819729208946228\n",
      "   +1.6266 if cp<=-0.0607950821518898 & cp>=-0.0907419815659523 & cv<=-0.6743402004241943\n",
      "   -2.1644 if cp<=-0.08722304105758666 & cp>=-0.12294302582740783 & cv>=-0.7658876061439515\n",
      "Run episode 337 with rewards 14.0\n",
      "============ 338 ===========\n",
      "11 actions [0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +1.7777 if cv>=-0.8589064717292785\n",
      "   -3.7138 if cv<=-0.7808522701263427\n",
      "   -0.2885 if cp<=-0.0607950821518898 & cv<=-0.6743402004241943\n",
      "   -0.6620 if cp<=-0.08722304105758666 & cp>=-0.12294302582740783\n",
      "   +1.7308 if cp<=-0.039311173558235164 & cv>=-0.6024247765541076\n",
      "--------------\n",
      "   -1.5805 if cp>=-0.03794348612427711 & cv>=-0.8589064717292785\n",
      "   +0.0000 if cp>=-0.07290158569812774 & cv<=-0.8819729208946228\n",
      "   +1.0010 if cp<=-0.0607950821518898 & cp>=-0.0907419815659523 & cv<=-0.6743402004241943\n",
      "   -0.3432 if cp<=-0.08722304105758666 & cp>=-0.12294302582740783 & cv>=-0.7658876061439515\n",
      "   +2.4253 if cp>=-0.07292750477790831 & cv<=-0.758466100692749\n",
      "Run episode 338 with rewards 11.0\n",
      "============ 339 ===========\n",
      "14 actions [0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   +2.0281 if cv>=-0.8589064717292785\n",
      "   -2.2586 if cv<=-0.7808522701263427\n",
      "   -0.0000 if cp<=-0.08722304105758666 & cp>=-0.12294302582740783\n",
      "   -0.0000 if cp<=-0.039311173558235164 & cv>=-0.6024247765541076\n",
      "   -1.4167 if cv>=-0.8077098727226257 & pav>=1.0598484277725222\n",
      "--------------\n",
      "   -0.5079 if cp>=-0.03794348612427711 & cv>=-0.8589064717292785\n",
      "   -0.1684 if cp<=-0.0607950821518898 & cp>=-0.0907419815659523 & cv<=-0.6743402004241943\n",
      "   -0.0000 if cp<=-0.08722304105758666 & cp>=-0.12294302582740783 & cv>=-0.7658876061439515\n",
      "   +1.5631 if cp>=-0.07292750477790831 & cv<=-0.758466100692749\n",
      "   -1.9200 if cp>=-0.044538408517837524 & cv>=-0.6175356507301331\n",
      "Run episode 339 with rewards 14.0\n",
      "============ 340 ===========\n",
      "13 actions [0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +3.9364 if cv>=-0.8589064717292785\n",
      "   -0.9539 if cv<=-0.7808522701263427\n",
      "   +0.0000 if cp<=-0.039311173558235164 & cv>=-0.6024247765541076\n",
      "   +0.9436 if cv>=-0.8077098727226257 & pav>=1.0598484277725222\n",
      "   -4.0135 if cp<=-0.04747360572218895 & cv<=-0.8227745175361634\n",
      "--------------\n",
      "   -3.4615 if cp>=-0.03794348612427711 & cv>=-0.8589064717292785\n",
      "   +0.6000 if cp<=-0.0607950821518898 & cp>=-0.0907419815659523 & cv<=-0.6743402004241943\n",
      "   +0.5217 if cp>=-0.07292750477790831 & cv<=-0.758466100692749\n",
      "   -0.3297 if cp>=-0.044538408517837524 & cv>=-0.6175356507301331\n",
      "   +1.7361 if cp<=-0.04747360572218895 & cp>=-0.0872575506567955 & cv<=-0.8227745175361634\n",
      "Run episode 340 with rewards 13.0\n",
      "============ 341 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +2.2086 if cv>=-0.8589064717292785\n",
      "   -0.6248 if cv<=-0.7808522701263427\n",
      "   +1.5768 if cv>=-0.8077098727226257 & pav>=1.0598484277725222\n",
      "   -1.9531 if cp<=-0.04747360572218895 & cv<=-0.8227745175361634\n",
      "   +1.2224 if cp<=-0.03643642589449882 & cp>=-0.10944492518901823 & cv>=-0.996459698677063\n",
      "--------------\n",
      "   -0.4948 if cp>=-0.03794348612427711 & cv>=-0.8589064717292785\n",
      "   -0.1513 if cp<=-0.0607950821518898 & cp>=-0.0907419815659523 & cv<=-0.6743402004241943\n",
      "   -0.0375 if cp>=-0.07292750477790831 & cv<=-0.758466100692749\n",
      "   +0.1473 if cp<=-0.04747360572218895 & cp>=-0.0872575506567955 & cv<=-0.8227745175361634\n",
      "   -0.8972 if cp>=-0.06631259322166441\n",
      "Run episode 341 with rewards 12.0\n",
      "============ 342 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 1, 0, 1, 0]\n",
      "   +3.9750 if cv>=-0.8589064717292785\n",
      "   +1.1272 if cv>=-0.8077098727226257 & pav>=1.0598484277725222\n",
      "   -1.2965 if cp<=-0.04747360572218895 & cv<=-0.8227745175361634\n",
      "   -0.8203 if cp<=-0.03643642589449882 & cp>=-0.10944492518901823 & cv>=-0.996459698677063\n",
      "   -1.6654 if cv>=-0.9883442401885987\n",
      "--------------\n",
      "   -1.5641 if cp>=-0.03794348612427711 & cv>=-0.8589064717292785\n",
      "   +0.5550 if cp<=-0.0607950821518898 & cp>=-0.0907419815659523 & cv<=-0.6743402004241943\n",
      "   +0.7339 if cp<=-0.04747360572218895 & cp>=-0.0872575506567955 & cv<=-0.8227745175361634\n",
      "   +1.0573 if cp>=-0.06631259322166441\n",
      "   -1.6640 if cp>=-0.0607352390885353 & cv>=-0.7968869686126709\n",
      "Run episode 342 with rewards 9.0\n",
      "============ 343 ===========\n",
      "12 actions [0, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 1]\n",
      "   +1.7180 if cv>=-0.8589064717292785\n",
      "   -0.3212 if cv>=-0.8077098727226257 & pav>=1.0598484277725222\n",
      "   +0.0000 if cp<=-0.04747360572218895 & cv<=-0.8227745175361634\n",
      "   -0.2222 if cv>=-0.9883442401885987\n",
      "   -0.2362 if pav>=1.622745156288147\n",
      "--------------\n",
      "   -0.8788 if cp>=-0.03794348612427711 & cv>=-0.8589064717292785\n",
      "   +0.0000 if cp<=-0.04747360572218895 & cp>=-0.0872575506567955 & cv<=-0.8227745175361634\n",
      "   +0.2950 if cp>=-0.06631259322166441\n",
      "   -0.8788 if cp>=-0.0607352390885353 & cv>=-0.7968869686126709\n",
      "   -0.8408 if cp>=-0.007302252575755117\n",
      "Run episode 343 with rewards 12.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 344 ===========\n",
      "14 actions [0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0]\n",
      "   -0.1159 if cv>=-0.8589064717292785\n",
      "   +1.1478 if cv>=-0.8077098727226257 & pav>=1.0598484277725222\n",
      "   -0.2181 if cv>=-0.9883442401885987\n",
      "   +1.6155 if pav>=1.622745156288147\n",
      "   -3.8217 if cp>=0.027288890630006796 & cv<=-0.22523599267005906\n",
      "--------------\n",
      "   -0.4231 if cp>=-0.03794348612427711 & cv>=-0.8589064717292785\n",
      "   +0.6008 if cp>=-0.06631259322166441\n",
      "   -0.7989 if cp>=-0.0607352390885353 & cv>=-0.7968869686126709\n",
      "   +2.0720 if cp>=-0.007302252575755117\n",
      "   -3.2501 if cv>=-0.22523599267005906\n",
      "Run episode 344 with rewards 14.0\n",
      "============ 345 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1]\n",
      "   -1.8300 if cv>=-0.8077098727226257 & pav>=1.0598484277725222\n",
      "   +2.8599 if cv>=-0.9883442401885987\n",
      "   -2.1026 if pav>=1.622745156288147\n",
      "   +0.0000 if cp>=0.027288890630006796 & cv<=-0.22523599267005906\n",
      "   -2.7738 if cp<=-0.05627180784940719 & cp>=-0.1142797589302063\n",
      "--------------\n",
      "   -3.1067 if cp>=-0.06631259322166441\n",
      "   -3.1067 if cp>=-0.0607352390885353 & cv>=-0.7968869686126709\n",
      "   +0.0000 if cp>=-0.007302252575755117\n",
      "   -0.9771 if cv>=-0.22523599267005906\n",
      "   +2.4990 if cp>=-0.08838635087013244\n",
      "Run episode 345 with rewards 11.0\n",
      "============ 346 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 0]\n",
      "   +0.0605 if cv>=-0.8077098727226257 & pav>=1.0598484277725222\n",
      "   +1.9109 if cv>=-0.9883442401885987\n",
      "   -0.9515 if pav>=1.622745156288147\n",
      "   +0.3654 if cp<=-0.05627180784940719 & cp>=-0.1142797589302063\n",
      "   -1.4709 if cv<=-1.164633870124817 & cv>=-1.164633870124817\n",
      "--------------\n",
      "   -0.1803 if cp>=-0.06631259322166441\n",
      "   -0.7400 if cp>=-0.0607352390885353 & cv>=-0.7968869686126709\n",
      "   -0.1789 if cv>=-0.22523599267005906\n",
      "   -0.1446 if cp>=-0.08838635087013244\n",
      "   -1.6984 if cv>=-0.970184862613678\n",
      "Run episode 346 with rewards 10.0\n",
      "============ 347 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +1.7540 if cv>=-0.9883442401885987\n",
      "   +0.5082 if pav>=1.622745156288147\n",
      "   -0.9065 if cp<=-0.05627180784940719 & cp>=-0.1142797589302063\n",
      "   -0.0000 if cv<=-1.164633870124817 & cv>=-1.164633870124817\n",
      "   -1.3183 if pav>=2.0847787857055664\n",
      "--------------\n",
      "   -1.7338 if cp>=-0.06631259322166441\n",
      "   -0.6577 if cp>=-0.0607352390885353 & cv>=-0.7968869686126709\n",
      "   -0.2812 if cv>=-0.22523599267005906\n",
      "   -0.6577 if cv>=-0.970184862613678\n",
      "   +1.4729 if cv<=-1.1707822561264039\n",
      "Run episode 347 with rewards 8.0\n",
      "============ 348 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.0730 if cv>=-0.9883442401885987\n",
      "   +3.2632 if pav>=1.622745156288147\n",
      "   +3.2456 if cp<=-0.05627180784940719 & cp>=-0.1142797589302063\n",
      "   +3.2456 if pav>=2.0847787857055664\n",
      "   +3.2456 if pa>=0.17850427329540253\n",
      "--------------\n",
      "   -0.9454 if cp>=-0.06631259322166441\n",
      "   -0.8814 if cp>=-0.0607352390885353 & cv>=-0.7968869686126709\n",
      "   -0.8814 if cv>=-0.970184862613678\n",
      "   -3.2189 if cv<=-1.1707822561264039\n",
      "   -3.2827 if cp<=-0.01339891161769628\n",
      "Run episode 348 with rewards 9.0\n",
      "============ 349 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0033 if pav>=1.622745156288147\n",
      "   -0.0056 if cp<=-0.05627180784940719 & cp>=-0.1142797589302063\n",
      "   -0.0056 if pav>=2.0847787857055664\n",
      "   -0.0057 if pa>=0.17850427329540253\n",
      "   +1.4421 if cp>=-0.02150057107210159\n",
      "--------------\n",
      "   -1.5590 if cp>=-0.06631259322166441\n",
      "   -1.3276 if cv>=-0.970184862613678\n",
      "   -0.0126 if cv<=-1.1707822561264039\n",
      "   -0.2315 if cp<=-0.01339891161769628\n",
      "   -0.6707 if cp<=0.011960964463651181\n",
      "Run episode 349 with rewards 8.0\n",
      "============ 350 ===========\n",
      "33 actions [0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   -0.0000 if cp<=-0.05627180784940719 & cp>=-0.1142797589302063\n",
      "   -0.3324 if pav>=2.0847787857055664\n",
      "   -0.0000 if pa>=0.17850427329540253\n",
      "   +1.1065 if cp>=-0.02150057107210159\n",
      "   +0.5818 if cp>=0.02638936415314675\n",
      "--------------\n",
      "   -0.5873 if cp>=-0.06631259322166441\n",
      "   -1.7420 if cv>=-0.970184862613678\n",
      "   +2.4871 if cp<=-0.01339891161769628\n",
      "   +1.1547 if cp<=0.011960964463651181\n",
      "   +3.1556 if pa>=0.16682326793670654\n",
      "Run episode 350 with rewards 33.0\n",
      "============ 351 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 1, 0, 1, 1, 1]\n",
      "   -0.0000 if pav>=2.0847787857055664\n",
      "   +0.0048 if pa>=0.17850427329540253\n",
      "   +0.0973 if cp>=-0.02150057107210159\n",
      "   -0.0000 if cp>=0.02638936415314675\n",
      "   +5.0727 if cp<=-0.015216048434376716 & cv>=-0.00019178946968167793 & pa<=0.028405169770121575 & pa<=0.04051305800676348\n",
      "--------------\n",
      "   -2.2640 if cv>=-0.970184862613678\n",
      "   +6.1885 if cp<=-0.01339891161769628\n",
      "   -0.6555 if cp<=0.011960964463651181\n",
      "   +0.0445 if pa>=0.16682326793670654\n",
      "   -3.8676 if cp<=-0.015216048434376716 & cv>=-0.00019178946968167793 & pa<=0.04051305800676348\n",
      "Run episode 351 with rewards 10.0\n",
      "============ 352 ===========\n",
      "46 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0367 if pa>=0.17850427329540253\n",
      "   -0.9148 if cp>=-0.02150057107210159\n",
      "   +3.8517 if cp>=0.02638936415314675\n",
      "   +0.0000 if cp<=-0.015216048434376716 & cv>=-0.00019178946968167793 & pa<=0.028405169770121575 & pa<=0.04051305800676348\n",
      "   -1.8995 if cp>=0.003932586498558523\n",
      "--------------\n",
      "   -2.7431 if cv>=-0.970184862613678\n",
      "   +1.5306 if cp<=-0.01339891161769628\n",
      "   +3.2409 if cp<=0.011960964463651181\n",
      "   +0.0000 if cp<=-0.015216048434376716 & cv>=-0.00019178946968167793 & pa<=0.04051305800676348\n",
      "   -1.1433 if cp<=0.003932586498558523\n",
      "Run episode 352 with rewards 46.0\n",
      "============ 353 ===========\n",
      "23 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -0.6932 if pa>=0.17850427329540253\n",
      "   -1.3536 if cp>=-0.02150057107210159\n",
      "   +3.3855 if cp>=0.02638936415314675\n",
      "   +2.0141 if cp>=0.003932586498558523\n",
      "   -4.2243 if cp<=0.040508739650249516\n",
      "--------------\n",
      "   -5.4464 if cv>=-0.970184862613678\n",
      "   +1.2016 if cp<=-0.01339891161769628\n",
      "   +4.4451 if cp<=0.011960964463651181\n",
      "   +2.7606 if cp<=0.003932586498558523\n",
      "   +2.9981 if \n",
      "Run episode 353 with rewards 23.0\n",
      "============ 354 ===========\n",
      "25 actions [1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0941 if cp>=-0.02150057107210159\n",
      "   +2.1340 if cp>=0.02638936415314675\n",
      "   +0.8712 if cp>=0.003932586498558523\n",
      "   -0.8625 if cp<=0.040508739650249516\n",
      "   -4.1860 if pav>=0.9139646291732788\n",
      "--------------\n",
      "   -1.1053 if cv>=-0.970184862613678\n",
      "   +2.8291 if cp<=0.011960964463651181\n",
      "   +2.4131 if cp<=0.003932586498558523\n",
      "   -1.1053 if \n",
      "   -3.7471 if cv>=-0.3446968972682952\n",
      "Run episode 354 with rewards 25.0\n",
      "============ 355 ===========\n",
      "47 actions [0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0]\n",
      "   -0.0000 if cp>=0.02638936415314675\n",
      "   -0.0000 if cp>=0.003932586498558523\n",
      "   -0.2417 if cp<=0.040508739650249516\n",
      "   -0.0000 if pav>=0.9139646291732788\n",
      "   -4.2778 if cv<=-0.07183882594108569\n",
      "--------------\n",
      "   -0.3330 if cv>=-0.970184862613678\n",
      "   -0.3330 if cp<=0.011960964463651181\n",
      "   -0.3330 if cp<=0.003932586498558523\n",
      "   -0.3330 if cv>=-0.3446968972682952\n",
      "   +4.2744 if cv<=-0.07183882594108569\n",
      "Run episode 355 with rewards 47.0\n",
      "============ 356 ===========\n",
      "36 actions [0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.0000 if cp>=0.02638936415314675\n",
      "   -0.7501 if cp<=0.040508739650249516\n",
      "   -0.0172 if pav>=0.9139646291732788\n",
      "   -2.3940 if cv<=-0.07183882594108569\n",
      "   +4.3947 if pa<=0.02414458617568016 & pav<=0.11306872069835668\n",
      "--------------\n",
      "   +0.5127 if cp<=0.011960964463651181\n",
      "   +0.5127 if cp<=0.003932586498558523\n",
      "   -5.1760 if cv>=-0.3446968972682952\n",
      "   +4.2748 if cv<=-0.07183882594108569\n",
      "   +3.3845 if pa>=0.02414458617568016\n",
      "Run episode 356 with rewards 36.0\n",
      "============ 357 ===========\n",
      "23 actions [1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0]\n",
      "   -1.3633 if cp<=0.040508739650249516\n",
      "   +0.0002 if pav>=0.9139646291732788\n",
      "   +0.5217 if cv<=-0.07183882594108569\n",
      "   +0.3764 if pa<=0.02414458617568016 & pav<=0.11306872069835668\n",
      "   +3.7566 if cv>=0.17104287445545197 & pav<=0.04846886172890663\n",
      "--------------\n",
      "   +1.6952 if cp<=0.011960964463651181\n",
      "   -7.2348 if cv>=-0.3446968972682952\n",
      "   +2.8961 if cv<=-0.07183882594108569\n",
      "   +4.6890 if pa>=0.02414458617568016\n",
      "   +5.2490 if cp<=0.03653797507286072 & cv<=0.17104287445545197 & pav<=0.04846886172890663\n",
      "Run episode 357 with rewards 23.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 358 ===========\n",
      "21 actions [1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1]\n",
      "   -1.1284 if cp<=0.040508739650249516\n",
      "   -0.8783 if cv<=-0.07183882594108569\n",
      "   -1.1284 if pa<=0.02414458617568016 & pav<=0.11306872069835668\n",
      "   +0.4040 if cv>=0.17104287445545197 & pav<=0.04846886172890663\n",
      "   +2.3377 if cv>=-0.03481434732675552 & pav<=-0.3617499887943267\n",
      "--------------\n",
      "   -1.8509 if cv>=-0.3446968972682952\n",
      "   +4.0543 if cv<=-0.07183882594108569\n",
      "   +0.0000 if pa>=0.02414458617568016\n",
      "   -0.2181 if cp<=0.03653797507286072 & cv<=0.17104287445545197 & pav<=0.04846886172890663\n",
      "   +5.1087 if cp<=0.009908768162131312 & cv<=0.1573768675327301 & pav>=-0.46949173212051387\n",
      "Run episode 358 with rewards 21.0\n",
      "============ 359 ===========\n",
      "31 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -1.9687 if cp<=0.040508739650249516\n",
      "   -0.0003 if cv<=-0.07183882594108569\n",
      "   -1.9687 if pa<=0.02414458617568016 & pav<=0.11306872069835668\n",
      "   +0.1797 if cv>=-0.03481434732675552 & pav<=-0.3617499887943267\n",
      "   +4.4665 if cv>=0.02264917641878128 & pav<=-0.3477258384227752\n",
      "--------------\n",
      "   +0.4144 if cv>=-0.3446968972682952\n",
      "   +0.0560 if cv<=-0.07183882594108569\n",
      "   -1.6824 if cp<=0.03653797507286072 & cv<=0.17104287445545197 & pav<=0.04846886172890663\n",
      "   +3.3067 if cp<=0.009908768162131312 & cv<=0.1573768675327301 & pav>=-0.46949173212051387\n",
      "   -3.1828 if cv>=0.19919684529304504\n",
      "Run episode 359 with rewards 31.0\n",
      "============ 360 ===========\n",
      "34 actions [1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1]\n",
      "   -3.8813 if cp<=0.040508739650249516\n",
      "   -1.6910 if pa<=0.02414458617568016 & pav<=0.11306872069835668\n",
      "   +1.0957 if cv>=-0.03481434732675552 & pav<=-0.3617499887943267\n",
      "   +4.9300 if cv>=0.02264917641878128 & pav<=-0.3477258384227752\n",
      "   +1.2454 if pa>=-0.04931034520268438\n",
      "--------------\n",
      "   +0.3174 if cv>=-0.3446968972682952\n",
      "   +1.0505 if cp<=0.03653797507286072 & cv<=0.17104287445545197 & pav<=0.04846886172890663\n",
      "   +1.0506 if cp<=0.009908768162131312 & cv<=0.1573768675327301 & pav>=-0.46949173212051387\n",
      "   -3.7516 if cv>=0.19919684529304504\n",
      "   -1.5522 if cp>=0.02562003955245018 & cv>=0.0022663669660687447 & cv>=0.18106700479984283 & pav>=-0.310505986213684\n",
      "Run episode 360 with rewards 34.0\n",
      "============ 361 ===========\n",
      "10 actions [1, 1, 1, 0, 1, 1, 1, 1, 0, 0]\n",
      "   -7.1757 if cp<=0.040508739650249516\n",
      "   +2.7746 if pa<=0.02414458617568016 & pav<=0.11306872069835668\n",
      "   +6.8399 if cv>=0.02264917641878128 & pav<=-0.3477258384227752\n",
      "   +2.5041 if pa>=-0.04931034520268438\n",
      "   -5.0552 if \n",
      "--------------\n",
      "   +0.6406 if cp<=0.03653797507286072 & cv<=0.17104287445545197 & pav<=0.04846886172890663\n",
      "   +0.0000 if cp<=0.009908768162131312 & cv<=0.1573768675327301 & pav>=-0.46949173212051387\n",
      "   -1.6248 if cv>=0.19919684529304504\n",
      "   -0.6884 if cp>=0.02562003955245018 & cv>=0.0022663669660687447 & cv>=0.18106700479984283 & pav>=-0.310505986213684\n",
      "   +4.1014 if pav>=0.2653047740459442\n",
      "Run episode 361 with rewards 10.0\n",
      "============ 362 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +3.3710 if cp<=0.040508739650249516\n",
      "   -3.4697 if pa<=0.02414458617568016 & pav<=0.11306872069835668\n",
      "   -2.3911 if cv>=0.02264917641878128 & pav<=-0.3477258384227752\n",
      "   -3.4697 if \n",
      "   +5.1377 if cp<=-0.013676274754106998 & cv>=0.4963960409164429\n",
      "--------------\n",
      "   +0.0261 if cp<=0.03653797507286072 & cv<=0.17104287445545197 & pav<=0.04846886172890663\n",
      "   +1.4294 if cv>=0.19919684529304504\n",
      "   -0.0000 if cp>=0.02562003955245018 & cv>=0.0022663669660687447 & cv>=0.18106700479984283 & pav>=-0.310505986213684\n",
      "   -0.0000 if pav>=0.2653047740459442\n",
      "   -3.0381 if cp<=-0.013676274754106998 & cv>=0.4963960409164429\n",
      "Run episode 362 with rewards 10.0\n",
      "============ 363 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2215 if cp<=0.040508739650249516\n",
      "   -1.0723 if pa<=0.02414458617568016 & pav<=0.11306872069835668\n",
      "   -1.0723 if \n",
      "   +0.0000 if cp<=-0.013676274754106998 & cv>=0.4963960409164429\n",
      "   -0.5396 if pa>=0.0051304916851222515\n",
      "--------------\n",
      "   +0.3181 if cp<=0.03653797507286072 & cv<=0.17104287445545197 & pav<=0.04846886172890663\n",
      "   +0.3681 if cv>=0.19919684529304504\n",
      "   -0.0000 if pav>=0.2653047740459442\n",
      "   -0.0000 if cp<=-0.013676274754106998 & cv>=0.4963960409164429\n",
      "   +0.5818 if cp<=-0.013234452530741691\n",
      "Run episode 363 with rewards 9.0\n",
      "============ 364 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -2.9345 if cp<=0.040508739650249516\n",
      "   +0.0224 if pa<=0.02414458617568016 & pav<=0.11306872069835668\n",
      "   +0.0224 if \n",
      "   -0.0000 if pa>=0.0051304916851222515\n",
      "   +9.6889 if cp>=0.08511115610599519\n",
      "--------------\n",
      "   +0.3074 if cp<=0.03653797507286072 & cv<=0.17104287445545197 & pav<=0.04846886172890663\n",
      "   -0.3069 if cv>=0.19919684529304504\n",
      "   +0.0000 if cp<=-0.013676274754106998 & cv>=0.4963960409164429\n",
      "   +0.0000 if cp<=-0.013234452530741691\n",
      "   +1.3310 if cp<=0.08511115610599519\n",
      "Run episode 364 with rewards 10.0\n",
      "============ 365 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.2407 if cp<=0.040508739650249516\n",
      "   -8.3630 if pa<=0.02414458617568016 & pav<=0.11306872069835668\n",
      "   -8.4079 if \n",
      "   -5.4486 if cp>=0.08511115610599519\n",
      "   +1.0000 if cp<=0.04404636174440384\n",
      "--------------\n",
      "   +0.0810 if cp<=0.03653797507286072 & cv<=0.17104287445545197 & pav<=0.04846886172890663\n",
      "   +3.2383 if cv>=0.19919684529304504\n",
      "   +0.0844 if cp<=-0.013234452530741691\n",
      "   +3.3102 if cp<=0.08511115610599519\n",
      "   +0.0855 if cp<=0.04404636174440384\n",
      "Run episode 365 with rewards 9.0\n",
      "============ 366 ===========\n",
      "12 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1]\n",
      "   -0.3969 if pa<=0.02414458617568016 & pav<=0.11306872069835668\n",
      "   -0.3969 if \n",
      "   +0.0480 if cp>=0.08511115610599519\n",
      "   +0.0000 if cp<=0.04404636174440384\n",
      "   -0.0254 if cp<=0.08477887511253358 & cp>=0.0483964703977108\n",
      "--------------\n",
      "   +0.0000 if cv>=0.19919684529304504\n",
      "   -0.0000 if cp<=-0.013234452530741691\n",
      "   +0.0000 if cp<=0.08511115610599519\n",
      "   -0.0000 if cp<=0.04404636174440384\n",
      "   +0.0000 if cp<=0.0483964703977108\n",
      "Run episode 366 with rewards 12.0\n",
      "============ 367 ===========\n",
      "66 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0]\n",
      "   -1.4293 if pa<=0.02414458617568016 & pav<=0.11306872069835668\n",
      "   -1.4293 if \n",
      "   +4.8146 if cp>=0.08511115610599519\n",
      "   +0.9623 if cp<=0.08477887511253358 & cp>=0.0483964703977108\n",
      "   +2.9224 if cv>=1.1548423767089844\n",
      "--------------\n",
      "   -2.4667 if cv>=0.19919684529304504\n",
      "   +2.8531 if cp<=0.08511115610599519\n",
      "   +0.9796 if cp<=0.04404636174440384\n",
      "   +1.8508 if cp<=0.0483964703977108\n",
      "   -2.4593 if cv>=1.1548423767089844\n",
      "Run episode 367 with rewards 66.0\n",
      "============ 368 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +0.7104 if pa<=0.02414458617568016 & pav<=0.11306872069835668\n",
      "   +1.1499 if \n",
      "   +4.5768 if cp>=0.08511115610599519\n",
      "   +1.5781 if cv>=1.1548423767089844\n",
      "   -6.0343 if cp<=0.0868325233459473 & cv<=0.8284024596214294\n",
      "--------------\n",
      "   -3.0188 if cv>=0.19919684529304504\n",
      "   +5.1592 if cp<=0.08511115610599519\n",
      "   +1.4421 if cp<=0.0483964703977108\n",
      "   -4.2817 if cv>=1.1548423767089844\n",
      "   -6.5911 if cp>=0.03985011205077171 & cv>=0.8284024596214294 & pa<=0.023325443267822276 & pa>=-0.05468779429793358\n",
      "Run episode 368 with rewards 11.0\n",
      "============ 369 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   -3.2546 if \n",
      "   -5.5260 if cp>=0.08511115610599519\n",
      "   +1.1427 if cv>=1.1548423767089844\n",
      "   -0.0629 if cp<=0.0868325233459473 & cv<=0.8284024596214294\n",
      "   +2.3472 if cp>=0.020207712426781675 & cv>=1.1412917375564575\n",
      "--------------\n",
      "   +0.9403 if cv>=0.19919684529304504\n",
      "   +1.0695 if cp<=0.08511115610599519\n",
      "   -0.5098 if cv>=1.1548423767089844\n",
      "   +0.0000 if cp>=0.03985011205077171 & cv>=0.8284024596214294 & pa<=0.023325443267822276 & pa>=-0.05468779429793358\n",
      "   +2.0327 if cp<=0.020207712426781675 & cv>=0.9458302855491638\n",
      "Run episode 369 with rewards 10.0\n",
      "============ 370 ===========\n",
      "34 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.4769 if \n",
      "   +6.1951 if cp>=0.08511115610599519\n",
      "   +1.6465 if cv>=1.1548423767089844\n",
      "   +1.6465 if cp>=0.020207712426781675 & cv>=1.1412917375564575\n",
      "   -0.8818 if pav>=0.006291650701314211\n",
      "--------------\n",
      "   +3.3987 if cv>=0.19919684529304504\n",
      "   +3.4121 if cp<=0.08511115610599519\n",
      "   +3.3968 if cv>=1.1548423767089844\n",
      "   +0.0004 if cp<=0.020207712426781675 & cv>=0.9458302855491638\n",
      "   +0.0031 if cp<=0.05527282506227494\n",
      "Run episode 370 with rewards 34.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 371 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   -1.2095 if \n",
      "   +9.8503 if cp>=0.08511115610599519\n",
      "   +6.9587 if cv>=1.1548423767089844\n",
      "   +6.9625 if cp>=0.020207712426781675 & cv>=1.1412917375564575\n",
      "   +1.0000 if cv>=1.7561767101287842\n",
      "--------------\n",
      "   -2.7361 if cv>=0.19919684529304504\n",
      "   +4.8524 if cp<=0.08511115610599519\n",
      "   -4.7964 if cv>=1.1548423767089844\n",
      "   +2.6294 if cp<=0.05527282506227494\n",
      "   -0.8963 if cv>=1.7561767101287842\n",
      "Run episode 371 with rewards 10.0\n",
      "============ 372 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.0429 if \n",
      "   -2.8977 if cp>=0.08511115610599519\n",
      "   +0.1369 if cv>=1.1548423767089844\n",
      "   +0.1369 if cp>=0.020207712426781675 & cv>=1.1412917375564575\n",
      "   +1.5735 if cv>=1.0037715196609498\n",
      "--------------\n",
      "   +1.0358 if cv>=0.19919684529304504\n",
      "   +1.4795 if cp<=0.08511115610599519\n",
      "   -0.0000 if cv>=1.1548423767089844\n",
      "   +0.9885 if cp<=0.05527282506227494\n",
      "   +0.4452 if pav>=0.01164502277970314\n",
      "Run episode 372 with rewards 9.0\n",
      "============ 373 ===========\n",
      "26 actions [1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1]\n",
      "   -0.7223 if \n",
      "   -0.0807 if cp>=0.08511115610599519\n",
      "   +9.4463 if cp>=0.020207712426781675 & cv>=1.1412917375564575\n",
      "   +8.3970 if cv>=1.0037715196609498\n",
      "   +1.0000 if cp>=0.08174191415309906\n",
      "--------------\n",
      "   -4.6274 if cv>=0.19919684529304504\n",
      "   -4.5693 if cp<=0.08511115610599519\n",
      "   +2.6022 if cp<=0.05527282506227494\n",
      "   +0.0000 if pav>=0.01164502277970314\n",
      "   +5.5996 if cp<=0.04164111316204072\n",
      "Run episode 373 with rewards 26.0\n",
      "============ 374 ===========\n",
      "27 actions [1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.4914 if \n",
      "   -0.0000 if cp>=0.020207712426781675 & cv>=1.1412917375564575\n",
      "   -0.0000 if cv>=1.0037715196609498\n",
      "   -0.0000 if cp>=0.08174191415309906\n",
      "   -4.5979 if cp>=0.04363469779491425 & pa<=-0.1040220856666565 & pa>=-0.127776101231575 & pav>=-0.5624414682388306 & pav>=-0.8160780072212219\n",
      "--------------\n",
      "   -2.9448 if cv>=0.19919684529304504\n",
      "   -4.0343 if cp<=0.08511115610599519\n",
      "   +3.4342 if cp<=0.05527282506227494\n",
      "   +4.2126 if cp<=0.04164111316204072\n",
      "   -4.0548 if pa>=-0.09353861957788467 & pav<=-0.8160780072212219\n",
      "Run episode 374 with rewards 27.0\n",
      "============ 375 ===========\n",
      "13 actions [1, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0]\n",
      "   -1.7743 if \n",
      "   +0.0000 if cp>=0.020207712426781675 & cv>=1.1412917375564575\n",
      "   +0.0000 if cv>=1.0037715196609498\n",
      "   +0.0000 if cp>=0.04363469779491425 & pa<=-0.1040220856666565 & pa>=-0.127776101231575 & pav>=-0.5624414682388306 & pav>=-0.8160780072212219\n",
      "   +5.4900 if cp<=0.013327199593186378 & cv<=0.4403892993927002 & pa>=-0.10237340927124021 & pav<=-0.5955362558364868\n",
      "--------------\n",
      "   -2.2609 if cp<=0.08511115610599519\n",
      "   +0.7376 if cp<=0.05527282506227494\n",
      "   +4.3272 if cp<=0.04164111316204072\n",
      "   -6.1564 if pa>=-0.09353861957788467 & pav<=-0.8160780072212219\n",
      "   -6.2133 if cp<=0.013327199593186378 & cv<=0.4403892993927002 & pa>=-0.10237340927124021 & pav<=-0.5955362558364868\n",
      "Run episode 375 with rewards 13.0\n",
      "============ 376 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.8825 if \n",
      "   -5.8337 if cp>=0.020207712426781675 & cv>=1.1412917375564575\n",
      "   +0.0000 if cp>=0.04363469779491425 & pa<=-0.1040220856666565 & pa>=-0.127776101231575 & pav>=-0.5624414682388306 & pav>=-0.8160780072212219\n",
      "   +0.6706 if cp<=0.013327199593186378 & cv<=0.4403892993927002 & pa>=-0.10237340927124021 & pav<=-0.5955362558364868\n",
      "   +5.3423 if pa>=-0.02455228753387928\n",
      "--------------\n",
      "   +3.5351 if cp<=0.08511115610599519\n",
      "   -2.3288 if cp<=0.04164111316204072\n",
      "   -4.2533 if pa>=-0.09353861957788467 & pav<=-0.8160780072212219\n",
      "   -0.6773 if cp<=0.013327199593186378 & cv<=0.4403892993927002 & pa>=-0.10237340927124021 & pav<=-0.5955362558364868\n",
      "   -4.7700 if pa>=-0.02455228753387928\n",
      "Run episode 376 with rewards 9.0\n",
      "============ 377 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.6514 if \n",
      "   -0.0000 if cp>=0.020207712426781675 & cv>=1.1412917375564575\n",
      "   -0.0000 if cp<=0.013327199593186378 & cv<=0.4403892993927002 & pa>=-0.10237340927124021 & pav<=-0.5955362558364868\n",
      "   +0.6514 if pa>=-0.02455228753387928\n",
      "   +0.2932 if cp<=-0.02963837869465351\n",
      "--------------\n",
      "   -0.3711 if cp<=0.08511115610599519\n",
      "   -0.3711 if cp<=0.04164111316204072\n",
      "   +0.0000 if pa>=-0.09353861957788467 & pav<=-0.8160780072212219\n",
      "   -0.3711 if pa>=-0.02455228753387928\n",
      "   -0.0244 if cp<=-0.06148641109466552\n",
      "Run episode 377 with rewards 8.0\n",
      "============ 378 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.3543 if \n",
      "   +0.0000 if cp>=0.020207712426781675 & cv>=1.1412917375564575\n",
      "   +1.3543 if pa>=-0.02455228753387928\n",
      "   -0.0502 if cp<=-0.02963837869465351\n",
      "   +0.4812 if cp<=0.035158231109380725\n",
      "--------------\n",
      "   -1.0098 if cp<=0.08511115610599519\n",
      "   -1.0098 if cp<=0.04164111316204072\n",
      "   -1.0098 if pa>=-0.02455228753387928\n",
      "   -0.0000 if cp<=-0.06148641109466552\n",
      "   -0.0230 if cp<=0.012272758409380916\n",
      "Run episode 378 with rewards 9.0\n",
      "============ 379 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.6491 if \n",
      "   +0.6491 if pa>=-0.02455228753387928\n",
      "   -0.0314 if cp<=-0.02963837869465351\n",
      "   +0.6491 if cp<=0.035158231109380725\n",
      "   +0.1297 if cp<=0.016183263622224338 & cp>=-0.03466478697955608\n",
      "--------------\n",
      "   -0.5920 if cp<=0.08511115610599519\n",
      "   -0.5920 if cp<=0.04164111316204072\n",
      "   -0.5920 if pa>=-0.02455228753387928\n",
      "   -0.1074 if cp<=0.012272758409380916\n",
      "   -0.2529 if cp>=0.025946998223662376\n",
      "Run episode 379 with rewards 9.0\n",
      "============ 380 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.9215 if \n",
      "   +0.9215 if pa>=-0.02455228753387928\n",
      "   +0.9215 if cp<=0.035158231109380725\n",
      "   +0.2771 if cp<=0.016183263622224338 & cp>=-0.03466478697955608\n",
      "   -0.0460 if cp<=-0.04327711537480354\n",
      "--------------\n",
      "   -0.8950 if cp<=0.08511115610599519\n",
      "   -0.8950 if cp<=0.04164111316204072\n",
      "   -0.8950 if pa>=-0.02455228753387928\n",
      "   -0.0000 if cp>=0.025946998223662376\n",
      "   -0.0444 if cp<=-0.011193541251122948\n",
      "Run episode 380 with rewards 9.0\n",
      "============ 381 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.6399 if \n",
      "   +0.6399 if pa>=-0.02455228753387928\n",
      "   +0.6399 if cp<=0.035158231109380725\n",
      "   +0.4744 if cp<=0.016183263622224338 & cp>=-0.03466478697955608\n",
      "   -0.0441 if cp<=-0.07903616726398469\n",
      "--------------\n",
      "   -0.5485 if cp<=0.08511115610599519\n",
      "   -0.5485 if cp<=0.04164111316204072\n",
      "   -0.5485 if pa>=-0.02455228753387928\n",
      "   -0.5485 if cp<=-0.011193541251122948\n",
      "   +0.0336 if cp<=-0.07903616726398469\n",
      "Run episode 381 with rewards 10.0\n",
      "============ 382 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.1376 if \n",
      "   +0.1864 if pa>=-0.02455228753387928\n",
      "   +1.1376 if cp<=0.035158231109380725\n",
      "   +1.0009 if cp<=0.016183263622224338 & cp>=-0.03466478697955608\n",
      "   +0.2965 if cp<=-0.00849759066477418 & cp>=-0.02513997592031955\n",
      "--------------\n",
      "   -1.2190 if cp<=0.08511115610599519\n",
      "   -1.2190 if cp<=0.04164111316204072\n",
      "   -0.1087 if pa>=-0.02455228753387928\n",
      "   -0.2385 if cp<=-0.011193541251122948\n",
      "   -0.4891 if cp<=-0.00849759066477418 & cp>=-0.09581913203001022\n",
      "Run episode 382 with rewards 10.0\n",
      "============ 383 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.0523 if \n",
      "   +0.2934 if cp<=0.035158231109380725\n",
      "   +0.1213 if cp<=0.016183263622224338 & cp>=-0.03466478697955608\n",
      "   +0.0553 if cp<=-0.00849759066477418 & cp>=-0.02513997592031955\n",
      "   +1.0525 if cp>=-0.006861220742575822\n",
      "--------------\n",
      "   -1.4321 if cp<=0.08511115610599519\n",
      "   -1.4321 if cp<=0.04164111316204072\n",
      "   +0.0043 if cp<=-0.011193541251122948\n",
      "   -0.0173 if cp<=-0.00849759066477418 & cp>=-0.09581913203001022\n",
      "   -0.0771 if cp<=0.021132018789649015\n",
      "Run episode 383 with rewards 9.0\n",
      "============ 384 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.1562 if \n",
      "   +0.1395 if cp<=0.035158231109380725\n",
      "   +0.0770 if cp<=0.016183263622224338 & cp>=-0.03466478697955608\n",
      "   +1.1729 if cp>=-0.006861220742575822\n",
      "   +0.5932 if cp>=0.042923372238874435\n",
      "--------------\n",
      "   -1.7131 if cp<=0.08511115610599519\n",
      "   -0.3070 if cp<=0.04164111316204072\n",
      "   +0.0827 if cp<=-0.00849759066477418 & cp>=-0.09581913203001022\n",
      "   +0.0042 if cp<=0.021132018789649015\n",
      "   +0.1813 if pa>=0.20311139523983002\n",
      "Run episode 384 with rewards 9.0\n",
      "============ 385 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.0811 if \n",
      "   +0.4206 if cp<=0.035158231109380725\n",
      "   +1.1426 if cp>=-0.006861220742575822\n",
      "   +0.0000 if cp>=0.042923372238874435\n",
      "   -0.1562 if pa>=0.17650346457958221\n",
      "--------------\n",
      "   -0.9468 if cp<=0.08511115610599519\n",
      "   -0.9468 if cp<=0.04164111316204072\n",
      "   +0.1201 if cp<=-0.00849759066477418 & cp>=-0.09581913203001022\n",
      "   -0.0000 if pa>=0.20311139523983002\n",
      "   -0.4816 if cp<=0.03571414425969124 & cp>=-0.03343653492629528\n",
      "Run episode 385 with rewards 10.0\n",
      "============ 386 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.3245 if \n",
      "   +0.0214 if cp<=0.035158231109380725\n",
      "   +1.4775 if cp>=-0.006861220742575822\n",
      "   +0.0000 if pa>=0.17650346457958221\n",
      "   +0.6427 if cp>=0.04537826031446457\n",
      "--------------\n",
      "   -1.1573 if cp<=0.08511115610599519\n",
      "   -0.2777 if cp<=0.04164111316204072\n",
      "   +0.2207 if cp<=-0.00849759066477418 & cp>=-0.09581913203001022\n",
      "   -0.4578 if cp<=0.03571414425969124 & cp>=-0.03343653492629528\n",
      "   -1.0417 if cp>=0.031421162933111195\n",
      "Run episode 386 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 387 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.2677 if \n",
      "   +1.2677 if cp<=0.035158231109380725\n",
      "   -0.0000 if cp>=-0.006861220742575822\n",
      "   -0.0000 if cp>=0.04537826031446457\n",
      "   +0.5821 if cp<=-0.025655345246195792\n",
      "--------------\n",
      "   -1.2831 if cp<=0.08511115610599519\n",
      "   -1.2831 if cp<=0.04164111316204072\n",
      "   -0.6647 if cp<=0.03571414425969124 & cp>=-0.03343653492629528\n",
      "   -0.0000 if cp>=0.031421162933111195\n",
      "   -0.1095 if cp<=-0.05803776532411575\n",
      "Run episode 387 with rewards 9.0\n",
      "============ 388 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7542 if \n",
      "   +0.7542 if cp<=0.035158231109380725\n",
      "   +0.0000 if cp>=-0.006861220742575822\n",
      "   +0.7542 if cp<=-0.025655345246195792\n",
      "   +0.0415 if cp<=-0.07161058485507965\n",
      "--------------\n",
      "   -0.7694 if cp<=0.08511115610599519\n",
      "   -0.7694 if cp<=0.04164111316204072\n",
      "   -0.0000 if cp<=0.03571414425969124 & cp>=-0.03343653492629528\n",
      "   -0.1048 if cp<=-0.05803776532411575\n",
      "   -0.3302 if cp<=-0.03937894478440285\n",
      "Run episode 388 with rewards 11.0\n",
      "============ 389 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +2.6637 if \n",
      "   +0.5566 if cp<=0.035158231109380725\n",
      "   +0.0272 if cp<=-0.025655345246195792\n",
      "   -0.0375 if cp<=-0.07161058485507965\n",
      "   +0.2768 if cp<=0.03894823417067528 & cp>=0.03894823417067528\n",
      "--------------\n",
      "   -1.9911 if cp<=0.08511115610599519\n",
      "   -0.9270 if cp<=0.04164111316204072\n",
      "   +0.0236 if cp<=-0.05803776532411575\n",
      "   +0.0236 if cp<=-0.03937894478440285\n",
      "   -1.2437 if cp>=0.03894823417067528\n",
      "Run episode 389 with rewards 10.0\n",
      "============ 390 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +4.2616 if \n",
      "   +4.2546 if cp<=0.035158231109380725\n",
      "   +4.8539 if cp<=-0.07161058485507965\n",
      "   +0.0009 if cp<=0.03894823417067528 & cp>=0.03894823417067528\n",
      "   +1.0000 if pa>=0.20884059369564056\n",
      "--------------\n",
      "   -3.4381 if cp<=0.08511115610599519\n",
      "   -3.5577 if cp<=0.04164111316204072\n",
      "   -4.2807 if cp<=-0.05803776532411575\n",
      "   +0.1398 if cp>=0.03894823417067528\n",
      "   -0.5353 if pa>=0.20884059369564056\n",
      "Run episode 390 with rewards 9.0\n",
      "============ 391 ===========\n",
      "25 actions [0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0]\n",
      "   +0.0757 if \n",
      "   +0.0757 if cp<=0.035158231109380725\n",
      "   -0.0001 if cp<=-0.07161058485507965\n",
      "   +0.0000 if pa>=0.20884059369564056\n",
      "   +0.0390 if cp<=-0.0019791558384895306 & cp>=-0.07214042842388153\n",
      "--------------\n",
      "   -0.0195 if cp<=0.08511115610599519\n",
      "   -0.0195 if cp<=0.04164111316204072\n",
      "   -0.0006 if cp<=-0.05803776532411575\n",
      "   +0.0000 if pa>=0.20884059369564056\n",
      "   -0.0105 if cp<=-0.0019791558384895306 & cp>=-0.07214042842388153\n",
      "Run episode 391 with rewards 25.0\n",
      "============ 392 ===========\n",
      "30 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -0.5790 if \n",
      "   -0.5790 if cp<=0.035158231109380725\n",
      "   -1.0893 if cp<=-0.07161058485507965\n",
      "   +0.5079 if cp<=-0.0019791558384895306 & cp>=-0.07214042842388153\n",
      "   +1.3978 if cv>=-0.006005787011235947\n",
      "--------------\n",
      "   +0.4732 if cp<=0.08511115610599519\n",
      "   +0.4732 if cp<=0.04164111316204072\n",
      "   -0.9258 if cp<=-0.05803776532411575\n",
      "   -0.0915 if cp<=-0.0019791558384895306 & cp>=-0.07214042842388153\n",
      "   -4.6827 if cv>=0.0032726963050663505\n",
      "Run episode 392 with rewards 30.0\n",
      "============ 393 ===========\n",
      "77 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -1.8592 if \n",
      "   -1.8592 if cp<=0.035158231109380725\n",
      "   +0.0000 if cp<=-0.07161058485507965\n",
      "   +5.1628 if cv>=-0.006005787011235947\n",
      "   +0.1347 if cp<=-0.04039113074541091\n",
      "--------------\n",
      "   +2.1824 if cp<=0.08511115610599519\n",
      "   +2.1824 if cp<=0.04164111316204072\n",
      "   -2.6064 if cp<=-0.05803776532411575\n",
      "   -6.3951 if cv>=0.0032726963050663505\n",
      "   -1.7891 if cv>=-0.1713063508272171\n",
      "Run episode 393 with rewards 77.0\n",
      "============ 394 ===========\n",
      "29 actions [0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -1.9742 if \n",
      "   -1.9742 if cp<=0.035158231109380725\n",
      "   +6.9712 if cv>=-0.006005787011235947\n",
      "   -1.9603 if cp<=-0.04039113074541091\n",
      "   +0.4525 if cp>=-0.07967990785837173 & cv<=0.027285762876272206\n",
      "--------------\n",
      "   +1.2080 if cp<=0.08511115610599519\n",
      "   +1.2080 if cp<=0.04164111316204072\n",
      "   +0.8455 if cp<=-0.05803776532411575\n",
      "   -6.3128 if cv>=0.0032726963050663505\n",
      "   -1.9191 if pav<=-0.04228796362876886\n",
      "Run episode 394 with rewards 29.0\n",
      "============ 395 ===========\n",
      "27 actions [0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -1.3958 if \n",
      "   -1.3958 if cp<=0.035158231109380725\n",
      "   +5.8310 if cv>=-0.006005787011235947\n",
      "   -3.2990 if cp<=-0.04039113074541091\n",
      "   +1.4223 if cp>=-0.03484929278492928 & cv<=0.002189529081806547\n",
      "--------------\n",
      "   +1.4570 if cp<=0.08511115610599519\n",
      "   +1.4570 if cp<=0.04164111316204072\n",
      "   -3.7933 if cv>=0.0032726963050663505\n",
      "   -1.6424 if pav<=-0.04228796362876886\n",
      "   -1.9833 if cp>=-0.03484929278492928\n",
      "Run episode 395 with rewards 27.0\n",
      "============ 396 ===========\n",
      "30 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -0.5945 if cp<=0.035158231109380725\n",
      "   +2.2715 if cv>=-0.006005787011235947\n",
      "   -0.0001 if cp<=-0.04039113074541091\n",
      "   -3.7739 if cp>=-0.03484929278492928 & cv<=0.002189529081806547\n",
      "   +5.2463 if cp<=0.04512087628245354 & cp>=0.03134352266788483 & cv<=0.01739900633692742 & pav<=0.45145429372787477\n",
      "--------------\n",
      "   +2.3391 if cp<=0.04164111316204072\n",
      "   -2.1356 if cv>=0.0032726963050663505\n",
      "   -0.0000 if pav<=-0.04228796362876886\n",
      "   -1.6228 if cp>=-0.03484929278492928\n",
      "   +5.2710 if cp>=0.04512087628245354 & cv<=0.01739900633692742\n",
      "Run episode 396 with rewards 30.0\n",
      "============ 397 ===========\n",
      "35 actions [1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0]\n",
      "   -1.8522 if cp<=0.035158231109380725\n",
      "   +3.8788 if cv>=-0.006005787011235947\n",
      "   -1.7862 if cp>=-0.03484929278492928 & cv<=0.002189529081806547\n",
      "   -0.0000 if cp<=0.04512087628245354 & cp>=0.03134352266788483 & cv<=0.01739900633692742 & pav<=0.45145429372787477\n",
      "   -2.8782 if pa>=0.06703887581825256 & pav<=0.37684307098388675\n",
      "--------------\n",
      "   +3.1099 if cp<=0.04164111316204072\n",
      "   -3.2805 if cv>=0.0032726963050663505\n",
      "   +0.9476 if cp>=-0.03484929278492928\n",
      "   -0.0000 if cp>=0.04512087628245354 & cv<=0.01739900633692742\n",
      "   +4.8258 if cp<=-0.0399047426879406 & pa>=0.07637757211923599\n",
      "Run episode 397 with rewards 35.0\n",
      "============ 398 ===========\n",
      "26 actions [1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0]\n",
      "   -1.1994 if cp<=0.035158231109380725\n",
      "   +1.6230 if cv>=-0.006005787011235947\n",
      "   -0.2881 if cp>=-0.03484929278492928 & cv<=0.002189529081806547\n",
      "   +0.0001 if pa>=0.06703887581825256 & pav<=0.37684307098388675\n",
      "   +2.5297 if cp<=0.03783386647701263 & cv>=0.17730991244316102\n",
      "--------------\n",
      "   +2.9195 if cp<=0.04164111316204072\n",
      "   -1.6156 if cv>=0.0032726963050663505\n",
      "   +1.1608 if cp>=-0.03484929278492928\n",
      "   +0.0000 if cp<=-0.0399047426879406 & pa>=0.07637757211923599\n",
      "   -2.5972 if cv>=0.17730991244316102\n",
      "Run episode 398 with rewards 26.0\n",
      "============ 399 ===========\n",
      "27 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1]\n",
      "   -0.0207 if cp<=0.035158231109380725\n",
      "   +0.8151 if cv>=-0.006005787011235947\n",
      "   -0.8358 if cp>=-0.03484929278492928 & cv<=0.002189529081806547\n",
      "   +3.5945 if cp<=0.03783386647701263 & cv>=0.17730991244316102\n",
      "   +4.3414 if cv<=0.018969770520925522 & cv>=0.018969770520925522\n",
      "--------------\n",
      "   +1.3184 if cp<=0.04164111316204072\n",
      "   -0.5484 if cv>=0.0032726963050663505\n",
      "   +1.3184 if cp>=-0.03484929278492928\n",
      "   -3.6431 if cv>=0.17730991244316102\n",
      "   -4.3370 if cv<=0.018969770520925522 & cv>=0.018969770520925522\n",
      "Run episode 399 with rewards 27.0\n",
      "============ 400 ===========\n",
      "54 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0]\n",
      "   +1.3455 if cv>=-0.006005787011235947\n",
      "   -1.2499 if cp>=-0.03484929278492928 & cv<=0.002189529081806547\n",
      "   +2.3134 if cp<=0.03783386647701263 & cv>=0.17730991244316102\n",
      "   -0.0000 if cv<=0.018969770520925522 & cv>=0.018969770520925522\n",
      "   -3.7086 if cp<=0.0024102717638015752 & pav>=-0.09590193629264829\n",
      "--------------\n",
      "   +2.1971 if cp<=0.04164111316204072\n",
      "   +2.1971 if cp>=-0.03484929278492928\n",
      "   -4.5396 if cv>=0.17730991244316102\n",
      "   +0.0000 if cv<=0.018969770520925522 & cv>=0.018969770520925522\n",
      "   -3.0924 if cp>=0.0024102717638015752 & cv<=0.23597658574581146\n",
      "Run episode 400 with rewards 54.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 401 ===========\n",
      "41 actions [1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +2.0168 if cv>=-0.006005787011235947\n",
      "   -2.5304 if cp>=-0.03484929278492928 & cv<=0.002189529081806547\n",
      "   +3.0174 if cp<=0.03783386647701263 & cv>=0.17730991244316102\n",
      "   -2.3073 if cp<=0.0024102717638015752 & pav>=-0.09590193629264829\n",
      "   -5.2568 if cp<=0.020045047998428347 & cv>=-0.15370164215564727 & pav<=-0.01035560145974157 & pav>=-0.10891051739454269\n",
      "--------------\n",
      "   +0.5235 if cp<=0.04164111316204072\n",
      "   +0.5235 if cp>=-0.03484929278492928\n",
      "   -4.5238 if cv>=0.17730991244316102\n",
      "   -0.0355 if cp>=0.0024102717638015752 & cv<=0.23597658574581146\n",
      "   +1.7694 if cp<=0.01561872959136963\n",
      "Run episode 401 with rewards 41.0\n",
      "============ 402 ===========\n",
      "12 actions [1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   -4.3464 if cp>=-0.03484929278492928 & cv<=0.002189529081806547\n",
      "   +2.2056 if cp<=0.03783386647701263 & cv>=0.17730991244316102\n",
      "   -0.0000 if cp<=0.0024102717638015752 & pav>=-0.09590193629264829\n",
      "   -0.0001 if cp<=0.020045047998428347 & cv>=-0.15370164215564727 & pav<=-0.01035560145974157 & pav>=-0.10891051739454269\n",
      "   +2.3474 if cv>=0.15168578922748566 & pav>=-0.3281581997871399\n",
      "--------------\n",
      "   +0.7634 if cp<=0.04164111316204072\n",
      "   +0.5540 if cp>=-0.03484929278492928\n",
      "   -3.1652 if cv>=0.17730991244316102\n",
      "   +2.9366 if cp<=0.01561872959136963\n",
      "   -5.1985 if pa>=0.03088420443236828\n",
      "Run episode 402 with rewards 12.0\n",
      "============ 403 ===========\n",
      "11 actions [0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0]\n",
      "   -1.3804 if cp>=-0.03484929278492928 & cv<=0.002189529081806547\n",
      "   -0.4649 if cp<=0.03783386647701263 & cv>=0.17730991244316102\n",
      "   -1.3804 if cp<=0.020045047998428347 & cv>=-0.15370164215564727 & pav<=-0.01035560145974157 & pav>=-0.10891051739454269\n",
      "   +0.0000 if cv>=0.15168578922748566 & pav>=-0.3281581997871399\n",
      "   +3.2502 if cv<=0.19198768138885497\n",
      "--------------\n",
      "   -0.7237 if cp<=0.04164111316204072\n",
      "   -0.6110 if cv>=0.17730991244316102\n",
      "   +1.6928 if cp<=0.01561872959136963\n",
      "   -0.0000 if pa>=0.03088420443236828\n",
      "   +3.4589 if cv>=0.19198768138885497\n",
      "Run episode 403 with rewards 11.0\n",
      "============ 404 ===========\n",
      "13 actions [0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1]\n",
      "   -0.4886 if cp>=-0.03484929278492928 & cv<=0.002189529081806547\n",
      "   -0.0000 if cp<=0.03783386647701263 & cv>=0.17730991244316102\n",
      "   -0.0000 if cp<=0.020045047998428347 & cv>=-0.15370164215564727 & pav<=-0.01035560145974157 & pav>=-0.10891051739454269\n",
      "   +1.4828 if cv<=0.19198768138885497\n",
      "   +2.8211 if cv>=-0.6252917647361755\n",
      "--------------\n",
      "   +0.3380 if cp<=0.04164111316204072\n",
      "   -0.0000 if cv>=0.17730991244316102\n",
      "   +1.3940 if cp<=0.01561872959136963\n",
      "   -0.0000 if cv>=0.19198768138885497\n",
      "   -2.8155 if cv>=-0.6252917647361755\n",
      "Run episode 404 with rewards 13.0\n",
      "============ 405 ===========\n",
      "12 actions [0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0]\n",
      "   -0.8172 if cp>=-0.03484929278492928 & cv<=0.002189529081806547\n",
      "   +0.4693 if cp<=0.020045047998428347 & cv>=-0.15370164215564727 & pav<=-0.01035560145974157 & pav>=-0.10891051739454269\n",
      "   +0.8369 if cv<=0.19198768138885497\n",
      "   +2.7658 if cv>=-0.6252917647361755\n",
      "   +3.0203 if cp<=-0.02404255308210848 & cv<=-0.7451942205429075 & cv>=-0.7863846540451049\n",
      "--------------\n",
      "   +0.8487 if cp<=0.04164111316204072\n",
      "   +0.8487 if cp<=0.01561872959136963\n",
      "   -0.0000 if cv>=0.19198768138885497\n",
      "   -2.1188 if cv>=-0.6252917647361755\n",
      "   -1.2754 if cp<=-0.05857237428426741\n",
      "Run episode 405 with rewards 12.0\n",
      "============ 406 ===========\n",
      "22 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0]\n",
      "   -3.7348 if cp>=-0.03484929278492928 & cv<=0.002189529081806547\n",
      "   -0.4811 if cv<=0.19198768138885497\n",
      "   +2.7093 if cv>=-0.6252917647361755\n",
      "   +2.8568 if cp<=-0.02404255308210848 & cv<=-0.7451942205429075 & cv>=-0.7863846540451049\n",
      "   +3.2295 if cp>=-0.028355496004223824\n",
      "--------------\n",
      "   +1.0157 if cp<=0.04164111316204072\n",
      "   +1.0157 if cp<=0.01561872959136963\n",
      "   +0.6446 if cv>=-0.6252917647361755\n",
      "   +0.3711 if cp<=-0.05857237428426741\n",
      "   -2.7646 if cv>=-0.2168764531612395\n",
      "Run episode 406 with rewards 22.0\n",
      "============ 407 ===========\n",
      "17 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1]\n",
      "   -2.2796 if cp>=-0.03484929278492928 & cv<=0.002189529081806547\n",
      "   +2.0023 if cv>=-0.6252917647361755\n",
      "   +0.0000 if cp<=-0.02404255308210848 & cv<=-0.7451942205429075 & cv>=-0.7863846540451049\n",
      "   -0.6164 if cp>=-0.028355496004223824\n",
      "   +4.6706 if cp>=-0.04872879832983017 & cv>=-0.20927202105522155\n",
      "--------------\n",
      "   +0.8966 if cp<=0.04164111316204072\n",
      "   +1.8444 if cp<=0.01561872959136963\n",
      "   +0.8966 if cv>=-0.6252917647361755\n",
      "   -6.0829 if cv>=-0.2168764531612395\n",
      "   +1.1712 if cp>=0.001866795495152479\n",
      "Run episode 407 with rewards 17.0\n",
      "============ 408 ===========\n",
      "32 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0]\n",
      "   -0.3666 if cp>=-0.03484929278492928 & cv<=0.002189529081806547\n",
      "   +0.8486 if cv>=-0.6252917647361755\n",
      "   -0.5056 if cp>=-0.028355496004223824\n",
      "   +2.3705 if cp>=-0.04872879832983017 & cv>=-0.20927202105522155\n",
      "   +2.7016 if cp<=-0.06992651075124741 & cv<=-0.40823468565940857\n",
      "--------------\n",
      "   +1.9081 if cp<=0.01561872959136963\n",
      "   +1.9081 if cv>=-0.6252917647361755\n",
      "   -4.5713 if cv>=-0.2168764531612395\n",
      "   -0.3586 if cp>=0.001866795495152479\n",
      "   -2.1363 if cp<=-0.06992651075124741 & cv<=-0.40823468565940857\n",
      "Run episode 408 with rewards 32.0\n",
      "============ 409 ===========\n",
      "15 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1]\n",
      "   +0.7961 if cv>=-0.6252917647361755\n",
      "   -1.2726 if cp>=-0.028355496004223824\n",
      "   +6.4105 if cp>=-0.04872879832983017 & cv>=-0.20927202105522155\n",
      "   +0.2800 if cp<=-0.06992651075124741 & cv<=-0.40823468565940857\n",
      "   -2.3400 if cp>=-0.055509365350008014 & cv>=-0.0550266645848751\n",
      "--------------\n",
      "   +2.5398 if cp<=0.01561872959136963\n",
      "   +1.5632 if cv>=-0.6252917647361755\n",
      "   -6.2307 if cv>=-0.2168764531612395\n",
      "   -0.0852 if cp<=-0.06992651075124741 & cv<=-0.40823468565940857\n",
      "   +3.6966 if cp<=-0.043363699316978456 & cv<=-0.0440541535615921 & cv>=-0.0550266645848751\n",
      "Run episode 409 with rewards 15.0\n",
      "============ 410 ===========\n",
      "27 actions [0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +1.1945 if cv>=-0.6252917647361755\n",
      "   -0.0000 if cp>=-0.028355496004223824\n",
      "   +0.9451 if cp>=-0.04872879832983017 & cv>=-0.20927202105522155\n",
      "   +0.3964 if cp>=-0.055509365350008014 & cv>=-0.0550266645848751\n",
      "   +2.7592 if cp<=-0.0961535781621933\n",
      "--------------\n",
      "   +1.6123 if cp<=0.01561872959136963\n",
      "   +1.6123 if cv>=-0.6252917647361755\n",
      "   -5.2699 if cv>=-0.2168764531612395\n",
      "   -0.0000 if cp<=-0.043363699316978456 & cv<=-0.0440541535615921 & cv>=-0.0550266645848751\n",
      "   -0.3640 if cp<=-0.06603465527296065\n",
      "Run episode 410 with rewards 27.0\n",
      "============ 411 ===========\n",
      "27 actions [0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   +1.5692 if cv>=-0.6252917647361755\n",
      "   +0.9634 if cp>=-0.04872879832983017 & cv>=-0.20927202105522155\n",
      "   +1.0777 if cp>=-0.055509365350008014 & cv>=-0.0550266645848751\n",
      "   +0.0000 if cp<=-0.0961535781621933\n",
      "   -2.9810 if cp>=0.011240015178918842 & cv<=-0.2459404230117798\n",
      "--------------\n",
      "   +2.5233 if cp<=0.01561872959136963\n",
      "   +1.9129 if cv>=-0.6252917647361755\n",
      "   -5.8551 if cv>=-0.2168764531612395\n",
      "   -0.0000 if cp<=-0.06603465527296065\n",
      "   -3.5976 if cp>=-0.025784768909215924 & cv<=-0.23421481847763062 & cv>=-0.2459404230117798\n",
      "Run episode 411 with rewards 27.0\n",
      "============ 412 ===========\n",
      "19 actions [0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1]\n",
      "   +0.9431 if cv>=-0.6252917647361755\n",
      "   +0.9141 if cp>=-0.04872879832983017 & cv>=-0.20927202105522155\n",
      "   -2.0923 if cp>=-0.055509365350008014 & cv>=-0.0550266645848751\n",
      "   -0.0000 if cp>=0.011240015178918842 & cv<=-0.2459404230117798\n",
      "   -5.5879 if cv<=-0.17461458444595337 & pav<=0.24383857548236848\n",
      "--------------\n",
      "   +3.3154 if cp<=0.01561872959136963\n",
      "   +3.3154 if cv>=-0.6252917647361755\n",
      "   -5.2054 if cv>=-0.2168764531612395\n",
      "   -0.0000 if cp>=-0.025784768909215924 & cv<=-0.23421481847763062 & cv>=-0.2459404230117798\n",
      "   -1.9747 if cp<=-0.03568050637841224 & cv<=-0.17790853083133698\n",
      "Run episode 412 with rewards 19.0\n",
      "============ 413 ===========\n",
      "31 actions [0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +3.7388 if cv>=-0.6252917647361755\n",
      "   +0.8868 if cp>=-0.04872879832983017 & cv>=-0.20927202105522155\n",
      "   +0.8868 if cp>=-0.055509365350008014 & cv>=-0.0550266645848751\n",
      "   -0.0000 if cv<=-0.17461458444595337 & pav<=0.24383857548236848\n",
      "   -3.2009 if cv<=-0.2201950430870056\n",
      "--------------\n",
      "   +0.9567 if cp<=0.01561872959136963\n",
      "   +0.9567 if cv>=-0.6252917647361755\n",
      "   -5.8196 if cv>=-0.2168764531612395\n",
      "   +2.5667 if cp<=-0.03568050637841224 & cv<=-0.17790853083133698\n",
      "   -1.2130 if cv>=-0.08040570542216288\n",
      "Run episode 413 with rewards 31.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 414 ===========\n",
      "35 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1]\n",
      "   +0.6875 if cv>=-0.6252917647361755\n",
      "   +0.4065 if cp>=-0.04872879832983017 & cv>=-0.20927202105522155\n",
      "   +0.4544 if cp>=-0.055509365350008014 & cv>=-0.0550266645848751\n",
      "   +0.1203 if cv<=-0.2201950430870056\n",
      "   -3.4186 if cp>=-0.040320660918951035 & cv>=-0.23030851781368256 & pav>=0.2925656735897064\n",
      "--------------\n",
      "   +2.2335 if cp<=0.01561872959136963\n",
      "   -1.8833 if cv>=-0.2168764531612395\n",
      "   +2.1952 if cp<=-0.03568050637841224 & cv<=-0.17790853083133698\n",
      "   -1.8833 if cv>=-0.08040570542216288\n",
      "   +1.4116 if cv>=-0.23030851781368256\n",
      "Run episode 414 with rewards 35.0\n",
      "============ 415 ===========\n",
      "43 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0]\n",
      "   +0.7733 if cv>=-0.6252917647361755\n",
      "   +1.5550 if cp>=-0.04872879832983017 & cv>=-0.20927202105522155\n",
      "   +2.9567 if cp>=-0.055509365350008014 & cv>=-0.0550266645848751\n",
      "   -0.0000 if cp>=-0.040320660918951035 & cv>=-0.23030851781368256 & pav>=0.2925656735897064\n",
      "   -6.1775 if pa>=-0.030136505141854286\n",
      "--------------\n",
      "   +3.8216 if cp<=0.01561872959136963\n",
      "   -1.2933 if cv>=-0.2168764531612395\n",
      "   +2.9170 if cp<=-0.03568050637841224 & cv<=-0.17790853083133698\n",
      "   -3.4090 if cv>=-0.08040570542216288\n",
      "   +4.6553 if pa>=-0.030136505141854286\n",
      "Run episode 415 with rewards 43.0\n",
      "============ 416 ===========\n",
      "41 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0]\n",
      "   +3.6999 if cv>=-0.6252917647361755\n",
      "   -0.6147 if cp>=-0.04872879832983017 & cv>=-0.20927202105522155\n",
      "   +0.4926 if cp>=-0.055509365350008014 & cv>=-0.0550266645848751\n",
      "   -3.7508 if pa>=-0.030136505141854286\n",
      "   -1.1731 if \n",
      "--------------\n",
      "   +3.2522 if cp<=0.01561872959136963\n",
      "   +1.1864 if cp<=-0.03568050637841224 & cv<=-0.17790853083133698\n",
      "   -1.5509 if cv>=-0.08040570542216288\n",
      "   +2.8150 if pa>=-0.030136505141854286\n",
      "   -3.1321 if cp>=0.01727009303867821 & cv<=-0.11352295279502869 & cv>=-0.5109813451766968 & pa<=-0.03632425293326377\n",
      "Run episode 416 with rewards 41.0\n",
      "============ 417 ===========\n",
      "43 actions [0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0]\n",
      "   +5.1303 if cv>=-0.6252917647361755\n",
      "   +1.6197 if cp>=-0.04872879832983017 & cv>=-0.20927202105522155\n",
      "   -4.2004 if pa>=-0.030136505141854286\n",
      "   -2.8265 if \n",
      "   -4.6015 if cv<=-0.19501404464244843 & pa>=-0.06241026520729064\n",
      "--------------\n",
      "   +4.4498 if cp<=0.01561872959136963\n",
      "   -4.6706 if cv>=-0.08040570542216288\n",
      "   +3.7754 if pa>=-0.030136505141854286\n",
      "   -1.9034 if cp>=0.01727009303867821 & cv<=-0.11352295279502869 & cv>=-0.5109813451766968 & pa<=-0.03632425293326377\n",
      "   +2.2738 if pav>=0.9239763021469116\n",
      "Run episode 417 with rewards 43.0\n",
      "============ 418 ===========\n",
      "93 actions [0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +1.3093 if cv>=-0.6252917647361755\n",
      "   -1.4789 if pa>=-0.030136505141854286\n",
      "   +1.3093 if \n",
      "   -5.6111 if cv<=-0.19501404464244843 & pa>=-0.06241026520729064\n",
      "   -2.3893 if pav>=0.40491151809692383\n",
      "--------------\n",
      "   +5.7036 if cp<=0.01561872959136963\n",
      "   -5.8416 if cv>=-0.08040570542216288\n",
      "   +2.8193 if pa>=-0.030136505141854286\n",
      "   -0.0000 if pav>=0.9239763021469116\n",
      "   -1.4922 if cp>=0.025516934692859657 & pa<=-0.05377823412418365 & pav>=-0.004281467944383572\n",
      "Run episode 418 with rewards 93.0\n",
      "============ 419 ===========\n",
      "29 actions [0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1]\n",
      "   -1.1682 if pa>=-0.030136505141854286\n",
      "   +3.2740 if \n",
      "   -2.8671 if cv<=-0.19501404464244843 & pa>=-0.06241026520729064\n",
      "   -4.6509 if pav>=0.40491151809692383\n",
      "   -5.2273 if cp<=0.03783285915851593 & cp>=0.022212772816419604 & cv<=0.041210611909627916 & pa<=0.004101862479001286\n",
      "--------------\n",
      "   +5.6364 if cp<=0.01561872959136963\n",
      "   -6.7886 if cv>=-0.08040570542216288\n",
      "   +3.1388 if pa>=-0.030136505141854286\n",
      "   -0.0000 if cp>=0.025516934692859657 & pa<=-0.05377823412418365 & pav>=-0.004281467944383572\n",
      "   -5.3999 if cp<=0.022212772816419604 & cp>=0.013451980240643027 & cv<=-0.15052068531513213 & pav<=0.23156238794326783\n",
      "Run episode 419 with rewards 29.0\n",
      "============ 420 ===========\n",
      "26 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1]\n",
      "   +3.0487 if \n",
      "   -0.4537 if cv<=-0.19501404464244843 & pa>=-0.06241026520729064\n",
      "   -5.0549 if pav>=0.40491151809692383\n",
      "   +0.0000 if cp<=0.03783285915851593 & cp>=0.022212772816419604 & cv<=0.041210611909627916 & pa<=0.004101862479001286\n",
      "   -3.0907 if cp>=0.04576713591814041\n",
      "--------------\n",
      "   +2.9615 if cp<=0.01561872959136963\n",
      "   -4.1149 if cv>=-0.08040570542216288\n",
      "   +2.1012 if pa>=-0.030136505141854286\n",
      "   -0.0000 if cp<=0.022212772816419604 & cp>=0.013451980240643027 & cv<=-0.15052068531513213 & pav<=0.23156238794326783\n",
      "   +3.1616 if cp>=0.04576713591814041\n",
      "Run episode 420 with rewards 26.0\n",
      "============ 421 ===========\n",
      "36 actions [0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   +1.8162 if \n",
      "   -1.5805 if cv<=-0.19501404464244843 & pa>=-0.06241026520729064\n",
      "   -3.6830 if pav>=0.40491151809692383\n",
      "   -0.0000 if cp>=0.04576713591814041\n",
      "   +3.8360 if cv>=-0.0331319123506546 & pa<=0.12608087062835696\n",
      "--------------\n",
      "   +4.0288 if cp<=0.01561872959136963\n",
      "   -5.8733 if cv>=-0.08040570542216288\n",
      "   +4.0288 if pa>=-0.030136505141854286\n",
      "   +0.0000 if cp>=0.04576713591814041\n",
      "   -2.5357 if cp>=-0.08032147586345673\n",
      "Run episode 421 with rewards 36.0\n",
      "============ 422 ===========\n",
      "28 actions [0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +3.8648 if \n",
      "   -3.4020 if cv<=-0.19501404464244843 & pa>=-0.06241026520729064\n",
      "   -3.2650 if pav>=0.40491151809692383\n",
      "   +1.3638 if cv>=-0.0331319123506546 & pa<=0.12608087062835696\n",
      "   -2.9299 if cp>=0.024207504466176033 & cv<=-0.01504175923764704 & pav<=0.2671926021575928\n",
      "--------------\n",
      "   +1.6655 if cp<=0.01561872959136963\n",
      "   -5.0134 if cv>=-0.08040570542216288\n",
      "   +0.9011 if pa>=-0.030136505141854286\n",
      "   +0.9011 if cp>=-0.08032147586345673\n",
      "   -3.3027 if cp>=0.05022110044956207\n",
      "Run episode 422 with rewards 28.0\n",
      "============ 423 ===========\n",
      "56 actions [0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +2.7979 if \n",
      "   -3.5268 if cv<=-0.19501404464244843 & pa>=-0.06241026520729064\n",
      "   -0.8841 if pav>=0.40491151809692383\n",
      "   +0.0000 if cp>=0.024207504466176033 & cv<=-0.01504175923764704 & pav<=0.2671926021575928\n",
      "   +6.4005 if cp>=0.003799381013959653 & pav>=0.3350503623485565\n",
      "--------------\n",
      "   -0.0189 if cp<=0.01561872959136963\n",
      "   -4.9473 if cv>=-0.08040570542216288\n",
      "   +3.4005 if pa>=-0.030136505141854286\n",
      "   -0.0000 if cp>=0.05022110044956207\n",
      "   -5.3251 if cp>=0.003799381013959653 & pav>=0.3350503623485565\n",
      "Run episode 423 with rewards 56.0\n",
      "============ 424 ===========\n",
      "22 actions [0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +5.8580 if \n",
      "   -4.5716 if cv<=-0.19501404464244843 & pa>=-0.06241026520729064\n",
      "   -2.4557 if pav>=0.40491151809692383\n",
      "   -0.0000 if cp>=0.003799381013959653 & pav>=0.3350503623485565\n",
      "   -2.1394 if cv>=-0.21263043582439423\n",
      "--------------\n",
      "   -3.4330 if cp<=0.01561872959136963\n",
      "   -6.6765 if cv>=-0.08040570542216288\n",
      "   +5.1620 if pa>=-0.030136505141854286\n",
      "   +0.0000 if cp>=0.003799381013959653 & pav>=0.3350503623485565\n",
      "   +2.1362 if cv>=-0.21263043582439423\n",
      "Run episode 424 with rewards 22.0\n",
      "============ 425 ===========\n",
      "11 actions [0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1]\n",
      "   +3.0400 if \n",
      "   +1.0573 if cv<=-0.19501404464244843 & pa>=-0.06241026520729064\n",
      "   -3.5841 if pav>=0.40491151809692383\n",
      "   +1.9827 if cv>=-0.21263043582439423\n",
      "   -2.1138 if cv>=-0.16294299960136413 & pa<=0.05562272146344185\n",
      "--------------\n",
      "   +1.4534 if cp<=0.01561872959136963\n",
      "   -5.0915 if cv>=-0.08040570542216288\n",
      "   +1.4534 if pa>=-0.030136505141854286\n",
      "   +1.6639 if cv>=-0.21263043582439423\n",
      "   -3.4893 if cp>=-0.03024218529462814 & pa>=0.05562272146344185\n",
      "Run episode 425 with rewards 11.0\n",
      "============ 426 ===========\n",
      "24 actions [0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +1.9783 if \n",
      "   -1.2612 if pav>=0.40491151809692383\n",
      "   +3.2395 if cv>=-0.21263043582439423\n",
      "   +0.0226 if cv>=-0.16294299960136413 & pa<=0.05562272146344185\n",
      "   -1.0379 if cp<=0.031134653836488724\n",
      "--------------\n",
      "   +1.8096 if cp<=0.01561872959136963\n",
      "   -0.8497 if cv>=-0.08040570542216288\n",
      "   -1.1021 if cv>=-0.21263043582439423\n",
      "   -1.7353 if cp>=-0.03024218529462814 & pa>=0.05562272146344185\n",
      "   +1.3145 if cp>=0.019903704524040226\n",
      "Run episode 426 with rewards 24.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 427 ===========\n",
      "18 actions [0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +1.8324 if \n",
      "   -2.7150 if pav>=0.40491151809692383\n",
      "   +4.1359 if cv>=-0.21263043582439423\n",
      "   +1.8324 if cp<=0.031134653836488724\n",
      "   -4.1571 if cp<=-0.029710795730352384 & pav<=0.4057833790779114\n",
      "--------------\n",
      "   +3.4123 if cp<=0.01561872959136963\n",
      "   -3.5996 if cv>=-0.21263043582439423\n",
      "   -0.0000 if cp>=-0.03024218529462814 & pa>=0.05562272146344185\n",
      "   -0.0000 if cp>=0.019903704524040226\n",
      "   -6.6937 if cp>=-0.029710795730352384 & cv<=-0.029697448015213006 & pav<=0.6635422229766847\n",
      "Run episode 427 with rewards 18.0\n",
      "============ 428 ===========\n",
      "22 actions [0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.6852 if \n",
      "   -0.8608 if pav>=0.40491151809692383\n",
      "   +3.0704 if cv>=-0.21263043582439423\n",
      "   +0.5866 if cp<=-0.029710795730352384 & pav<=0.4057833790779114\n",
      "   +0.8442 if cp>=-0.0043625675782095474 & cv<=-0.20490638613700865 & cv>=-0.3839738488197327\n",
      "--------------\n",
      "   +3.6069 if cp<=0.01561872959136963\n",
      "   -2.9859 if cv>=-0.21263043582439423\n",
      "   +0.0000 if cp>=-0.03024218529462814 & pa>=0.05562272146344185\n",
      "   -5.3422 if cp>=-0.029710795730352384 & cv<=-0.029697448015213006 & pav<=0.6635422229766847\n",
      "   -0.0002 if cp>=0.01166258379817009\n",
      "Run episode 428 with rewards 22.0\n",
      "============ 429 ===========\n",
      "31 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.9522 if \n",
      "   -1.2539 if pav>=0.40491151809692383\n",
      "   +3.8960 if cv>=-0.21263043582439423\n",
      "   -3.9969 if cp>=-0.0043625675782095474 & cv<=-0.20490638613700865 & cv>=-0.3839738488197327\n",
      "   -3.9090 if cp>=-0.00970416776835918 & cv<=-0.17072314620018006 & cv>=-0.3531870424747467\n",
      "--------------\n",
      "   +2.6943 if cp<=0.01561872959136963\n",
      "   -3.0739 if cv>=-0.21263043582439423\n",
      "   -4.2340 if cp>=-0.029710795730352384 & cv<=-0.029697448015213006 & pav<=0.6635422229766847\n",
      "   +0.0000 if cp>=0.01166258379817009\n",
      "   +4.9126 if cp>=-0.00970416776835918 & cv<=-0.17072314620018006\n",
      "Run episode 429 with rewards 31.0\n",
      "============ 430 ===========\n",
      "19 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -2.3006 if pav>=0.40491151809692383\n",
      "   +3.6088 if cv>=-0.21263043582439423\n",
      "   -1.8242 if cp>=-0.0043625675782095474 & cv<=-0.20490638613700865 & cv>=-0.3839738488197327\n",
      "   -1.8242 if cp>=-0.00970416776835918 & cv<=-0.17072314620018006 & cv>=-0.3531870424747467\n",
      "   -0.8233 if pav<=0.37351378798484813\n",
      "--------------\n",
      "   +1.8291 if cp<=0.01561872959136963\n",
      "   -3.3967 if cv>=-0.21263043582439423\n",
      "   -2.9041 if cp>=-0.029710795730352384 & cv<=-0.029697448015213006 & pav<=0.6635422229766847\n",
      "   +0.2068 if cp>=-0.00970416776835918 & cv<=-0.17072314620018006\n",
      "   +3.1254 if cv>=-0.25188755989074707\n",
      "Run episode 430 with rewards 19.0\n",
      "============ 431 ===========\n",
      "28 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -1.6188 if pav>=0.40491151809692383\n",
      "   +4.9129 if cv>=-0.21263043582439423\n",
      "   -3.9973 if cp>=-0.0043625675782095474 & cv<=-0.20490638613700865 & cv>=-0.3839738488197327\n",
      "   +0.2396 if cp>=-0.00970416776835918 & cv<=-0.17072314620018006 & cv>=-0.3531870424747467\n",
      "   -0.6619 if cp>=0.02444547899067402\n",
      "--------------\n",
      "   +0.9330 if cp<=0.01561872959136963\n",
      "   -1.9735 if cv>=-0.21263043582439423\n",
      "   +0.2680 if cp>=-0.029710795730352384 & cv<=-0.029697448015213006 & pav<=0.6635422229766847\n",
      "   -1.9735 if cv>=-0.25188755989074707\n",
      "   -0.7425 if cv>=-0.38140528798103335 & pav<=0.6044306874275208\n",
      "Run episode 431 with rewards 28.0\n",
      "============ 432 ===========\n",
      "26 actions [0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0]\n",
      "   -3.0518 if pav>=0.40491151809692383\n",
      "   +2.9211 if cv>=-0.21263043582439423\n",
      "   +0.0000 if cp>=-0.0043625675782095474 & cv<=-0.20490638613700865 & cv>=-0.3839738488197327\n",
      "   +0.0000 if cp>=0.02444547899067402\n",
      "   -0.8923 if cp>=-0.07649402171373366\n",
      "--------------\n",
      "   +3.1071 if cp<=0.01561872959136963\n",
      "   -1.4663 if cv>=-0.21263043582439423\n",
      "   -1.4663 if cv>=-0.25188755989074707\n",
      "   -1.3231 if cv>=-0.38140528798103335 & pav<=0.6044306874275208\n",
      "   -0.2052 if cv>=-0.3831693470478058\n",
      "Run episode 432 with rewards 26.0\n",
      "============ 433 ===========\n",
      "22 actions [0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1]\n",
      "   +1.0151 if pav>=0.40491151809692383\n",
      "   +0.3746 if cv>=-0.21263043582439423\n",
      "   -3.3669 if cp>=-0.0043625675782095474 & cv<=-0.20490638613700865 & cv>=-0.3839738488197327\n",
      "   -3.1634 if cp>=-0.07649402171373366\n",
      "   +2.8103 if pav<=0.32987090945243835\n",
      "--------------\n",
      "   +3.3875 if cp<=0.01561872959136963\n",
      "   -1.0051 if cv>=-0.21263043582439423\n",
      "   -1.0051 if cv>=-0.25188755989074707\n",
      "   -0.0569 if cv>=-0.38140528798103335 & pav<=0.6044306874275208\n",
      "   -3.5937 if cp<=0.02586142159998417 & cv>=0.0071222675032913685\n",
      "Run episode 433 with rewards 22.0\n",
      "============ 434 ===========\n",
      "42 actions [1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1]\n",
      "   -1.3159 if pav>=0.40491151809692383\n",
      "   -2.4732 if cp>=-0.0043625675782095474 & cv<=-0.20490638613700865 & cv>=-0.3839738488197327\n",
      "   -0.1330 if cp>=-0.07649402171373366\n",
      "   +5.9699 if pav<=0.32987090945243835\n",
      "   -4.1321 if pav<=0.38094785809516907\n",
      "--------------\n",
      "   +4.9339 if cp<=0.01561872959136963\n",
      "   -2.2431 if cv>=-0.21263043582439423\n",
      "   -2.2431 if cv>=-0.25188755989074707\n",
      "   -2.5382 if cp<=0.02586142159998417 & cv>=0.0071222675032913685\n",
      "   +3.3049 if cp>=0.03322835490107536 & cv<=-0.058255794830620045 & pav<=0.38094785809516907\n",
      "Run episode 434 with rewards 42.0\n",
      "============ 435 ===========\n",
      "21 actions [0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -0.5061 if pav>=0.40491151809692383\n",
      "   -0.0000 if cp>=-0.0043625675782095474 & cv<=-0.20490638613700865 & cv>=-0.3839738488197327\n",
      "   +2.8358 if pav<=0.32987090945243835\n",
      "   -0.4637 if pav<=0.38094785809516907\n",
      "   -2.0616 if cv<=0.11150049269199437 & cv>=-0.03321457430720327\n",
      "--------------\n",
      "   +3.1869 if cp<=0.01561872959136963\n",
      "   -3.3004 if cv>=-0.25188755989074707\n",
      "   -2.1071 if cp<=0.02586142159998417 & cv>=0.0071222675032913685\n",
      "   +0.0000 if cp>=0.03322835490107536 & cv<=-0.058255794830620045 & pav<=0.38094785809516907\n",
      "   +1.9764 if cv<=0.11150049269199437 & cv>=-0.03321457430720327\n",
      "Run episode 435 with rewards 21.0\n",
      "============ 436 ===========\n",
      "19 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1]\n",
      "   -2.9914 if pav>=0.40491151809692383\n",
      "   +2.3421 if pav<=0.32987090945243835\n",
      "   +2.2912 if pav<=0.38094785809516907\n",
      "   -1.7110 if cv<=0.11150049269199437 & cv>=-0.03321457430720327\n",
      "   +5.2378 if cp<=-0.0028377354610711275 & cv<=-0.1796262562274933 & pav<=0.5404149889945985\n",
      "--------------\n",
      "   +2.5514 if cp<=0.01561872959136963\n",
      "   -4.4015 if cv>=-0.25188755989074707\n",
      "   -1.9573 if cp<=0.02586142159998417 & cv>=0.0071222675032913685\n",
      "   +1.1770 if cv<=0.11150049269199437 & cv>=-0.03321457430720327\n",
      "   +1.8801 if cp>=-0.0028377354610711275 & pav<=0.6536567211151123 & pav>=0.3791709542274475\n",
      "Run episode 436 with rewards 19.0\n",
      "============ 437 ===========\n",
      "15 actions [0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1]\n",
      "   -2.0469 if pav>=0.40491151809692383\n",
      "   +1.1640 if pav<=0.32987090945243835\n",
      "   +1.9900 if pav<=0.38094785809516907\n",
      "   +3.0275 if cp<=-0.0028377354610711275 & cv<=-0.1796262562274933 & pav<=0.5404149889945985\n",
      "   -2.1095 if cp<=-0.0629555769264698 & cv<=-0.2190219610929489 & cv>=-0.4033523440361023\n",
      "--------------\n",
      "   +1.3511 if cp<=0.01561872959136963\n",
      "   -1.1593 if cv>=-0.25188755989074707\n",
      "   -0.0037 if cp<=0.02586142159998417 & cv>=0.0071222675032913685\n",
      "   +0.0000 if cp>=-0.0028377354610711275 & pav<=0.6536567211151123 & pav>=0.3791709542274475\n",
      "   -2.0859 if cv>=-0.2190219610929489\n",
      "Run episode 437 with rewards 15.0\n",
      "============ 438 ===========\n",
      "13 actions [0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0]\n",
      "   -1.0314 if pav>=0.40491151809692383\n",
      "   +1.4972 if pav<=0.38094785809516907\n",
      "   +2.2351 if cp<=-0.0028377354610711275 & cv<=-0.1796262562274933 & pav<=0.5404149889945985\n",
      "   -1.2672 if cp<=-0.0629555769264698 & cv<=-0.2190219610929489 & cv>=-0.4033523440361023\n",
      "   +4.3567 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "--------------\n",
      "   +0.5099 if cp<=0.01561872959136963\n",
      "   +0.4317 if cv>=-0.25188755989074707\n",
      "   -0.0790 if cp<=0.02586142159998417 & cv>=0.0071222675032913685\n",
      "   +0.4317 if cv>=-0.2190219610929489\n",
      "   -4.4098 if cv>=-0.37838345766067505\n",
      "Run episode 438 with rewards 13.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 439 ===========\n",
      "16 actions [0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1]\n",
      "   +1.0710 if pav<=0.38094785809516907\n",
      "   -0.0000 if cp<=-0.0028377354610711275 & cv<=-0.1796262562274933 & pav<=0.5404149889945985\n",
      "   +0.0577 if cp<=-0.0629555769264698 & cv<=-0.2190219610929489 & cv>=-0.4033523440361023\n",
      "   +2.2070 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "   -3.5503 if cp>=-0.030894178897142403 & cv<=-0.3756087779998779\n",
      "--------------\n",
      "   +1.0615 if cp<=0.01561872959136963\n",
      "   -0.6615 if cv>=-0.25188755989074707\n",
      "   -0.6615 if cv>=-0.2190219610929489\n",
      "   -2.8770 if cv>=-0.37838345766067505\n",
      "   +3.9828 if cp>=-0.030894178897142403 & cv<=-0.3756087779998779\n",
      "Run episode 439 with rewards 16.0\n",
      "============ 440 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1]\n",
      "   +0.8759 if pav<=0.38094785809516907\n",
      "   +0.6893 if cp<=-0.0629555769264698 & cv<=-0.2190219610929489 & cv>=-0.4033523440361023\n",
      "   +3.7730 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "   -2.1839 if cp>=-0.030894178897142403 & cv<=-0.3756087779998779\n",
      "   -1.2149 if cp>=-0.10381387174129486 & cv<=-0.4397297501564026\n",
      "--------------\n",
      "   -0.1073 if cp<=0.01561872959136963\n",
      "   -1.5109 if cv>=-0.25188755989074707\n",
      "   -1.5109 if cv>=-0.37838345766067505\n",
      "   +2.2079 if cp>=-0.030894178897142403 & cv<=-0.3756087779998779\n",
      "   +1.5996 if cv<=-0.4397297501564026\n",
      "Run episode 440 with rewards 11.0\n",
      "============ 441 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 1, 0, 1, 0]\n",
      "   +0.9476 if pav<=0.38094785809516907\n",
      "   +3.6114 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "   +1.3184 if cp>=-0.030894178897142403 & cv<=-0.3756087779998779\n",
      "   +0.5692 if cp>=-0.10381387174129486 & cv<=-0.4397297501564026\n",
      "   +2.3606 if cv<=-0.9644651412963867 & cv>=-0.9644651412963867\n",
      "--------------\n",
      "   -1.4009 if cv>=-0.25188755989074707\n",
      "   -1.4009 if cv>=-0.37838345766067505\n",
      "   -1.2753 if cp>=-0.030894178897142403 & cv<=-0.3756087779998779\n",
      "   -3.1272 if cv<=-0.4397297501564026\n",
      "   +3.1728 if cp<=-0.07926877588033676 & cp>=-0.12178932875394821 & cv<=-0.9644651412963867\n",
      "Run episode 441 with rewards 9.0\n",
      "============ 442 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1]\n",
      "   +0.7446 if pav<=0.38094785809516907\n",
      "   +2.0859 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "   -0.0000 if cp>=-0.030894178897142403 & cv<=-0.3756087779998779\n",
      "   -0.0000 if cv<=-0.9644651412963867 & cv>=-0.9644651412963867\n",
      "   -3.0526 if cp>=-0.09506242722272873 & cv<=-0.897532868385315\n",
      "--------------\n",
      "   -1.0695 if cv>=-0.25188755989074707\n",
      "   -1.0695 if cv>=-0.37838345766067505\n",
      "   -0.6234 if cv<=-0.4397297501564026\n",
      "   -0.5000 if cp<=-0.07926877588033676 & cp>=-0.12178932875394821 & cv<=-0.9644651412963867\n",
      "   +1.9189 if cp>=-0.09506242722272873 & cv<=-0.897532868385315\n",
      "Run episode 442 with rewards 12.0\n",
      "============ 443 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 1, 1, 0, 0]\n",
      "   +1.5412 if pav<=0.38094785809516907\n",
      "   +2.5029 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "   +0.0000 if cv<=-0.9644651412963867 & cv>=-0.9644651412963867\n",
      "   -1.1891 if cp>=-0.09506242722272873 & cv<=-0.897532868385315\n",
      "   -2.2124 if cp<=-0.05066479071974752 & cp>=-0.08742385804653167 & cv>=-0.7479702353477478\n",
      "--------------\n",
      "   -1.2941 if cv>=-0.25188755989074707\n",
      "   -1.8203 if cv>=-0.37838345766067505\n",
      "   -2.2916 if cv<=-0.4397297501564026\n",
      "   +1.4824 if cp>=-0.09506242722272873 & cv<=-0.897532868385315\n",
      "   +3.3534 if cp<=-0.05066479071974752 & cp>=-0.08742385804653167 & cv>=-0.7479702353477478\n",
      "Run episode 443 with rewards 10.0\n",
      "============ 444 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0]\n",
      "   +0.6598 if pav<=0.38094785809516907\n",
      "   +2.2753 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "   -1.2268 if cp>=-0.09506242722272873 & cv<=-0.897532868385315\n",
      "   +0.0000 if cp<=-0.05066479071974752 & cp>=-0.08742385804653167 & cv>=-0.7479702353477478\n",
      "   +1.8033 if cp>=-0.05876535326242446 & cv<=-0.864766800403595\n",
      "--------------\n",
      "   -1.4218 if cv>=-0.37838345766067505\n",
      "   -0.1411 if cv<=-0.4397297501564026\n",
      "   -0.0660 if cp>=-0.09506242722272873 & cv<=-0.897532868385315\n",
      "   +0.0000 if cp<=-0.05066479071974752 & cp>=-0.08742385804653167 & cv>=-0.7479702353477478\n",
      "   -2.1454 if cp>=-0.05876535326242446 & cv<=-0.864766800403595\n",
      "Run episode 444 with rewards 11.0\n",
      "============ 445 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   +1.5685 if pav<=0.38094785809516907\n",
      "   +2.2991 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "   -1.9006 if cp>=-0.09506242722272873 & cv<=-0.897532868385315\n",
      "   +0.0000 if cp>=-0.05876535326242446 & cv<=-0.864766800403595\n",
      "   +2.4689 if cv<=-0.5986118316650391 & pa<=0.08116307109594345\n",
      "--------------\n",
      "   -2.1262 if cv>=-0.37838345766067505\n",
      "   +1.1762 if cv<=-0.4397297501564026\n",
      "   +0.5863 if cp>=-0.09506242722272873 & cv<=-0.897532868385315\n",
      "   +0.0000 if cp>=-0.05876535326242446 & cv<=-0.864766800403595\n",
      "   -3.4287 if cv<=-0.5986118316650391 & pa<=0.08116307109594345\n",
      "Run episode 445 with rewards 10.0\n",
      "============ 446 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.2423 if pav<=0.38094785809516907\n",
      "   +0.8303 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "   +0.0536 if cp>=-0.09506242722272873 & cv<=-0.897532868385315\n",
      "   +0.0234 if cv<=-0.5986118316650391 & pa<=0.08116307109594345\n",
      "   +4.2570 if cp<=0.019913791492581368 & cv>=-1.1805861234664916\n",
      "--------------\n",
      "   -1.4120 if cv>=-0.37838345766067505\n",
      "   -4.3080 if cv<=-0.4397297501564026\n",
      "   -0.3279 if cp>=-0.09506242722272873 & cv<=-0.897532868385315\n",
      "   -0.0086 if cv<=-0.5986118316650391 & pa<=0.08116307109594345\n",
      "   -5.3234 if cp<=-0.06536239981651307\n",
      "Run episode 446 with rewards 10.0\n",
      "============ 447 ===========\n",
      "14 actions [0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1]\n",
      "   +1.6748 if pav<=0.38094785809516907\n",
      "   +1.3460 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "   +0.0400 if cp>=-0.09506242722272873 & cv<=-0.897532868385315\n",
      "   +0.1213 if cp<=0.019913791492581368 & cv>=-1.1805861234664916\n",
      "   +0.6336 if cv>=0.03707673400640488\n",
      "--------------\n",
      "   -2.4671 if cv>=-0.37838345766067505\n",
      "   +3.0969 if cv<=-0.4397297501564026\n",
      "   +0.0186 if cp>=-0.09506242722272873 & cv<=-0.897532868385315\n",
      "   +9.2492 if cp<=-0.06536239981651307\n",
      "   +2.5205 if pa>=0.20861507952213287\n",
      "Run episode 447 with rewards 14.0\n",
      "============ 448 ===========\n",
      "18 actions [1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1]\n",
      "   +1.1976 if pav<=0.38094785809516907\n",
      "   +1.7164 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "   +3.4447 if cp<=0.019913791492581368 & cv>=-1.1805861234664916\n",
      "   +0.0000 if cv>=0.03707673400640488\n",
      "   -2.9508 if cp<=0.03630542904138565\n",
      "--------------\n",
      "   -1.7314 if cv>=-0.37838345766067505\n",
      "   +2.7916 if cv<=-0.4397297501564026\n",
      "   -0.2249 if cp<=-0.06536239981651307\n",
      "   -0.0000 if pa>=0.20861507952213287\n",
      "   +3.3036 if cp<=0.03630542904138565 & cp>=0.012310020439326766 & cv<=-0.3234410047531127 & cv>=-0.4036816656589508\n",
      "Run episode 448 with rewards 18.0\n",
      "============ 449 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0]\n",
      "   +0.6309 if pav<=0.38094785809516907\n",
      "   +1.8566 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "   +5.1017 if cp<=0.019913791492581368 & cv>=-1.1805861234664916\n",
      "   -4.6110 if cp<=0.03630542904138565\n",
      "   +4.4939 if cv>=0.10356131792068508 & pa>=0.044592663645744324\n",
      "--------------\n",
      "   -0.3469 if cv>=-0.37838345766067505\n",
      "   +2.6820 if cv<=-0.4397297501564026\n",
      "   +0.0000 if cp<=-0.06536239981651307\n",
      "   +0.0000 if cp<=0.03630542904138565 & cp>=0.012310020439326766 & cv<=-0.3234410047531127 & cv>=-0.4036816656589508\n",
      "   -3.8276 if cv>=0.10356131792068508 & pa>=0.044592663645744324\n",
      "Run episode 449 with rewards 12.0\n",
      "============ 450 ===========\n",
      "14 actions [0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0]\n",
      "   -0.4253 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "   +1.6220 if cp<=0.019913791492581368 & cv>=-1.1805861234664916\n",
      "   +1.6220 if cp<=0.03630542904138565\n",
      "   +0.0000 if cv>=0.10356131792068508 & pa>=0.044592663645744324\n",
      "   -1.9730 if cp<=-0.032393964380025855\n",
      "--------------\n",
      "   -1.8466 if cv>=-0.37838345766067505\n",
      "   +4.9100 if cv<=-0.4397297501564026\n",
      "   -0.0000 if cp<=0.03630542904138565 & cp>=0.012310020439326766 & cv<=-0.3234410047531127 & cv>=-0.4036816656589508\n",
      "   -0.0000 if cv>=0.10356131792068508 & pa>=0.044592663645744324\n",
      "   -2.2003 if cp<=-0.032393964380025855 & cv>=-0.4169110655784607\n",
      "Run episode 450 with rewards 14.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 451 ===========\n",
      "14 actions [0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0]\n",
      "   -2.0497 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "   +2.1133 if cp<=0.019913791492581368 & cv>=-1.1805861234664916\n",
      "   +2.1133 if cp<=0.03630542904138565\n",
      "   -2.8599 if cp<=-0.032393964380025855\n",
      "   +0.0819 if cp>=-0.0008214945555664599\n",
      "--------------\n",
      "   -1.4390 if cv>=-0.37838345766067505\n",
      "   +4.7111 if cv<=-0.4397297501564026\n",
      "   +0.0000 if cv>=0.10356131792068508 & pa>=0.044592663645744324\n",
      "   -0.5837 if cp<=-0.032393964380025855 & cv>=-0.4169110655784607\n",
      "   +2.7195 if cp<=-0.03829079344868659 & cp>=-0.06067507341504097 & cv<=-0.4289552986621857\n",
      "Run episode 451 with rewards 14.0\n",
      "============ 452 ===========\n",
      "19 actions [0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -2.0603 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "   +0.1989 if cp<=0.019913791492581368 & cv>=-1.1805861234664916\n",
      "   +0.1989 if cp<=0.03630542904138565\n",
      "   -0.1226 if cp<=-0.032393964380025855\n",
      "   +2.9462 if cv>=-0.23861417174339294\n",
      "--------------\n",
      "   -2.6984 if cv>=-0.37838345766067505\n",
      "   +3.2687 if cv<=-0.4397297501564026\n",
      "   -2.5608 if cp<=-0.032393964380025855 & cv>=-0.4169110655784607\n",
      "   +3.3148 if cp<=-0.03829079344868659 & cp>=-0.06067507341504097 & cv<=-0.4289552986621857\n",
      "   +1.2881 if cv>=-0.4331047058105469\n",
      "Run episode 452 with rewards 19.0\n",
      "============ 453 ===========\n",
      "18 actions [0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1]\n",
      "   -1.2924 if cp>=-0.04995304122567176 & cv<=-0.19306864738464355\n",
      "   +2.4191 if cp<=0.019913791492581368 & cv>=-1.1805861234664916\n",
      "   -2.2054 if cp<=0.03630542904138565\n",
      "   +2.5384 if cv>=-0.23861417174339294\n",
      "   +3.4095 if cv<=-0.3561486184597015 & cv>=-0.35848461389541625\n",
      "--------------\n",
      "   -4.5433 if cv>=-0.37838345766067505\n",
      "   +2.6817 if cv<=-0.4397297501564026\n",
      "   -0.6289 if cp<=-0.032393964380025855 & cv>=-0.4169110655784607\n",
      "   +0.6245 if cp<=-0.03829079344868659 & cp>=-0.06067507341504097 & cv<=-0.4289552986621857\n",
      "   +4.5033 if cp<=0.025622789934277537 & cv>=-0.3561486184597015\n",
      "Run episode 453 with rewards 18.0\n",
      "============ 454 ===========\n",
      "25 actions [0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0]\n",
      "   +2.6240 if cp<=0.019913791492581368 & cv>=-1.1805861234664916\n",
      "   -4.4240 if cp<=0.03630542904138565\n",
      "   +3.1625 if cv>=-0.23861417174339294\n",
      "   -0.0000 if cv<=-0.3561486184597015 & cv>=-0.35848461389541625\n",
      "   +3.7392 if cp>=0.022259723395109177\n",
      "--------------\n",
      "   -1.1665 if cv>=-0.37838345766067505\n",
      "   -0.7967 if cv<=-0.4397297501564026\n",
      "   -2.2000 if cp<=-0.032393964380025855 & cv>=-0.4169110655784607\n",
      "   -1.1659 if cp<=0.025622789934277537 & cv>=-0.3561486184597015\n",
      "   +2.2536 if cp>=-0.038338860124349596\n",
      "Run episode 454 with rewards 25.0\n",
      "============ 455 ===========\n",
      "19 actions [0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -0.6368 if cp<=0.019913791492581368 & cv>=-1.1805861234664916\n",
      "   -0.6368 if cp<=0.03630542904138565\n",
      "   +1.7598 if cv>=-0.23861417174339294\n",
      "   -0.0000 if cp>=0.022259723395109177\n",
      "   -2.6992 if cv<=-0.34373854994773867\n",
      "--------------\n",
      "   +0.0650 if cv>=-0.37838345766067505\n",
      "   -6.0806 if cp<=-0.032393964380025855 & cv>=-0.4169110655784607\n",
      "   +0.0649 if cp<=0.025622789934277537 & cv>=-0.3561486184597015\n",
      "   +1.9627 if cp>=-0.038338860124349596\n",
      "   -4.5970 if cv>=-0.14372158348560332\n",
      "Run episode 455 with rewards 19.0\n",
      "============ 456 ===========\n",
      "35 actions [0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1]\n",
      "   -1.3464 if cp<=0.019913791492581368 & cv>=-1.1805861234664916\n",
      "   -1.3464 if cp<=0.03630542904138565\n",
      "   +1.3115 if cv>=-0.23861417174339294\n",
      "   -2.6579 if cv<=-0.34373854994773867\n",
      "   +2.7860 if cv>=-0.12977617681026452\n",
      "--------------\n",
      "   +1.0732 if cv>=-0.37838345766067505\n",
      "   -5.5005 if cp<=-0.032393964380025855 & cv>=-0.4169110655784607\n",
      "   +1.9909 if cp>=-0.038338860124349596\n",
      "   -5.7427 if cv>=-0.14372158348560332\n",
      "   +1.5690 if cp<=-0.03525497019290924 & cp>=-0.0573449581861496\n",
      "Run episode 456 with rewards 35.0\n",
      "============ 457 ===========\n",
      "17 actions [0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -0.0978 if cp<=0.019913791492581368 & cv>=-1.1805861234664916\n",
      "   -0.0978 if cp<=0.03630542904138565\n",
      "   -3.4928 if cv<=-0.34373854994773867\n",
      "   +2.6287 if cv>=-0.12977617681026452\n",
      "   +5.8259 if cp>=-0.00829817987978456 & cv<=-0.03615560457110405 & cv>=-0.23023841083049773\n",
      "--------------\n",
      "   -4.6330 if cp<=-0.032393964380025855 & cv>=-0.4169110655784607\n",
      "   +2.0419 if cp>=-0.038338860124349596\n",
      "   -5.0820 if cv>=-0.14372158348560332\n",
      "   -1.5284 if cp<=-0.03525497019290924 & cp>=-0.0573449581861496\n",
      "   -5.9644 if cp>=-0.00829817987978456 & cv<=-0.03615560457110405 & cv>=-0.23023841083049773\n",
      "Run episode 457 with rewards 17.0\n",
      "============ 458 ===========\n",
      "14 actions [0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1]\n",
      "   -1.2735 if cp<=0.03630542904138565\n",
      "   -0.9164 if cv<=-0.34373854994773867\n",
      "   +2.2363 if cv>=-0.12977617681026452\n",
      "   -0.0000 if cp>=-0.00829817987978456 & cv<=-0.03615560457110405 & cv>=-0.23023841083049773\n",
      "   -1.6949 if cp>=-0.05470555052161216 & cv<=-0.5487983763217925\n",
      "--------------\n",
      "   -5.8243 if cp<=-0.032393964380025855 & cv>=-0.4169110655784607\n",
      "   +0.5658 if cp>=-0.038338860124349596\n",
      "   -2.1675 if cv>=-0.14372158348560332\n",
      "   -0.0000 if cp>=-0.00829817987978456 & cv<=-0.03615560457110405 & cv>=-0.23023841083049773\n",
      "   +2.9025 if cv<=-0.03711924038361744 & cv>=-0.19354985058307647\n",
      "Run episode 458 with rewards 14.0\n",
      "============ 459 ===========\n",
      "11 actions [1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1]\n",
      "   -0.2888 if cp<=0.03630542904138565\n",
      "   -1.7067 if cv<=-0.34373854994773867\n",
      "   +0.0538 if cv>=-0.12977617681026452\n",
      "   -1.2877 if cp>=-0.05470555052161216 & cv<=-0.5487983763217925\n",
      "   +0.4739 if cv<=-0.1738680750131607\n",
      "--------------\n",
      "   -5.0339 if cp<=-0.032393964380025855 & cv>=-0.4169110655784607\n",
      "   +0.1570 if cp>=-0.038338860124349596\n",
      "   -0.1743 if cv>=-0.14372158348560332\n",
      "   +0.3313 if cv<=-0.03711924038361744 & cv>=-0.19354985058307647\n",
      "   +1.4225 if cp>=-0.03238692507147789\n",
      "Run episode 459 with rewards 11.0\n",
      "============ 460 ===========\n",
      "19 actions [1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0]\n",
      "   -0.7084 if cp<=0.03630542904138565\n",
      "   +0.0000 if cv<=-0.34373854994773867\n",
      "   +0.0000 if cp>=-0.05470555052161216 & cv<=-0.5487983763217925\n",
      "   +0.0000 if cv<=-0.1738680750131607\n",
      "   +3.8650 if cv<=0.16083937883377075 & cv>=0.16083937883377075\n",
      "--------------\n",
      "   -0.0000 if cp<=-0.032393964380025855 & cv>=-0.4169110655784607\n",
      "   -0.2592 if cv>=-0.14372158348560332\n",
      "   -0.0000 if cv<=-0.03711924038361744 & cv>=-0.19354985058307647\n",
      "   -0.2592 if cp>=-0.03238692507147789\n",
      "   +3.3669 if cp>=-0.014995683915913105 & cv<=0.5548528432846072\n",
      "Run episode 460 with rewards 19.0\n",
      "============ 461 ===========\n",
      "16 actions [1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0]\n",
      "   -0.5409 if cp<=0.03630542904138565\n",
      "   -0.0000 if cv<=-0.34373854994773867\n",
      "   -0.0000 if cp>=-0.05470555052161216 & cv<=-0.5487983763217925\n",
      "   -0.0000 if cv<=0.16083937883377075 & cv>=0.16083937883377075\n",
      "   +5.4769 if pa>=0.017293987795710564\n",
      "--------------\n",
      "   +0.0000 if cp<=-0.032393964380025855 & cv>=-0.4169110655784607\n",
      "   -1.1725 if cv>=-0.14372158348560332\n",
      "   -1.1725 if cp>=-0.03238692507147789\n",
      "   +4.1860 if cp>=-0.014995683915913105 & cv<=0.5548528432846072\n",
      "   -4.7869 if pa>=0.017293987795710564\n",
      "Run episode 461 with rewards 16.0\n",
      "============ 462 ===========\n",
      "17 actions [1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -0.7341 if cp<=0.03630542904138565\n",
      "   -0.0000 if cv<=-0.34373854994773867\n",
      "   -0.0000 if cv<=0.16083937883377075 & cv>=0.16083937883377075\n",
      "   -0.0000 if pa>=0.017293987795710564\n",
      "   +3.6291 if cp<=0.039033856242895126 & cp>=0.039033856242895126\n",
      "--------------\n",
      "   -1.2627 if cv>=-0.14372158348560332\n",
      "   -1.2627 if cp>=-0.03238692507147789\n",
      "   +4.0555 if cp>=-0.014995683915913105 & cv<=0.5548528432846072\n",
      "   +0.0000 if pa>=0.017293987795710564\n",
      "   +2.1937 if pa<=-0.0827326700091362\n",
      "Run episode 462 with rewards 17.0\n",
      "============ 463 ===========\n",
      "15 actions [0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0]\n",
      "   -2.4829 if cp<=0.03630542904138565\n",
      "   +0.0000 if cv<=0.16083937883377075 & cv>=0.16083937883377075\n",
      "   +0.0635 if pa>=0.017293987795710564\n",
      "   +0.0000 if cp<=0.039033856242895126 & cp>=0.039033856242895126\n",
      "   -2.5795 if cp<=0.11767894923686983 & cv<=0.6285211324691773 & pav<=-0.8845067024230957\n",
      "--------------\n",
      "   -0.3574 if cv>=-0.14372158348560332\n",
      "   -0.3574 if cp>=-0.03238692507147789\n",
      "   +5.5990 if cp>=-0.014995683915913105 & cv<=0.5548528432846072\n",
      "   -0.8343 if pa<=-0.0827326700091362\n",
      "   -1.4181 if pav>=-0.8845067024230957\n",
      "Run episode 463 with rewards 15.0\n",
      "============ 464 ===========\n",
      "11 actions [0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2212 if cp<=0.03630542904138565\n",
      "   -0.0000 if pa>=0.017293987795710564\n",
      "   -0.0000 if cp<=0.039033856242895126 & cp>=0.039033856242895126\n",
      "   -1.7793 if cp<=0.11767894923686983 & cv<=0.6285211324691773 & pav<=-0.8845067024230957\n",
      "   -3.4926 if cv<=-0.009890666604042003\n",
      "--------------\n",
      "   -4.8603 if cv>=-0.14372158348560332\n",
      "   +0.0001 if cp>=-0.014995683915913105 & cv<=0.5548528432846072\n",
      "   +9.0511 if pa<=-0.0827326700091362\n",
      "   +0.1087 if pav>=-0.8845067024230957\n",
      "   +5.1114 if cv>=0.03167402595281601\n",
      "Run episode 464 with rewards 11.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 465 ===========\n",
      "59 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   -2.2733 if cp<=0.03630542904138565\n",
      "   -0.0000 if pa>=0.017293987795710564\n",
      "   -0.0000 if cp<=0.11767894923686983 & cv<=0.6285211324691773 & pav<=-0.8845067024230957\n",
      "   -0.9347 if cv<=-0.009890666604042003\n",
      "   +4.3848 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "--------------\n",
      "   -0.1041 if cv>=-0.14372158348560332\n",
      "  -13.0280 if pa<=-0.0827326700091362\n",
      "   +1.8108 if pav>=-0.8845067024230957\n",
      "   -0.1145 if cv>=0.03167402595281601\n",
      "   -3.5285 if pa<=-0.014844256453216076\n",
      "Run episode 465 with rewards 59.0\n",
      "============ 466 ===========\n",
      "39 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -3.0893 if cp<=0.03630542904138565\n",
      "   +1.4021 if cp<=0.11767894923686983 & cv<=0.6285211324691773 & pav<=-0.8845067024230957\n",
      "   -0.4726 if cv<=-0.009890666604042003\n",
      "   +5.6995 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   +5.6788 if cp>=-0.03677854388952255 & cv>=0.7537194848060608 & pa<=0.018563964217901244 & pa>=-0.0365343280136585\n",
      "--------------\n",
      "   -2.3411 if pa<=-0.0827326700091362\n",
      "   +3.6950 if pav>=-0.8845067024230957\n",
      "   +0.1209 if cv>=0.03167402595281601\n",
      "   -5.9246 if pa<=-0.014844256453216076\n",
      "   -5.2555 if cp>=-0.03677854388952255 & cv>=0.7537194848060608 & pa<=0.018563964217901244 & pa>=-0.0365343280136585\n",
      "Run episode 466 with rewards 39.0\n",
      "============ 467 ===========\n",
      "36 actions [1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   -3.0025 if cp<=0.03630542904138565\n",
      "   -0.0003 if cp<=0.11767894923686983 & cv<=0.6285211324691773 & pav<=-0.8845067024230957\n",
      "   +3.6553 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   +1.7565 if cp>=-0.03677854388952255 & cv>=0.7537194848060608 & pa<=0.018563964217901244 & pa>=-0.0365343280136585\n",
      "   +2.2445 if cp>=0.02668801359832291 & cv>=-0.0037775576114652473 & pa<=-0.03839494362473487 & pa>=-0.09515789896249771\n",
      "--------------\n",
      "   -0.4759 if pa<=-0.0827326700091362\n",
      "   +0.0215 if pav>=-0.8845067024230957\n",
      "   -4.7817 if pa<=-0.014844256453216076\n",
      "   -1.4842 if cp>=-0.03677854388952255 & cv>=0.7537194848060608 & pa<=0.018563964217901244 & pa>=-0.0365343280136585\n",
      "   +2.4975 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "Run episode 467 with rewards 36.0\n",
      "============ 468 ===========\n",
      "45 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1]\n",
      "   -0.9939 if cp<=0.03630542904138565\n",
      "   +2.3161 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   +0.0000 if cp>=-0.03677854388952255 & cv>=0.7537194848060608 & pa<=0.018563964217901244 & pa>=-0.0365343280136585\n",
      "   +0.0000 if cp>=0.02668801359832291 & cv>=-0.0037775576114652473 & pa<=-0.03839494362473487 & pa>=-0.09515789896249771\n",
      "   -4.2215 if cv<=0.36153778433799744 & cv>=0.36153778433799744\n",
      "--------------\n",
      "   -0.1001 if pa<=-0.0827326700091362\n",
      "   -6.7844 if pa<=-0.014844256453216076\n",
      "   +0.0000 if cp>=-0.03677854388952255 & cv>=0.7537194848060608 & pa<=0.018563964217901244 & pa>=-0.0365343280136585\n",
      "   +5.8146 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   -4.0408 if pa>=-0.0297720767557621\n",
      "Run episode 468 with rewards 45.0\n",
      "============ 469 ===========\n",
      "41 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   -1.3331 if cp<=0.03630542904138565\n",
      "   +0.3957 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   +0.1954 if cp>=0.02668801359832291 & cv>=-0.0037775576114652473 & pa<=-0.03839494362473487 & pa>=-0.09515789896249771\n",
      "   -0.0000 if cv<=0.36153778433799744 & cv>=0.36153778433799744\n",
      "   -2.7255 if cp<=0.020008792728185662\n",
      "--------------\n",
      "   -0.5477 if pa<=-0.0827326700091362\n",
      "   -2.1721 if pa<=-0.014844256453216076\n",
      "   +8.2973 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   -1.0566 if pa>=-0.0297720767557621\n",
      "   -3.2082 if \n",
      "Run episode 469 with rewards 41.0\n",
      "============ 470 ===========\n",
      "54 actions [0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.7087 if cp<=0.03630542904138565\n",
      "   +1.6658 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   +0.3052 if cp>=0.02668801359832291 & cv>=-0.0037775576114652473 & pa<=-0.03839494362473487 & pa>=-0.09515789896249771\n",
      "   -1.6280 if cp<=0.020008792728185662\n",
      "   -0.4221 if cp<=-0.01413026172667739\n",
      "--------------\n",
      "   -3.6124 if pa<=-0.014844256453216076\n",
      "   +2.9094 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   +2.9094 if pa>=-0.0297720767557621\n",
      "   -1.9154 if \n",
      "   -1.7456 if cp<=0.044853828847408295 & cv<=0.40483230352401733\n",
      "Run episode 470 with rewards 54.0\n",
      "============ 471 ===========\n",
      "31 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0020 if cp<=0.03630542904138565\n",
      "   +0.9029 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   -0.2370 if cp<=0.020008792728185662\n",
      "   -2.0363 if cp<=-0.01413026172667739\n",
      "   +2.7489 if cv>=1.410703420639038\n",
      "--------------\n",
      "   -5.1191 if pa<=-0.014844256453216076\n",
      "   +4.8346 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   +0.0942 if pa>=-0.0297720767557621\n",
      "   -1.6875 if \n",
      "   -3.5959 if cv>=1.410703420639038\n",
      "Run episode 471 with rewards 31.0\n",
      "============ 472 ===========\n",
      "50 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +1.4667 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   +1.5573 if cp<=0.020008792728185662\n",
      "   -0.9402 if cp<=-0.01413026172667739\n",
      "   -0.0000 if cv>=1.410703420639038\n",
      "   -2.7889 if cp<=-0.03465805575251579\n",
      "--------------\n",
      "   -7.1884 if pa<=-0.014844256453216076\n",
      "   +1.3093 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   +0.8687 if \n",
      "   +0.0000 if cv>=1.410703420639038\n",
      "   -0.1725 if cp<=-0.008972546085715278 & pa<=-0.03741154819726944\n",
      "Run episode 472 with rewards 50.0\n",
      "============ 473 ===========\n",
      "102 actions [1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1]\n",
      "   +1.4456 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   -1.1768 if cp<=0.020008792728185662\n",
      "   -1.5851 if cp<=-0.01413026172667739\n",
      "   +0.3073 if cp<=-0.03465805575251579\n",
      "   +4.6241 if cv>=0.5454139351844788 & pa>=0.013824989460408688\n",
      "--------------\n",
      "   -8.5933 if pa<=-0.014844256453216076\n",
      "   +2.5780 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   +1.8832 if \n",
      "   -0.0802 if cp<=-0.008972546085715278 & pa<=-0.03741154819726944\n",
      "   -6.5670 if cp<=-0.05504380837082862 & cv>=0.5454139351844788 & pa>=0.013824989460408688\n",
      "Run episode 473 with rewards 102.0\n",
      "============ 474 ===========\n",
      "31 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1]\n",
      "   +0.9912 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   -3.3357 if cp<=0.020008792728185662\n",
      "   +0.5402 if cp<=-0.01413026172667739\n",
      "   +6.4144 if cv>=0.5454139351844788 & pa>=0.013824989460408688\n",
      "   +7.1917 if cp<=-0.023654081299900997 & pa>=0.11995361447334289 & pav<=0.22339849472045903 & pav>=-0.060157436132430964\n",
      "--------------\n",
      "   -7.8440 if pa<=-0.014844256453216076\n",
      "   +2.7134 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   -1.3870 if \n",
      "   -2.8447 if cp<=-0.05504380837082862 & cv>=0.5454139351844788 & pa>=0.013824989460408688\n",
      "   +3.5687 if cp>=-0.023654081299900997\n",
      "Run episode 474 with rewards 31.0\n",
      "============ 475 ===========\n",
      "34 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8059 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   -0.3705 if cp<=0.020008792728185662\n",
      "   -0.0000 if cv>=0.5454139351844788 & pa>=0.013824989460408688\n",
      "   +4.3900 if cp<=-0.023654081299900997 & pa>=0.11995361447334289 & pav<=0.22339849472045903 & pav>=-0.060157436132430964\n",
      "   -1.6678 if cp<=0.03404759615659719\n",
      "--------------\n",
      "   -6.5900 if pa<=-0.014844256453216076\n",
      "   +1.3458 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   -0.0000 if cp<=-0.05504380837082862 & cv>=0.5454139351844788 & pa>=0.013824989460408688\n",
      "   +1.5356 if cp>=-0.023654081299900997\n",
      "   +0.8292 if \n",
      "Run episode 475 with rewards 34.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 476 ===========\n",
      "44 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   +1.5990 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   -0.4895 if cp<=0.020008792728185662\n",
      "   -0.0000 if cp<=-0.023654081299900997 & pa>=0.11995361447334289 & pav<=0.22339849472045903 & pav>=-0.060157436132430964\n",
      "   +0.3830 if cp<=0.03404759615659719\n",
      "   -2.7475 if pa>=0.006362945586442998\n",
      "--------------\n",
      "   -6.5456 if pa<=-0.014844256453216076\n",
      "   +2.3181 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   -0.8167 if cp>=-0.023654081299900997\n",
      "   +0.9440 if \n",
      "   -1.4854 if cp<=0.026104770973324816 & cv>=0.8160672545433044 & pa<=0.006362945586442998\n",
      "Run episode 476 with rewards 44.0\n",
      "============ 477 ===========\n",
      "67 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   +1.6887 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   -0.6865 if cp<=0.020008792728185662\n",
      "   +0.0131 if cp<=0.03404759615659719\n",
      "   -1.3277 if pa>=0.006362945586442998\n",
      "   -1.9537 if cp<=0.017783930711448227\n",
      "--------------\n",
      "   -6.5160 if pa<=-0.014844256453216076\n",
      "   +2.6240 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   +0.9921 if \n",
      "   -1.0883 if cp<=0.026104770973324816 & cv>=0.8160672545433044 & pa<=0.006362945586442998\n",
      "   +0.7220 if pa>=0.012831219471991076\n",
      "Run episode 477 with rewards 67.0\n",
      "============ 478 ===========\n",
      "36 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +1.5490 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   -0.8173 if cp<=0.020008792728185662\n",
      "   -0.6793 if pa>=0.006362945586442998\n",
      "   -0.8173 if cp<=0.017783930711448227\n",
      "   -1.6618 if cp<=0.022967843338847178 & pa>=-0.04171781986951825\n",
      "--------------\n",
      "   -4.9524 if pa<=-0.014844256453216076\n",
      "   +4.1485 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   +0.6817 if \n",
      "  +15.3898 if cp<=0.026104770973324816 & cv>=0.8160672545433044 & pa<=0.006362945586442998\n",
      "   +1.0000 if cv>=1.9666568040847778\n",
      "Run episode 478 with rewards 36.0\n",
      "============ 479 ===========\n",
      "30 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +0.8066 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   -0.3242 if cp<=0.020008792728185662\n",
      "   -0.3242 if cp<=0.017783930711448227\n",
      "   -2.2666 if cp<=0.022967843338847178 & pa>=-0.04171781986951825\n",
      "   -1.8739 if pav>=1.7401851415634155\n",
      "--------------\n",
      "   -4.1309 if pa<=-0.014844256453216076\n",
      "   +3.8040 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   +0.1928 if cp<=0.026104770973324816 & cv>=0.8160672545433044 & pa<=0.006362945586442998\n",
      "   +0.0000 if cv>=1.9666568040847778\n",
      "   +2.9490 if pav>=1.7401851415634155\n",
      "Run episode 479 with rewards 30.0\n",
      "============ 480 ===========\n",
      "41 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +1.3628 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   +0.0349 if cp<=0.020008792728185662\n",
      "   -4.2956 if cp<=0.022967843338847178 & pa>=-0.04171781986951825\n",
      "   +0.0000 if pav>=1.7401851415634155\n",
      "   +4.5710 if cp<=-0.030799390375614147 & cp>=-0.06142492964863775 & cv<=-0.5499199509620667\n",
      "--------------\n",
      "   -4.4072 if pa<=-0.014844256453216076\n",
      "   +5.0132 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   +0.1605 if cp<=0.026104770973324816 & cv>=0.8160672545433044 & pa<=0.006362945586442998\n",
      "   +0.0000 if pav>=1.7401851415634155\n",
      "   -4.6439 if cp<=-0.030799390375614147 & cp>=-0.06142492964863775 & cv<=-0.5499199509620667\n",
      "Run episode 480 with rewards 41.0\n",
      "============ 481 ===========\n",
      "37 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +1.6188 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   -0.3948 if cp<=0.020008792728185662\n",
      "   -4.0174 if cp<=0.022967843338847178 & pa>=-0.04171781986951825\n",
      "   -0.3302 if cp<=-0.030799390375614147 & cp>=-0.06142492964863775 & cv<=-0.5499199509620667\n",
      "   -3.6177 if cp>=0.008089380338788033 & pa>=-0.06074124574661255\n",
      "--------------\n",
      "   -1.4271 if pa<=-0.014844256453216076\n",
      "   +2.6363 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   +0.0621 if cp<=0.026104770973324816 & cv>=0.8160672545433044 & pa<=0.006362945586442998\n",
      "   +1.3551 if cp<=-0.030799390375614147 & cp>=-0.06142492964863775 & cv<=-0.5499199509620667\n",
      "   -3.6281 if pa<=-0.06074124574661255\n",
      "Run episode 481 with rewards 37.0\n",
      "============ 482 ===========\n",
      "42 actions [1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0]\n",
      "   +0.8189 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   +0.7580 if cp<=0.020008792728185662\n",
      "   -4.5240 if cp<=0.022967843338847178 & pa>=-0.04171781986951825\n",
      "   +0.0000 if cp>=0.008089380338788033 & pa>=-0.06074124574661255\n",
      "   +0.5837 if pa>=-0.06844343096017838\n",
      "--------------\n",
      "   -2.2115 if pa<=-0.014844256453216076\n",
      "   +3.6592 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   +0.8322 if cp<=-0.030799390375614147 & cp>=-0.06142492964863775 & cv<=-0.5499199509620667\n",
      "   -1.8173 if pa<=-0.06074124574661255\n",
      "   -1.3761 if \n",
      "Run episode 482 with rewards 42.0\n",
      "============ 483 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   +2.0464 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   -1.6455 if cp<=0.020008792728185662\n",
      "   -2.0925 if cp<=0.022967843338847178 & pa>=-0.04171781986951825\n",
      "   -0.2836 if pa>=-0.06844343096017838\n",
      "   -4.2872 if cp<=0.044938699901103975 & cv>=-0.5590342283248901 & pa<=0.001404622895643139\n",
      "--------------\n",
      "   -5.0004 if pa<=-0.014844256453216076\n",
      "   +3.1455 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   +0.0000 if pa<=-0.06074124574661255\n",
      "   +0.9344 if \n",
      "   -3.8213 if cp<=0.16220876872539522 & pa<=0.07676468491554264 & pa>=0.001404622895643139\n",
      "Run episode 483 with rewards 9.0\n",
      "============ 484 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.1104 if cv<=0.04976443201303482 & pa<=-0.014844256453216076\n",
      "   -2.7095 if cp<=0.020008792728185662\n",
      "   -0.2149 if cp<=0.022967843338847178 & pa>=-0.04171781986951825\n",
      "   -3.2122 if cp<=0.044938699901103975 & cv>=-0.5590342283248901 & pa<=0.001404622895643139\n",
      "   -1.1977 if cp<=-0.014942694827914237 & cp>=-0.02596331909298897\n",
      "--------------\n",
      "   +8.1599 if pa<=-0.014844256453216076\n",
      "   +1.8577 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   +5.7586 if \n",
      "   +2.2568 if cp<=0.16220876872539522 & pa<=0.07676468491554264 & pa>=0.001404622895643139\n",
      "   +1.0000 if cp<=0.03793084919452668 & cp>=-0.02596331909298897\n",
      "Run episode 484 with rewards 10.0\n",
      "============ 485 ===========\n",
      "20 actions [0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cp<=0.020008792728185662\n",
      "   -0.0000 if cp<=0.022967843338847178 & pa>=-0.04171781986951825\n",
      "   -0.0000 if cp<=0.044938699901103975 & cv>=-0.5590342283248901 & pa<=0.001404622895643139\n",
      "   -0.0000 if cp<=-0.014942694827914237 & cp>=-0.02596331909298897\n",
      "   -0.0167 if cp<=0.05142684578895569\n",
      "--------------\n",
      "  -10.4714 if pa<=-0.014844256453216076\n",
      "   +0.6173 if cp<=0.02668801359832291 & pa>=-0.03839494362473487\n",
      "   -4.5828 if \n",
      "   +7.4364 if cp<=0.16220876872539522 & pa<=0.07676468491554264 & pa>=0.001404622895643139\n",
      "   -1.3202 if cp>=0.077769373357296\n",
      "Run episode 485 with rewards 20.0\n",
      "============ 486 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.1913 if cp<=0.020008792728185662\n",
      "   +0.0000 if cp<=0.044938699901103975 & cv>=-0.5590342283248901 & pa<=0.001404622895643139\n",
      "   +0.0000 if cp<=-0.014942694827914237 & cp>=-0.02596331909298897\n",
      "   +1.8233 if cp<=0.05142684578895569\n",
      "   +3.3730 if cv>=0.5522191524505615\n",
      "--------------\n",
      "   -1.7397 if pa<=-0.014844256453216076\n",
      "   -2.4857 if \n",
      "   +3.3702 if cp<=0.16220876872539522 & pa<=0.07676468491554264 & pa>=0.001404622895643139\n",
      "   -0.0000 if cp>=0.077769373357296\n",
      "   -3.2759 if cv>=0.5522191524505615\n",
      "Run episode 486 with rewards 10.0\n",
      "============ 487 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.7002 if cp<=0.020008792728185662\n",
      "   +0.0714 if cp<=0.044938699901103975 & cv>=-0.5590342283248901 & pa<=0.001404622895643139\n",
      "   +1.7002 if cp<=0.05142684578895569\n",
      "   +0.0000 if cv>=0.5522191524505615\n",
      "   +0.1874 if cp<=-0.030918489396572112\n",
      "--------------\n",
      "   -0.4983 if pa<=-0.014844256453216076\n",
      "   -0.7143 if \n",
      "   -0.3715 if cp<=0.16220876872539522 & pa<=0.07676468491554264 & pa>=0.001404622895643139\n",
      "   +0.0000 if cv>=0.5522191524505615\n",
      "   -0.6854 if cp>=-0.004361427947878834\n",
      "Run episode 487 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 488 ===========\n",
      "31 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.5760 if cp<=0.020008792728185662\n",
      "   -0.0011 if cp<=0.044938699901103975 & cv>=-0.5590342283248901 & pa<=0.001404622895643139\n",
      "   +0.5760 if cp<=0.05142684578895569\n",
      "   -8.6925 if cp<=-0.030918489396572112\n",
      "   -6.8025 if cp<=-0.07118324264883995\n",
      "--------------\n",
      "   +0.0000 if pa<=-0.014844256453216076\n",
      "   -0.4742 if \n",
      "   -0.7178 if cp<=0.16220876872539522 & pa<=0.07676468491554264 & pa>=0.001404622895643139\n",
      "   -0.3138 if cp>=-0.004361427947878834\n",
      "   +0.1708 if pa>=0.17870649695396423\n",
      "Run episode 488 with rewards 31.0\n",
      "============ 489 ===========\n",
      "42 actions [0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.5892 if cp<=0.020008792728185662\n",
      "   +1.2021 if cp<=0.05142684578895569\n",
      "   -6.8383 if cp<=-0.030918489396572112\n",
      "   -2.6105 if cp<=-0.07118324264883995\n",
      "   +2.0120 if pav<=1.2166028022766113\n",
      "--------------\n",
      "   -2.5534 if \n",
      "   -0.7930 if cp<=0.16220876872539522 & pa<=0.07676468491554264 & pa>=0.001404622895643139\n",
      "   -1.9008 if cp>=-0.004361427947878834\n",
      "   +0.0008 if pa>=0.17870649695396423\n",
      "   +0.7550 if cp<=-0.03774789348244667\n",
      "Run episode 489 with rewards 42.0\n",
      "============ 490 ===========\n",
      "52 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1]\n",
      "   -3.6990 if cp<=0.05142684578895569\n",
      "   -2.0782 if cp<=-0.030918489396572112\n",
      "   -2.0999 if cp<=-0.07118324264883995\n",
      "   +5.6576 if pav<=1.2166028022766113\n",
      "   -5.5782 if cp<=-0.03458094745874403 & pa>=0.04717824831604961\n",
      "--------------\n",
      "   -2.3344 if \n",
      "   -1.4701 if cp<=0.16220876872539522 & pa<=0.07676468491554264 & pa>=0.001404622895643139\n",
      "   -1.6517 if cp>=-0.004361427947878834\n",
      "   -0.1171 if cp<=-0.03774789348244667\n",
      "   +3.9044 if cp<=-0.03458094745874403 & pa>=0.04717824831604961\n",
      "Run episode 490 with rewards 52.0\n",
      "============ 491 ===========\n",
      "42 actions [0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1]\n",
      "   -4.5807 if cp<=0.05142684578895569\n",
      "   -1.6523 if cp<=-0.07118324264883995\n",
      "   +6.3328 if pav<=1.2166028022766113\n",
      "   -5.6951 if cp<=-0.03458094745874403 & pa>=0.04717824831604961\n",
      "   -2.9805 if cp<=-0.04269019141793249 & pa<=0.03353222459554675\n",
      "--------------\n",
      "   -2.7892 if \n",
      "   -1.7717 if cp<=0.16220876872539522 & pa<=0.07676468491554264 & pa>=0.001404622895643139\n",
      "   -0.4698 if cp>=-0.004361427947878834\n",
      "   +3.1986 if cp<=-0.03458094745874403 & pa>=0.04717824831604961\n",
      "   +2.5428 if cv<=-0.6239863276481629 & pa<=0.03353222459554675 & pav>=1.071730160713196\n",
      "Run episode 491 with rewards 42.0\n",
      "============ 492 ===========\n",
      "28 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -3.5862 if cp<=0.05142684578895569\n",
      "   +4.1631 if pav<=1.2166028022766113\n",
      "   -5.5271 if cp<=-0.03458094745874403 & pa>=0.04717824831604961\n",
      "   +1.5098 if cp<=-0.04269019141793249 & pa<=0.03353222459554675\n",
      "   -3.9811 if cp<=0.014974704384803835 & cp>=-0.027884004265069942 & cv<=-0.5792981863021851 & pa<=0.05490263700485233 & pa>=-0.0167272739112377\n",
      "--------------\n",
      "   -2.0701 if \n",
      "   -3.0873 if cp<=0.16220876872539522 & pa<=0.07676468491554264 & pa>=0.001404622895643139\n",
      "   +3.9873 if cp<=-0.03458094745874403 & pa>=0.04717824831604961\n",
      "   +1.7284 if cv<=-0.6239863276481629 & pa<=0.03353222459554675 & pav>=1.071730160713196\n",
      "   +5.0105 if cp<=0.014974704384803835 & cp>=-0.027884004265069942 & cv<=-0.5792981863021851 & pa<=0.05490263700485233 & pa>=-0.0167272739112377\n",
      "Run episode 492 with rewards 28.0\n",
      "============ 493 ===========\n",
      "26 actions [1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   -4.3043 if cp<=0.05142684578895569\n",
      "   +2.3117 if pav<=1.2166028022766113\n",
      "   -1.6313 if cp<=-0.03458094745874403 & pa>=0.04717824831604961\n",
      "   +0.0000 if cp<=0.014974704384803835 & cp>=-0.027884004265069942 & cv<=-0.5792981863021851 & pa<=0.05490263700485233 & pa>=-0.0167272739112377\n",
      "   +3.0028 if cp<=0.00831114295870066 & cp>=-0.02452445179224014\n",
      "--------------\n",
      "   -0.1355 if \n",
      "   -3.7982 if cp<=0.16220876872539522 & pa<=0.07676468491554264 & pa>=0.001404622895643139\n",
      "   +1.1052 if cp<=-0.03458094745874403 & pa>=0.04717824831604961\n",
      "   +0.0000 if cp<=0.014974704384803835 & cp>=-0.027884004265069942 & cv<=-0.5792981863021851 & pa<=0.05490263700485233 & pa>=-0.0167272739112377\n",
      "   -1.9186 if cv>=1.1702983379364014\n",
      "Run episode 493 with rewards 26.0\n",
      "============ 494 ===========\n",
      "27 actions [1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0]\n",
      "   -5.5345 if cp<=0.05142684578895569\n",
      "   +3.1131 if pav<=1.2166028022766113\n",
      "   -0.0000 if cp<=-0.03458094745874403 & pa>=0.04717824831604961\n",
      "   -0.0000 if cp<=0.00831114295870066 & cp>=-0.02452445179224014\n",
      "   -4.4758 if cp>=0.06165559962391854 & cv<=0.007343012373894453 & pa>=-0.07736329734325409\n",
      "--------------\n",
      "   -0.2006 if \n",
      "   +0.0000 if cp<=0.16220876872539522 & pa<=0.07676468491554264 & pa>=0.001404622895643139\n",
      "   +0.0000 if cp<=-0.03458094745874403 & pa>=0.04717824831604961\n",
      "   +0.0000 if cv>=1.1702983379364014\n",
      "   +3.7603 if cp>=0.06165559962391854 & cv<=0.007343012373894453 & pa>=-0.07736329734325409\n",
      "Run episode 494 with rewards 27.0\n",
      "============ 495 ===========\n",
      "81 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0]\n",
      "   -6.4589 if cp<=0.05142684578895569\n",
      "   +3.1539 if pav<=1.2166028022766113\n",
      "   +1.4355 if cp<=0.00831114295870066 & cp>=-0.02452445179224014\n",
      "   -3.1137 if cp>=0.06165559962391854 & cv<=0.007343012373894453 & pa>=-0.07736329734325409\n",
      "   +5.5536 if cp>=0.04271374866366386 & cv>=-0.04070341140031815 & pa>=-0.03534149006009102\n",
      "--------------\n",
      "   -1.9138 if \n",
      "   +0.0000 if cp<=0.16220876872539522 & pa<=0.07676468491554264 & pa>=0.001404622895643139\n",
      "   +0.0000 if cv>=1.1702983379364014\n",
      "   +3.8511 if cp>=0.06165559962391854 & cv<=0.007343012373894453 & pa>=-0.07736329734325409\n",
      "   +3.7186 if cp<=0.052005684375762945 & cv<=-0.04070341140031815\n",
      "Run episode 495 with rewards 81.0\n",
      "============ 496 ===========\n",
      "10 actions [1, 1, 1, 1, 0, 0, 1, 1, 1, 0]\n",
      "   -7.2872 if cp<=0.05142684578895569\n",
      "   +3.4903 if pav<=1.2166028022766113\n",
      "   -1.8780 if cp>=0.06165559962391854 & cv<=0.007343012373894453 & pa>=-0.07736329734325409\n",
      "   +4.9755 if cp>=0.04271374866366386 & cv>=-0.04070341140031815 & pa>=-0.03534149006009102\n",
      "   +5.0755 if cp<=-0.010602208785712719 & cv>=0.5406747460365295 & pa>=0.03220278024673462\n",
      "--------------\n",
      "   -2.1099 if \n",
      "   -1.6653 if cp<=0.16220876872539522 & pa<=0.07676468491554264 & pa>=0.001404622895643139\n",
      "   +2.4716 if cp>=0.06165559962391854 & cv<=0.007343012373894453 & pa>=-0.07736329734325409\n",
      "   +2.0642 if cp<=0.052005684375762945 & cv<=-0.04070341140031815\n",
      "   +3.9416 if cp>=-0.010602208785712719 & cv>=-0.6213500499725342 & pa>=-0.01880129426717756\n",
      "Run episode 496 with rewards 10.0\n",
      "============ 497 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 0, 1, 1, 1]\n",
      "   +1.6204 if cp<=0.05142684578895569\n",
      "   -7.0673 if pav<=1.2166028022766113\n",
      "   -0.0000 if cp>=0.04271374866366386 & cv>=-0.04070341140031815 & pa>=-0.03534149006009102\n",
      "   -0.0000 if cp<=-0.010602208785712719 & cv>=0.5406747460365295 & pa>=0.03220278024673462\n",
      "   +4.3455 if cp<=0.01636929120868445 & cp>=-0.009472728427499532\n",
      "--------------\n",
      "   -3.9286 if \n",
      "   +0.0000 if cp>=0.06165559962391854 & cv<=0.007343012373894453 & pa>=-0.07736329734325409\n",
      "   +0.0000 if cp<=0.052005684375762945 & cv<=-0.04070341140031815\n",
      "   +0.0000 if cp>=-0.010602208785712719 & cv>=-0.6213500499725342 & pa>=-0.01880129426717756\n",
      "   +3.2698 if cp<=-0.009472728427499532\n",
      "Run episode 497 with rewards 9.0\n",
      "============ 498 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   -2.6618 if cp<=0.05142684578895569\n",
      "   +5.4436 if pav<=1.2166028022766113\n",
      "   +0.0000 if cp<=-0.010602208785712719 & cv>=0.5406747460365295 & pa>=0.03220278024673462\n",
      "   +0.0000 if cp<=0.01636929120868445 & cp>=-0.009472728427499532\n",
      "   -9.6919 if cp<=0.07799144536256791\n",
      "--------------\n",
      "   -1.0738 if \n",
      "   +0.0000 if cp>=0.06165559962391854 & cv<=0.007343012373894453 & pa>=-0.07736329734325409\n",
      "   +0.0000 if cp>=-0.010602208785712719 & cv>=-0.6213500499725342 & pa>=-0.01880129426717756\n",
      "   +0.0000 if cp<=-0.009472728427499532\n",
      "   -1.7761 if cp<=0.10781937390565872 & cp>=0.07799144536256791\n",
      "Run episode 498 with rewards 11.0\n",
      "============ 499 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0336 if cp<=0.05142684578895569\n",
      "  -16.0850 if pav<=1.2166028022766113\n",
      "   -0.0200 if cp<=0.01636929120868445 & cp>=-0.009472728427499532\n",
      "   -0.0461 if cp<=0.07799144536256791\n",
      "   -1.2210 if cv<=1.211381435394287\n",
      "--------------\n",
      "   +0.2199 if \n",
      "   +0.0771 if cp>=-0.010602208785712719 & cv>=-0.6213500499725342 & pa>=-0.01880129426717756\n",
      "   +0.0000 if cp<=-0.009472728427499532\n",
      "   +0.0017 if cp<=0.10781937390565872 & cp>=0.07799144536256791\n",
      "   +0.1195 if cv<=1.211381435394287 & pa<=-0.0626402273774147\n",
      "Run episode 499 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 500 ===========\n",
      "29 actions [1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0]\n",
      "   -3.9206 if cp<=0.05142684578895569\n",
      "  +13.4323 if pav<=1.2166028022766113\n",
      "   -6.4889 if cp<=0.07799144536256791\n",
      "   -6.1157 if cv<=1.211381435394287\n",
      "   +2.2667 if cp>=0.1459137499332428\n",
      "--------------\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.010602208785712719 & cv>=-0.6213500499725342 & pa>=-0.01880129426717756\n",
      "   -0.0000 if cp<=0.10781937390565872 & cp>=0.07799144536256791\n",
      "   +0.0000 if cv<=1.211381435394287 & pa<=-0.0626402273774147\n",
      "   +0.0000 if cp>=0.10280091911554337\n",
      "Run episode 500 with rewards 29.0\n",
      "============ 501 ===========\n",
      "31 actions [1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0]\n",
      "   -3.7712 if cp<=0.05142684578895569\n",
      "   +3.7851 if pav<=1.2166028022766113\n",
      "   -3.3573 if cp<=0.07799144536256791\n",
      "   +3.7851 if cv<=1.211381435394287\n",
      "   -4.2105 if pav>=-0.5855000376701355\n",
      "--------------\n",
      "   -0.0145 if \n",
      "   -0.1669 if cp<=0.10781937390565872 & cp>=0.07799144536256791\n",
      "   +0.1413 if cv<=1.211381435394287 & pa<=-0.0626402273774147\n",
      "   +0.0000 if cp>=0.10280091911554337\n",
      "   -6.1189 if pa>=-0.022251424565911254 & pav<=-0.5855000376701355\n",
      "Run episode 501 with rewards 31.0\n",
      "============ 502 ===========\n",
      "20 actions [1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1]\n",
      "   -2.7260 if cp<=0.05142684578895569\n",
      "   +3.8797 if pav<=1.2166028022766113\n",
      "   +3.8797 if cv<=1.211381435394287\n",
      "   -4.4836 if pav>=-0.5855000376701355\n",
      "   -5.7957 if cp<=0.06820031255483627 & pa>=-0.14038896560668945 & pav>=-0.7154013514518738\n",
      "--------------\n",
      "   +2.6316 if \n",
      "   -3.1427 if cp<=0.10781937390565872 & cp>=0.07799144536256791\n",
      "   -0.5630 if cv<=1.211381435394287 & pa<=-0.0626402273774147\n",
      "   -0.0000 if pa>=-0.022251424565911254 & pav<=-0.5855000376701355\n",
      "   -5.6272 if pa>=-0.14038896560668945 & pav<=-0.7154013514518738\n",
      "Run episode 502 with rewards 20.0\n",
      "============ 503 ===========\n",
      "19 actions [1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +2.4056 if pav<=1.2166028022766113\n",
      "   +2.4056 if cv<=1.211381435394287\n",
      "   -0.6120 if pav>=-0.5855000376701355\n",
      "   -1.2880 if cp<=0.06820031255483627 & pa>=-0.14038896560668945 & pav>=-0.7154013514518738\n",
      "   -4.3639 if pav>=-0.6246950507164002\n",
      "--------------\n",
      "   +2.6281 if \n",
      "   -0.0000 if cp<=0.10781937390565872 & cp>=0.07799144536256791\n",
      "   -1.3757 if cv<=1.211381435394287 & pa<=-0.0626402273774147\n",
      "   -0.3770 if pa>=-0.14038896560668945 & pav<=-0.7154013514518738\n",
      "   -3.9266 if cp<=0.03380240127444268 & pav<=-0.6246950507164002\n",
      "Run episode 503 with rewards 19.0\n",
      "============ 504 ===========\n",
      "17 actions [1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0]\n",
      "   +1.9372 if pav<=1.2166028022766113\n",
      "   +1.9372 if cv<=1.211381435394287\n",
      "   -1.5080 if cp<=0.06820031255483627 & pa>=-0.14038896560668945 & pav>=-0.7154013514518738\n",
      "   -4.8143 if pav>=-0.6246950507164002\n",
      "   +1.0914 if cp>=0.08636940568685532 & pav<=-0.5716214656829833\n",
      "--------------\n",
      "   +2.7827 if \n",
      "   +0.4301 if cv<=1.211381435394287 & pa<=-0.0626402273774147\n",
      "   -2.0753 if pa>=-0.14038896560668945 & pav<=-0.7154013514518738\n",
      "   -0.6468 if cp<=0.03380240127444268 & pav<=-0.6246950507164002\n",
      "   -1.2164 if cp<=0.11835430711507798 & cp>=0.08636940568685532 & cv<=0.633049750328064 & pav<=-0.5716214656829833\n",
      "Run episode 504 with rewards 17.0\n",
      "============ 505 ===========\n",
      "19 actions [1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1]\n",
      "   +1.5058 if pav<=1.2166028022766113\n",
      "   +1.5058 if cv<=1.211381435394287\n",
      "   -3.1211 if cp<=0.06820031255483627 & pa>=-0.14038896560668945 & pav>=-0.7154013514518738\n",
      "   -1.8460 if pav>=-0.6246950507164002\n",
      "   -1.0336 if cp>=0.036258614808321016\n",
      "--------------\n",
      "   +2.5010 if \n",
      "   -3.4503 if pa>=-0.14038896560668945 & pav<=-0.7154013514518738\n",
      "   +1.2599 if cp<=0.03380240127444268 & pav<=-0.6246950507164002\n",
      "   -0.0000 if cp<=0.11835430711507798 & cp>=0.08636940568685532 & cv<=0.633049750328064 & pav<=-0.5716214656829833\n",
      "   +1.5580 if cp<=0.0690134957432747 & cp>=0.0029328573087696016 & cp>=0.036258614808321016\n",
      "Run episode 505 with rewards 19.0\n",
      "============ 506 ===========\n",
      "19 actions [1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0]\n",
      "   +1.3383 if pav<=1.2166028022766113\n",
      "   +1.3383 if cv<=1.211381435394287\n",
      "   -2.7438 if cp<=0.06820031255483627 & pa>=-0.14038896560668945 & pav>=-0.7154013514518738\n",
      "   -1.3761 if pav>=-0.6246950507164002\n",
      "   -4.2233 if cp<=0.04952674955129623 & cv>=0.3803305745124817\n",
      "--------------\n",
      "   +1.3866 if \n",
      "   -2.0250 if pa>=-0.14038896560668945 & pav<=-0.7154013514518738\n",
      "   +0.0000 if cp<=0.03380240127444268 & pav<=-0.6246950507164002\n",
      "   +4.0677 if cp<=0.0690134957432747 & cp>=0.0029328573087696016 & cp>=0.036258614808321016\n",
      "   -3.6527 if cv>=0.7570434212684631\n",
      "Run episode 506 with rewards 19.0\n",
      "============ 507 ===========\n",
      "13 actions [1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0]\n",
      "   +3.3336 if pav<=1.2166028022766113\n",
      "   -0.6552 if cp<=0.06820031255483627 & pa>=-0.14038896560668945 & pav>=-0.7154013514518738\n",
      "   -3.2457 if pav>=-0.6246950507164002\n",
      "   -0.8493 if cp<=0.04952674955129623 & cv>=0.3803305745124817\n",
      "   -5.0698 if cp<=-0.01262186300009489 & cv>=0.35300416946411134\n",
      "--------------\n",
      "   +0.5214 if \n",
      "   -4.4244 if pa>=-0.14038896560668945 & pav<=-0.7154013514518738\n",
      "   +2.1934 if cp<=0.0690134957432747 & cp>=0.0029328573087696016 & cp>=0.036258614808321016\n",
      "   +0.0000 if cv>=0.7570434212684631\n",
      "   +4.4509 if cp<=-0.01262186300009489 & cv>=0.35300416946411134\n",
      "Run episode 507 with rewards 13.0\n",
      "============ 508 ===========\n",
      "10 actions [1, 1, 1, 0, 1, 1, 0, 1, 1, 1]\n",
      "   -0.6182 if pav<=1.2166028022766113\n",
      "   -3.1489 if pav>=-0.6246950507164002\n",
      "   +1.8784 if cp<=0.04952674955129623 & cv>=0.3803305745124817\n",
      "   -0.0000 if cp<=-0.01262186300009489 & cv>=0.35300416946411134\n",
      "   -6.3203 if cp>=0.08989604562520981\n",
      "--------------\n",
      "   +0.6801 if \n",
      "   -1.9985 if pa>=-0.14038896560668945 & pav<=-0.7154013514518738\n",
      "   +2.3183 if cp<=0.0690134957432747 & cp>=0.0029328573087696016 & cp>=0.036258614808321016\n",
      "   +0.0000 if cp<=-0.01262186300009489 & cv>=0.35300416946411134\n",
      "   +2.2482 if cp<=0.018583789281547074\n",
      "Run episode 508 with rewards 10.0\n",
      "============ 509 ===========\n",
      "18 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0]\n",
      "   +2.4042 if pav<=1.2166028022766113\n",
      "   -4.5851 if pav>=-0.6246950507164002\n",
      "   +0.5364 if cp<=0.04952674955129623 & cv>=0.3803305745124817\n",
      "  +11.4559 if cp>=0.08989604562520981\n",
      "   +1.9363 if cp>=0.11964180320501328\n",
      "--------------\n",
      "   +0.7260 if \n",
      "   -1.4807 if pa>=-0.14038896560668945 & pav<=-0.7154013514518738\n",
      "   +0.0436 if cp<=0.0690134957432747 & cp>=0.0029328573087696016 & cp>=0.036258614808321016\n",
      "   -0.0000 if cp<=0.018583789281547074\n",
      "   +1.6554 if cp<=0.06585139855742456 & cp>=0.046877358108758926\n",
      "Run episode 509 with rewards 18.0\n",
      "============ 510 ===========\n",
      "16 actions [1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0]\n",
      "   +3.1337 if pav<=1.2166028022766113\n",
      "   -6.2295 if pav>=-0.6246950507164002\n",
      "   +0.0000 if cp>=0.08989604562520981\n",
      "   +0.0000 if cp>=0.11964180320501328\n",
      "   +0.6800 if pav<=-0.37777405381202694 & pav>=-0.6509152889251709\n",
      "--------------\n",
      "   +1.7784 if \n",
      "   -1.8836 if pa>=-0.14038896560668945 & pav<=-0.7154013514518738\n",
      "   +0.9368 if cp<=0.0690134957432747 & cp>=0.0029328573087696016 & cp>=0.036258614808321016\n",
      "   -1.2274 if cp<=0.06585139855742456 & cp>=0.046877358108758926\n",
      "   -2.6893 if cv>=0.28194304704666157 & pav>=-0.7432695508003234\n",
      "Run episode 510 with rewards 16.0\n",
      "============ 511 ===========\n",
      "14 actions [1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1]\n",
      "   +1.7726 if pav<=1.2166028022766113\n",
      "   -4.6296 if pav>=-0.6246950507164002\n",
      "   -0.3405 if cp>=0.08989604562520981\n",
      "   -0.9090 if pav<=-0.37777405381202694 & pav>=-0.6509152889251709\n",
      "   -7.8962 if cp>=0.12813447415828705\n",
      "--------------\n",
      "   +0.6111 if \n",
      "   -0.5682 if pa>=-0.14038896560668945 & pav<=-0.7154013514518738\n",
      "   -0.1610 if cp<=0.06585139855742456 & cp>=0.046877358108758926\n",
      "   +0.4738 if cv>=0.28194304704666157 & pav>=-0.7432695508003234\n",
      "   +2.5600 if cp>=0.12813447415828705 & cv<=0.4224066734313965\n",
      "Run episode 511 with rewards 14.0\n",
      "============ 512 ===========\n",
      "20 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1]\n",
      "   +3.5166 if pav<=1.2166028022766113\n",
      "   -5.5910 if pav>=-0.6246950507164002\n",
      "   -1.0839 if pav<=-0.37777405381202694 & pav>=-0.6509152889251709\n",
      "   +7.4964 if cp>=0.12813447415828705\n",
      "   -2.9835 if cp<=0.06180045604705811 & cv>=0.410202294588089\n",
      "--------------\n",
      "   +0.0183 if \n",
      "   -0.5787 if pa>=-0.14038896560668945 & pav<=-0.7154013514518738\n",
      "   -0.2345 if cv>=0.28194304704666157 & pav>=-0.7432695508003234\n",
      "   -0.0000 if cp>=0.12813447415828705 & cv<=0.4224066734313965\n",
      "   +1.8795 if cp<=0.06180045604705811 & cv>=0.410202294588089\n",
      "Run episode 512 with rewards 20.0\n",
      "============ 513 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.5929 if pav<=1.2166028022766113\n",
      "   -3.2422 if pav>=-0.6246950507164002\n",
      "   +3.7360 if cp>=0.12813447415828705\n",
      "   -3.9446 if cp<=0.06180045604705811 & cv>=0.410202294588089\n",
      "   +2.9417 if cp>=0.02766814008355141\n",
      "--------------\n",
      "   +0.6820 if \n",
      "   -0.2483 if pa>=-0.14038896560668945 & pav<=-0.7154013514518738\n",
      "   +0.5667 if cv>=0.28194304704666157 & pav>=-0.7432695508003234\n",
      "   +3.5642 if cp<=0.06180045604705811 & cv>=0.410202294588089\n",
      "   +1.4865 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "Run episode 513 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 514 ===========\n",
      "25 actions [0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0]\n",
      "   -2.6603 if pav>=-0.6246950507164002\n",
      "   +1.2177 if cp>=0.12813447415828705\n",
      "   +2.7735 if cp<=0.06180045604705811 & cv>=0.410202294588089\n",
      "  +14.5425 if cp>=0.02766814008355141\n",
      "   +1.9473 if cp>=-0.00777187906205653\n",
      "--------------\n",
      "   -6.1153 if \n",
      "   +2.1212 if cv>=0.28194304704666157 & pav>=-0.7432695508003234\n",
      "   +1.6708 if cp<=0.06180045604705811 & cv>=0.410202294588089\n",
      "   +4.7260 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   -9.5864 if cp>=0.025294383987784393\n",
      "Run episode 514 with rewards 25.0\n",
      "============ 515 ===========\n",
      "52 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.6290 if pav>=-0.6246950507164002\n",
      "   +4.4343 if cp<=0.06180045604705811 & cv>=0.410202294588089\n",
      "   +0.0022 if cp>=0.02766814008355141\n",
      "   -1.5706 if cp>=-0.00777187906205653\n",
      "   +6.1982 if cp<=0.006835730094462633 & cp>=0.0014689753763377721 & pa<=0.06051899641752243\n",
      "--------------\n",
      "   -0.9702 if \n",
      "   -0.9793 if cv>=0.28194304704666157 & pav>=-0.7432695508003234\n",
      "   +4.0067 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   -0.0000 if cp>=0.025294383987784393\n",
      "   -7.9526 if cp<=0.006835730094462633 & cv<=0.3771171629428864 & pa<=0.08779068440198899 & pav<=0.41170703172683726\n",
      "Run episode 515 with rewards 52.0\n",
      "============ 516 ===========\n",
      "32 actions [0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0]\n",
      "   -2.4104 if pav>=-0.6246950507164002\n",
      "   +4.1537 if cp<=0.06180045604705811 & cv>=0.410202294588089\n",
      "   -1.8958 if cp>=-0.00777187906205653\n",
      "   -0.0000 if cp<=0.006835730094462633 & cp>=0.0014689753763377721 & pa<=0.06051899641752243\n",
      "   -5.7284 if cp>=-0.06273479014635086 & cv<=0.5024940133094787 & cv>=0.12671606242656708 & pa>=0.03286732882261277\n",
      "--------------\n",
      "   -4.1956 if \n",
      "   +2.4239 if cv>=0.28194304704666157 & pav>=-0.7432695508003234\n",
      "   +4.9958 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   -6.8411 if cp<=0.006835730094462633 & cv<=0.3771171629428864 & pa<=0.08779068440198899 & pav<=0.41170703172683726\n",
      "   +5.8839 if cv>=-0.24457525610923767 & pav>=0.33867928385734575\n",
      "Run episode 516 with rewards 32.0\n",
      "============ 517 ===========\n",
      "23 actions [0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0]\n",
      "   -0.5493 if pav>=-0.6246950507164002\n",
      "   +2.4095 if cp<=0.06180045604705811 & cv>=0.410202294588089\n",
      "   -2.6866 if cp>=-0.00777187906205653\n",
      "   +0.0000 if cp>=-0.06273479014635086 & cv<=0.5024940133094787 & cv>=0.12671606242656708 & pa>=0.03286732882261277\n",
      "   -3.9226 if pav>=0.5364760756492615\n",
      "--------------\n",
      "   -4.8085 if \n",
      "   +4.4774 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   +7.7072 if cp<=0.006835730094462633 & cv<=0.3771171629428864 & pa<=0.08779068440198899 & pav<=0.41170703172683726\n",
      "   -0.0000 if cv>=-0.24457525610923767 & pav>=0.33867928385734575\n",
      "   +6.2819 if cv>=0.3177134096622468 & pav>=-0.7209678053855896\n",
      "Run episode 517 with rewards 23.0\n",
      "============ 518 ===========\n",
      "17 actions [1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0]\n",
      "   -2.5616 if pav>=-0.6246950507164002\n",
      "   +0.5134 if cp<=0.06180045604705811 & cv>=0.410202294588089\n",
      "   -1.2282 if cp>=-0.00777187906205653\n",
      "   -0.7934 if pav>=0.5364760756492615\n",
      "   +2.7484 if cp>=0.02844161204993725 & pav>=-0.04020192695315913\n",
      "--------------\n",
      "   -4.5553 if \n",
      "   +4.7676 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   +0.0000 if cp<=0.006835730094462633 & cv<=0.3771171629428864 & pa<=0.08779068440198899 & pav<=0.41170703172683726\n",
      "   +6.3516 if cv>=0.3177134096622468 & pav>=-0.7209678053855896\n",
      "   -2.5317 if cp>=0.02844161204993725 & pav>=-0.04020192695315913\n",
      "Run episode 518 with rewards 17.0\n",
      "============ 519 ===========\n",
      "14 actions [1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1]\n",
      "   -2.4201 if pav>=-0.6246950507164002\n",
      "   -0.7180 if cp>=-0.00777187906205653\n",
      "   -0.0000 if pav>=0.5364760756492615\n",
      "   -0.0000 if cp>=0.02844161204993725 & pav>=-0.04020192695315913\n",
      "   -1.5076 if cp<=-0.033406380191445345 & cv<=0.5138146758079531\n",
      "--------------\n",
      "   +2.5511 if \n",
      "   +0.3664 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   +0.4485 if cv>=0.3177134096622468 & pav>=-0.7209678053855896\n",
      "   +0.0000 if cp>=0.02844161204993725 & pav>=-0.04020192695315913\n",
      "   -5.6609 if cp<=0.06075665429234505 & cv>=0.5138146758079531\n",
      "Run episode 519 with rewards 14.0\n",
      "============ 520 ===========\n",
      "34 actions [1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0]\n",
      "   -5.6976 if pav>=-0.6246950507164002\n",
      "   +3.9061 if cp>=-0.00777187906205653\n",
      "   +0.0000 if cp>=0.02844161204993725 & pav>=-0.04020192695315913\n",
      "   +0.0000 if cp<=-0.033406380191445345 & cv<=0.5138146758079531\n",
      "  +12.6338 if cp>=0.0900518611073494\n",
      "--------------\n",
      "   -4.3785 if \n",
      "   +3.9923 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   +4.1146 if cv>=0.3177134096622468 & pav>=-0.7209678053855896\n",
      "   -0.7702 if cp<=0.06075665429234505 & cv>=0.5138146758079531\n",
      "  -10.7475 if cp>=0.0900518611073494\n",
      "Run episode 520 with rewards 34.0\n",
      "============ 521 ===========\n",
      "48 actions [1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1]\n",
      "   -5.1559 if pav>=-0.6246950507164002\n",
      "   +4.1708 if cp>=-0.00777187906205653\n",
      "   +0.0000 if cp<=-0.033406380191445345 & cv<=0.5138146758079531\n",
      "   +0.0000 if cp>=0.0900518611073494\n",
      "   -4.0028 if cp<=0.019582501053810125 & cp>=-0.010461837612092495 & cv<=0.04960751309990884 & pa>=-0.14058155417442322\n",
      "--------------\n",
      "   -4.9290 if \n",
      "   +6.9038 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   -0.0217 if cv>=0.3177134096622468 & pav>=-0.7209678053855896\n",
      "   -0.0000 if cp>=0.0900518611073494\n",
      "   -6.3104 if cp>=0.001480318093672411 & cv>=0.04960751309990884 & pa>=-0.05005654245615006\n",
      "Run episode 521 with rewards 48.0\n",
      "============ 522 ===========\n",
      "25 actions [1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0]\n",
      "   -0.6381 if pav>=-0.6246950507164002\n",
      "   +0.2639 if cp>=-0.00777187906205653\n",
      "   +0.0000 if cp>=0.0900518611073494\n",
      "   -2.3001 if cp<=0.019582501053810125 & cp>=-0.010461837612092495 & cv<=0.04960751309990884 & pa>=-0.14058155417442322\n",
      "   +5.3097 if cp>=0.026142028719186788 & cv<=-0.2887256205081939 & pa>=-0.03863524049520492\n",
      "--------------\n",
      "   -6.2701 if \n",
      "   +7.5909 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   -0.0027 if cv>=0.3177134096622468 & pav>=-0.7209678053855896\n",
      "   -6.2349 if cp>=0.001480318093672411 & cv>=0.04960751309990884 & pa>=-0.05005654245615006\n",
      "   -5.2738 if cp>=0.01977927349507809 & cv<=-0.1591957479715347 & cv<=-0.2887256205081939 & pa>=-0.03863524049520492\n",
      "Run episode 522 with rewards 25.0\n",
      "============ 523 ===========\n",
      "23 actions [1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1]\n",
      "   -1.0106 if pav>=-0.6246950507164002\n",
      "   +0.8460 if cp>=-0.00777187906205653\n",
      "   -1.5944 if cp<=0.019582501053810125 & cp>=-0.010461837612092495 & cv<=0.04960751309990884 & pa>=-0.14058155417442322\n",
      "   +0.0000 if cp>=0.026142028719186788 & cv<=-0.2887256205081939 & pa>=-0.03863524049520492\n",
      "   -2.6912 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "--------------\n",
      "   -3.7862 if \n",
      "   +6.3707 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   -0.0000 if cp>=0.001480318093672411 & cv>=0.04960751309990884 & pa>=-0.05005654245615006\n",
      "   -0.0000 if cp>=0.01977927349507809 & cv<=-0.1591957479715347 & cv<=-0.2887256205081939 & pa>=-0.03863524049520492\n",
      "   -3.7136 if cp>=0.012437111325562002 & cv<=-0.009875047951936715 & pav<=-0.29916530251502976\n",
      "Run episode 523 with rewards 23.0\n",
      "============ 524 ===========\n",
      "46 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0]\n",
      "   -0.5001 if pav>=-0.6246950507164002\n",
      "   +0.6968 if cp>=-0.00777187906205653\n",
      "   -0.6324 if cp<=0.019582501053810125 & cp>=-0.010461837612092495 & cv<=0.04960751309990884 & pa>=-0.14058155417442322\n",
      "   -5.3531 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   -1.8151 if cv<=-0.024858080595731732\n",
      "--------------\n",
      "   -3.7726 if \n",
      "   +6.0817 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   +0.0000 if cp>=0.001480318093672411 & cv>=0.04960751309990884 & pa>=-0.05005654245615006\n",
      "   +0.0000 if cp>=0.012437111325562002 & cv<=-0.009875047951936715 & pav<=-0.29916530251502976\n",
      "   +2.8287 if cp<=-0.01555599421262741 & cp>=-0.027320092916488646 & cv>=0.15564769208431245 & pav>=-0.4505378305912018\n",
      "Run episode 524 with rewards 46.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 525 ===========\n",
      "39 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0]\n",
      "   +1.6885 if cp>=-0.00777187906205653\n",
      "   -1.7945 if cp<=0.019582501053810125 & cp>=-0.010461837612092495 & cv<=0.04960751309990884 & pa>=-0.14058155417442322\n",
      "   -8.6139 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   -1.7887 if cv<=-0.024858080595731732\n",
      "   +3.0156 if cv>=-0.10684785991907067 & pa<=-0.11931860446929932 & pav>=-0.4177037179470062\n",
      "--------------\n",
      "   -3.3844 if \n",
      "   +5.5370 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   -0.0000 if cp>=0.012437111325562002 & cv<=-0.009875047951936715 & pav<=-0.29916530251502976\n",
      "   -0.0000 if cp<=-0.01555599421262741 & cp>=-0.027320092916488646 & cv>=0.15564769208431245 & pav>=-0.4505378305912018\n",
      "   -1.8846 if cp>=0.010045910254120854 & pa<=-0.11931860446929932 & pav>=-0.4177037179470062\n",
      "Run episode 525 with rewards 39.0\n",
      "============ 526 ===========\n",
      "36 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1]\n",
      "   -1.2053 if cp<=0.019582501053810125 & cp>=-0.010461837612092495 & cv<=0.04960751309990884 & pa>=-0.14058155417442322\n",
      "   -6.1207 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   -1.1674 if cv<=-0.024858080595731732\n",
      "   +3.7472 if cv>=-0.10684785991907067 & pa<=-0.11931860446929932 & pav>=-0.4177037179470062\n",
      "   +2.4824 if cv>=-0.13155211061239241 & pav<=-0.40680339932441706\n",
      "--------------\n",
      "   -4.7784 if \n",
      "   +5.5046 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   +0.0014 if cp<=-0.01555599421262741 & cp>=-0.027320092916488646 & cv>=0.15564769208431245 & pav>=-0.4505378305912018\n",
      "   -3.8275 if cp>=0.010045910254120854 & pa<=-0.11931860446929932 & pav>=-0.4177037179470062\n",
      "   +1.7564 if pav>=-0.40680339932441706\n",
      "Run episode 526 with rewards 36.0\n",
      "============ 527 ===========\n",
      "29 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0]\n",
      "   -1.8874 if cp<=0.019582501053810125 & cp>=-0.010461837612092495 & cv<=0.04960751309990884 & pa>=-0.14058155417442322\n",
      "   -3.1658 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   +0.7491 if cv>=-0.10684785991907067 & pa<=-0.11931860446929932 & pav>=-0.4177037179470062\n",
      "   +1.3371 if cv>=-0.13155211061239241 & pav<=-0.40680339932441706\n",
      "   -3.0554 if pa>=-0.12005524337291718 & pav<=-0.1270468831062317 & pav>=-0.28179323673248274\n",
      "--------------\n",
      "   -2.9107 if \n",
      "   +4.7904 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   -3.6489 if cp>=0.010045910254120854 & pa<=-0.11931860446929932 & pav>=-0.4177037179470062\n",
      "   +0.7436 if pav>=-0.40680339932441706\n",
      "   -1.6998 if pav<=-0.37573719024658203 & pav>=-0.37573719024658203\n",
      "Run episode 527 with rewards 29.0\n",
      "============ 528 ===========\n",
      "38 actions [1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1]\n",
      "   -1.4649 if cp<=0.019582501053810125 & cp>=-0.010461837612092495 & cv<=0.04960751309990884 & pa>=-0.14058155417442322\n",
      "   -2.7232 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   +2.3094 if cv>=-0.13155211061239241 & pav<=-0.40680339932441706\n",
      "   -0.1297 if pa>=-0.12005524337291718 & pav<=-0.1270468831062317 & pav>=-0.28179323673248274\n",
      "   +1.6090 if cp>=0.016003631055355072\n",
      "--------------\n",
      "   -3.0529 if \n",
      "   +5.0053 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   -3.7720 if cp>=0.010045910254120854 & pa<=-0.11931860446929932 & pav>=-0.4177037179470062\n",
      "   -0.0000 if pav<=-0.37573719024658203 & pav>=-0.37573719024658203\n",
      "   +1.7897 if pa>=-0.009864386171102524\n",
      "Run episode 528 with rewards 38.0\n",
      "============ 529 ===========\n",
      "26 actions [1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0]\n",
      "   -2.2247 if cp<=0.019582501053810125 & cp>=-0.010461837612092495 & cv<=0.04960751309990884 & pa>=-0.14058155417442322\n",
      "   -0.9603 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   +2.2997 if cv>=-0.13155211061239241 & pav<=-0.40680339932441706\n",
      "   +0.0383 if cp>=0.016003631055355072\n",
      "   -4.9807 if cp>=0.02352438606321812 & pa>=-0.07041605859994886 & pav>=-0.3676524877548218\n",
      "--------------\n",
      "   -3.1885 if \n",
      "   +8.0804 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   -0.0000 if cp>=0.010045910254120854 & pa<=-0.11931860446929932 & pav>=-0.4177037179470062\n",
      "   -0.0000 if pa>=-0.009864386171102524\n",
      "   +4.9340 if cp>=0.02352438606321812 & pa>=-0.07041605859994886 & pav>=-0.3676524877548218\n",
      "Run episode 529 with rewards 26.0\n",
      "============ 530 ===========\n",
      "22 actions [1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0]\n",
      "   -0.2929 if cp<=0.019582501053810125 & cp>=-0.010461837612092495 & cv<=0.04960751309990884 & pa>=-0.14058155417442322\n",
      "   -1.1752 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   +1.9732 if cv>=-0.13155211061239241 & pav<=-0.40680339932441706\n",
      "   +0.0000 if cp>=0.02352438606321812 & pa>=-0.07041605859994886 & pav>=-0.3676524877548218\n",
      "   +0.3015 if pa>=-0.14173828065395355 & pav>=-0.41148310899734497\n",
      "--------------\n",
      "   -2.2816 if \n",
      "   +5.6195 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   -0.1855 if cp>=0.010045910254120854 & pa<=-0.11931860446929932 & pav>=-0.4177037179470062\n",
      "   -0.0000 if cp>=0.02352438606321812 & pa>=-0.07041605859994886 & pav>=-0.3676524877548218\n",
      "   -1.0599 if pav<=-0.41148310899734497\n",
      "Run episode 530 with rewards 22.0\n",
      "============ 531 ===========\n",
      "28 actions [1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0]\n",
      "   +2.0142 if cp<=0.019582501053810125 & cp>=-0.010461837612092495 & cv<=0.04960751309990884 & pa>=-0.14058155417442322\n",
      "   -1.3924 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   +1.5534 if cv>=-0.13155211061239241 & pav<=-0.40680339932441706\n",
      "   +0.4147 if pa>=-0.14173828065395355 & pav>=-0.41148310899734497\n",
      "   -2.0105 if pav>=0.122157983481884\n",
      "--------------\n",
      "   -1.7151 if \n",
      "   +4.9758 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   +0.0000 if cp>=0.010045910254120854 & pa<=-0.11931860446929932 & pav>=-0.4177037179470062\n",
      "   -1.2422 if pav<=-0.41148310899734497\n",
      "   -5.2060 if cp>=0.0022633814252913 & cv>=-0.20899319648742676 & pa>=-0.10059787780046463\n",
      "Run episode 531 with rewards 28.0\n",
      "============ 532 ===========\n",
      "24 actions [1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0]\n",
      "   +3.3894 if cp<=0.019582501053810125 & cp>=-0.010461837612092495 & cv<=0.04960751309990884 & pa>=-0.14058155417442322\n",
      "   -4.5557 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   +1.6000 if cv>=-0.13155211061239241 & pav<=-0.40680339932441706\n",
      "   -3.6944 if pav>=0.122157983481884\n",
      "   -3.2244 if pa>=-0.04911992698907852\n",
      "--------------\n",
      "   -0.7147 if \n",
      "   +3.2666 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   -1.7692 if pav<=-0.41148310899734497\n",
      "   -2.1450 if cp>=0.0022633814252913 & cv>=-0.20899319648742676 & pa>=-0.10059787780046463\n",
      "   +3.0356 if pa>=-0.04911992698907852\n",
      "Run episode 532 with rewards 24.0\n",
      "============ 533 ===========\n",
      "30 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1]\n",
      "   -0.0045 if cp<=0.019582501053810125 & cp>=-0.010461837612092495 & cv<=0.04960751309990884 & pa>=-0.14058155417442322\n",
      "   -6.1043 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   -1.9423 if pav>=0.122157983481884\n",
      "   -0.0088 if pa>=-0.04911992698907852\n",
      "   +1.5877 if cp>=0.062418568134307864 & pa>=-0.18463978469371795 & pav<=-0.17864483594894395\n",
      "--------------\n",
      "   +0.8112 if cp<=0.02766814008355141 & pav>=-0.37035724520683266\n",
      "   -2.5267 if pav<=-0.41148310899734497\n",
      "   -1.6219 if cp>=0.0022633814252913 & cv>=-0.20899319648742676 & pa>=-0.10059787780046463\n",
      "   +0.8112 if pa>=-0.04911992698907852\n",
      "   -1.8958 if cp>=0.08987121284008026\n",
      "Run episode 533 with rewards 30.0\n",
      "============ 534 ===========\n",
      "22 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]\n",
      "   -5.3433 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   -3.6416 if pav>=0.122157983481884\n",
      "   +1.7381 if pa>=-0.04911992698907852\n",
      "   +2.4158 if cp>=0.062418568134307864 & pa>=-0.18463978469371795 & pav<=-0.17864483594894395\n",
      "   +2.0686 if cp>=0.04887635484337808 & cv<=0.0037318736314773653\n",
      "--------------\n",
      "   -1.2300 if pav<=-0.41148310899734497\n",
      "   -1.8258 if cp>=0.0022633814252913 & cv>=-0.20899319648742676 & pa>=-0.10059787780046463\n",
      "   -1.6141 if pa>=-0.04911992698907852\n",
      "   -0.0000 if cp>=0.08987121284008026\n",
      "   -1.7722 if cp>=0.04887635484337808\n",
      "Run episode 534 with rewards 22.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 535 ===========\n",
      "20 actions [1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0]\n",
      "   -5.8263 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   -0.6032 if pav>=0.122157983481884\n",
      "   -0.0000 if cp>=0.062418568134307864 & pa>=-0.18463978469371795 & pav<=-0.17864483594894395\n",
      "   +2.8836 if cp>=0.04887635484337808 & cv<=0.0037318736314773653\n",
      "   +4.2911 if cp>=0.03794880956411362 & cv<=0.18794735074043273 & cv>=0.10957186222076444\n",
      "--------------\n",
      "   -1.7722 if pav<=-0.41148310899734497\n",
      "   +0.7877 if cp>=0.0022633814252913 & cv>=-0.20899319648742676 & pa>=-0.10059787780046463\n",
      "   -1.8590 if pa>=-0.04911992698907852\n",
      "   -2.9013 if cp>=0.04887635484337808\n",
      "   -4.4077 if cp>=0.03794880956411362 & cv<=0.18794735074043273 & cv>=0.10957186222076444\n",
      "Run episode 535 with rewards 20.0\n",
      "============ 536 ===========\n",
      "29 actions [0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1]\n",
      "   -5.3161 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   -0.0000 if pav>=0.122157983481884\n",
      "   -0.0000 if cp>=0.04887635484337808 & cv<=0.0037318736314773653\n",
      "   -0.0000 if cp>=0.03794880956411362 & cv<=0.18794735074043273 & cv>=0.10957186222076444\n",
      "   +2.1750 if cp<=0.0071456166915595636 & cv>=0.2361815243959427\n",
      "--------------\n",
      "   -3.9889 if pav<=-0.41148310899734497\n",
      "   +0.2394 if pa>=-0.04911992698907852\n",
      "   -0.0000 if cp>=0.04887635484337808\n",
      "   -0.0000 if cp>=0.03794880956411362 & cv<=0.18794735074043273 & cv>=0.10957186222076444\n",
      "   +1.4983 if cp>=0.017335234209895134\n",
      "Run episode 536 with rewards 29.0\n",
      "============ 537 ===========\n",
      "30 actions [1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0]\n",
      "   -3.6983 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   +0.0000 if cp>=0.04887635484337808 & cv<=0.0037318736314773653\n",
      "   +0.0000 if cp>=0.03794880956411362 & cv<=0.18794735074043273 & cv>=0.10957186222076444\n",
      "   +0.9398 if cp<=0.0071456166915595636 & cv>=0.2361815243959427\n",
      "   -2.9224 if pav>=0.5672976970672607\n",
      "--------------\n",
      "   -5.3172 if pav<=-0.41148310899734497\n",
      "   -0.0740 if pa>=-0.04911992698907852\n",
      "   +0.0000 if cp>=0.03794880956411362 & cv<=0.18794735074043273 & cv>=0.10957186222076444\n",
      "   +1.8880 if cp>=0.017335234209895134\n",
      "   +3.1557 if pav>=0.5672976970672607\n",
      "Run episode 537 with rewards 30.0\n",
      "============ 538 ===========\n",
      "30 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -3.2600 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   +0.0000 if cp>=0.03794880956411362 & cv<=0.18794735074043273 & cv>=0.10957186222076444\n",
      "   +0.0000 if cp<=0.0071456166915595636 & cv>=0.2361815243959427\n",
      "   +0.0000 if pav>=0.5672976970672607\n",
      "   -5.7007 if cv>=0.43804454803466797 & pav>=-0.5946303367614746\n",
      "--------------\n",
      "   -4.9490 if pav<=-0.41148310899734497\n",
      "   +0.7776 if pa>=-0.04911992698907852\n",
      "   +0.6184 if cp>=0.017335234209895134\n",
      "   -0.0000 if pav>=0.5672976970672607\n",
      "   +5.7425 if cp>=0.07845514267683029 & cv>=0.43804454803466797 & pav>=-0.5946303367614746\n",
      "Run episode 538 with rewards 30.0\n",
      "============ 539 ===========\n",
      "24 actions [1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0]\n",
      "   -4.1021 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   +1.0690 if cp<=0.0071456166915595636 & cv>=0.2361815243959427\n",
      "   +0.0000 if pav>=0.5672976970672607\n",
      "   +0.0000 if cv>=0.43804454803466797 & pav>=-0.5946303367614746\n",
      "   +2.5684 if cp>=0.07118642330169678\n",
      "--------------\n",
      "   -5.6244 if pav<=-0.41148310899734497\n",
      "   +1.1719 if pa>=-0.04911992698907852\n",
      "   +1.0671 if cp>=0.017335234209895134\n",
      "   -0.0000 if cp>=0.07845514267683029 & cv>=0.43804454803466797 & pav>=-0.5946303367614746\n",
      "   -2.8837 if cp>=0.07118642330169678\n",
      "Run episode 539 with rewards 24.0\n",
      "============ 540 ===========\n",
      "25 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0]\n",
      "   -4.0206 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   +0.7032 if cp<=0.0071456166915595636 & cv>=0.2361815243959427\n",
      "   -0.0000 if cv>=0.43804454803466797 & pav>=-0.5946303367614746\n",
      "   -0.0000 if cp>=0.07118642330169678\n",
      "   +2.7220 if cp<=0.008678823150694376 & pav<=-0.36146447062492365 & pav>=-0.46016164422035216\n",
      "--------------\n",
      "   -2.2739 if pav<=-0.41148310899734497\n",
      "   +0.8473 if pa>=-0.04911992698907852\n",
      "   +1.5369 if cp>=0.017335234209895134\n",
      "   +0.0000 if cp>=0.07118642330169678\n",
      "   -3.0514 if pav<=-0.36146447062492365\n",
      "Run episode 540 with rewards 25.0\n",
      "============ 541 ===========\n",
      "50 actions [1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0]\n",
      "   -3.7306 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   +0.0000 if cp<=0.0071456166915595636 & cv>=0.2361815243959427\n",
      "   +1.4413 if cp>=0.07118642330169678\n",
      "   +0.0000 if cp<=0.008678823150694376 & pav<=-0.36146447062492365 & pav>=-0.46016164422035216\n",
      "   -1.6596 if cp>=0.08964531868696213\n",
      "--------------\n",
      "   -1.7373 if pav<=-0.41148310899734497\n",
      "   +0.8550 if pa>=-0.04911992698907852\n",
      "   +0.0728 if cp>=0.017335234209895134\n",
      "   -3.9745 if pav<=-0.36146447062492365\n",
      "   +1.6729 if cp>=0.08964531868696213\n",
      "Run episode 541 with rewards 50.0\n",
      "============ 542 ===========\n",
      "36 actions [1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0]\n",
      "   -4.3198 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   +0.0000 if cp>=0.07118642330169678\n",
      "   +0.3188 if cp<=0.008678823150694376 & pav<=-0.36146447062492365 & pav>=-0.46016164422035216\n",
      "   +0.0000 if cp>=0.08964531868696213\n",
      "   -4.1255 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "--------------\n",
      "   -3.2372 if pav<=-0.41148310899734497\n",
      "   +3.0680 if pa>=-0.04911992698907852\n",
      "   -4.8015 if pav<=-0.36146447062492365\n",
      "   +0.0000 if cp>=0.08964531868696213\n",
      "   +4.2981 if cp>=0.013436807692050946 & pa>=-0.09517753571271895 & pav>=-0.19049062430858604\n",
      "Run episode 542 with rewards 36.0\n",
      "============ 543 ===========\n",
      "66 actions [1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0]\n",
      "   -5.6627 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   +3.7458 if cp<=0.008678823150694376 & pav<=-0.36146447062492365 & pav>=-0.46016164422035216\n",
      "   +0.0000 if cp>=0.08964531868696213\n",
      "   -2.8748 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   +5.5850 if cp>=-0.024115147069096565 & cv>=0.017739456146955504 & pa>=-0.05935828387737274\n",
      "--------------\n",
      "   -1.6712 if pav<=-0.41148310899734497\n",
      "   +0.7949 if pa>=-0.04911992698907852\n",
      "   -4.4498 if pav<=-0.36146447062492365\n",
      "   +0.0000 if cp>=0.013436807692050946 & pa>=-0.09517753571271895 & pav>=-0.19049062430858604\n",
      "   -4.2755 if cp>=-0.024115147069096565 & cv>=0.017739456146955504 & pa>=-0.05935828387737274\n",
      "Run episode 543 with rewards 66.0\n",
      "============ 544 ===========\n",
      "32 actions [1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1]\n",
      "   -2.5849 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   +0.8614 if cp<=0.008678823150694376 & pav<=-0.36146447062492365 & pav>=-0.46016164422035216\n",
      "   -4.9128 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   +2.4105 if cp>=-0.024115147069096565 & cv>=0.017739456146955504 & pa>=-0.05935828387737274\n",
      "   +3.6651 if cp>=-0.015427916310727596\n",
      "--------------\n",
      "   -3.1129 if pav<=-0.41148310899734497\n",
      "   +1.6482 if pa>=-0.04911992698907852\n",
      "   -3.2625 if pav<=-0.36146447062492365\n",
      "   -3.7324 if cp>=-0.024115147069096565 & cv>=0.017739456146955504 & pa>=-0.05935828387737274\n",
      "   -3.6651 if cp>=-0.015427916310727596\n",
      "Run episode 544 with rewards 32.0\n",
      "============ 545 ===========\n",
      "13 actions [0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1]\n",
      "   -2.0481 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   -2.4129 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   +1.7508 if cp>=-0.024115147069096565 & cv>=0.017739456146955504 & pa>=-0.05935828387737274\n",
      "   +6.2727 if cp>=-0.015427916310727596\n",
      "   -3.6846 if cp>=-0.019593695923686028 & pav>=-0.26002068519592286\n",
      "--------------\n",
      "   -1.0051 if pav<=-0.41148310899734497\n",
      "   -2.4546 if pav<=-0.36146447062492365\n",
      "   -1.9347 if cp>=-0.024115147069096565 & cv>=0.017739456146955504 & pa>=-0.05935828387737274\n",
      "   -6.4283 if cp>=-0.015427916310727596\n",
      "   +3.6447 if cp>=-0.019593695923686028 & pav>=-0.26002068519592286\n",
      "Run episode 545 with rewards 13.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 546 ===========\n",
      "13 actions [0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cv>=-0.009875047951936715 & pav>=-0.38328475952148433\n",
      "   -2.4862 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   +0.4251 if cp>=-0.015427916310727596\n",
      "   -0.0133 if cp>=-0.019593695923686028 & pav>=-0.26002068519592286\n",
      "   +2.1768 if cp>=-0.037626151740550985\n",
      "--------------\n",
      "   +0.0000 if pav<=-0.36146447062492365\n",
      "   +0.0000 if cp>=-0.024115147069096565 & cv>=0.017739456146955504 & pa>=-0.05935828387737274\n",
      "   -0.4762 if cp>=-0.015427916310727596\n",
      "   -0.0094 if cp>=-0.019593695923686028 & pav>=-0.26002068519592286\n",
      "   -2.1845 if cp>=-0.037626151740550985\n",
      "Run episode 546 with rewards 13.0\n",
      "============ 547 ===========\n",
      "14 actions [0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1]\n",
      "   -3.0780 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   -1.0964 if cp>=-0.015427916310727596\n",
      "   -1.0964 if cp>=-0.019593695923686028 & pav>=-0.26002068519592286\n",
      "   +1.8496 if cp>=-0.037626151740550985\n",
      "   +0.9591 if cp>=-0.09162965416908264\n",
      "--------------\n",
      "   +0.0000 if pav<=-0.36146447062492365\n",
      "   +1.1827 if cp>=-0.015427916310727596\n",
      "   +1.1827 if cp>=-0.019593695923686028 & pav>=-0.26002068519592286\n",
      "   -2.0996 if cp>=-0.037626151740550985\n",
      "   -4.1500 if cv>=-0.5487690806388853\n",
      "Run episode 547 with rewards 14.0\n",
      "============ 548 ===========\n",
      "13 actions [0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +1.9091 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   -0.0000 if cp>=-0.015427916310727596\n",
      "   +0.1236 if cp>=-0.019593695923686028 & pav>=-0.26002068519592286\n",
      "   +1.1430 if cp>=-0.037626151740550985\n",
      "   -4.0688 if cv<=-0.751824676990509\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.015427916310727596\n",
      "   -0.4133 if cp>=-0.019593695923686028 & pav>=-0.26002068519592286\n",
      "   -1.0531 if cp>=-0.037626151740550985\n",
      "   -1.9438 if cv>=-0.5487690806388853\n",
      "   -3.7416 if cp>=-0.0592588499188423 & cv<=-0.5635031700134278 & cv>=-0.751824676990509\n",
      "Run episode 548 with rewards 13.0\n",
      "============ 549 ===========\n",
      "15 actions [1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0]\n",
      "   +2.1593 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   +0.6631 if cp>=-0.019593695923686028 & pav>=-0.26002068519592286\n",
      "   +0.8435 if cp>=-0.037626151740550985\n",
      "   +0.6760 if cv<=-0.751824676990509\n",
      "   -4.7269 if cp>=-0.12576246559619902 & cv<=-0.8223621726036072\n",
      "--------------\n",
      "   -0.3012 if cp>=-0.019593695923686028 & pav>=-0.26002068519592286\n",
      "   -2.9015 if cp>=-0.037626151740550985\n",
      "   -0.3012 if cv>=-0.5487690806388853\n",
      "   -0.0233 if cp>=-0.0592588499188423 & cv<=-0.5635031700134278 & cv>=-0.751824676990509\n",
      "   -0.9395 if cv>=-0.6313811659812927\n",
      "Run episode 549 with rewards 15.0\n",
      "============ 550 ===========\n",
      "18 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0]\n",
      "   +1.3287 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   -0.0000 if cp>=-0.037626151740550985\n",
      "   -0.3112 if cv<=-0.751824676990509\n",
      "   -2.2032 if cp>=-0.12576246559619902 & cv<=-0.8223621726036072\n",
      "   -3.2496 if cv<=-0.4027028322219849 & pa<=-0.014950125291943549\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.019593695923686028 & pav>=-0.26002068519592286\n",
      "   +0.0000 if cp>=-0.037626151740550985\n",
      "   +1.6757 if cv>=-0.5487690806388853\n",
      "   -0.0515 if cv>=-0.6313811659812927\n",
      "   -2.8478 if cv>=-0.4027028322219849\n",
      "Run episode 550 with rewards 18.0\n",
      "============ 551 ===========\n",
      "14 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.0000 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   +0.0000 if cv<=-0.751824676990509\n",
      "   +0.0000 if cp>=-0.12576246559619902 & cv<=-0.8223621726036072\n",
      "   -0.0000 if cv<=-0.4027028322219849 & pa<=-0.014950125291943549\n",
      "   +3.0303 if cp>=-0.10472514629364013 & cv>=-0.25245015025138856\n",
      "--------------\n",
      "   +0.0000 if cp>=-0.037626151740550985\n",
      "   +1.3843 if cv>=-0.5487690806388853\n",
      "   +1.3843 if cv>=-0.6313811659812927\n",
      "   -6.0144 if cv>=-0.4027028322219849\n",
      "   +1.1993 if cp<=-0.08234153240919112\n",
      "Run episode 551 with rewards 14.0\n",
      "============ 552 ===========\n",
      "18 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1]\n",
      "   -2.0205 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   +0.0000 if cp>=-0.12576246559619902 & cv<=-0.8223621726036072\n",
      "   +0.0000 if cv<=-0.4027028322219849 & pa<=-0.014950125291943549\n",
      "   +0.4541 if cp>=-0.10472514629364013 & cv>=-0.25245015025138856\n",
      "   +1.3287 if cv>=-0.3799165904521942\n",
      "--------------\n",
      "   -2.9251 if cv>=-0.5487690806388853\n",
      "   +2.4081 if cv>=-0.6313811659812927\n",
      "   -2.9251 if cv>=-0.4027028322219849\n",
      "   +0.0902 if cp<=-0.08234153240919112\n",
      "   +0.2503 if cv<=-0.5740789890289306\n",
      "Run episode 552 with rewards 18.0\n",
      "============ 553 ===========\n",
      "18 actions [0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0]\n",
      "   -1.6164 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   +0.0000 if cp>=-0.12576246559619902 & cv<=-0.8223621726036072\n",
      "   +0.6338 if cp>=-0.10472514629364013 & cv>=-0.25245015025138856\n",
      "   +0.8999 if cv>=-0.3799165904521942\n",
      "   +1.5071 if cp<=-0.10264502167701721 & cp>=-0.1288241595029831 & cv<=-0.40347102880477903 & cv>=-0.41322424411773684\n",
      "--------------\n",
      "   -0.9668 if cv>=-0.5487690806388853\n",
      "   +0.6514 if cv>=-0.6313811659812927\n",
      "   -3.3223 if cv>=-0.4027028322219849\n",
      "   +1.6183 if cv<=-0.5740789890289306\n",
      "   -1.5709 if cp<=-0.10264502167701721 & cp>=-0.1288241595029831 & cv<=-0.40347102880477903 & cv>=-0.41322424411773684\n",
      "Run episode 553 with rewards 18.0\n",
      "============ 554 ===========\n",
      "13 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1]\n",
      "   -1.7107 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   +0.7994 if cp>=-0.10472514629364013 & cv>=-0.25245015025138856\n",
      "   +0.7543 if cv>=-0.3799165904521942\n",
      "   -0.0000 if cp<=-0.10264502167701721 & cp>=-0.1288241595029831 & cv<=-0.40347102880477903 & cv>=-0.41322424411773684\n",
      "   -2.9106 if cp>=0.01348829977214337 & cv<=-0.4179383933544159\n",
      "--------------\n",
      "   -1.6459 if cv>=-0.5487690806388853\n",
      "   -1.3987 if cv>=-0.4027028322219849\n",
      "   +2.1368 if cv<=-0.5740789890289306\n",
      "   +0.0000 if cp<=-0.10264502167701721 & cp>=-0.1288241595029831 & cv<=-0.40347102880477903 & cv>=-0.41322424411773684\n",
      "   +3.9178 if cp>=0.01348829977214337 & cv<=-0.4179383933544159\n",
      "Run episode 554 with rewards 13.0\n",
      "============ 555 ===========\n",
      "13 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -0.7630 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   +0.7169 if cp>=-0.10472514629364013 & cv>=-0.25245015025138856\n",
      "   +0.7169 if cv>=-0.3799165904521942\n",
      "   -0.0429 if cp>=0.01348829977214337 & cv<=-0.4179383933544159\n",
      "   +4.3759 if pa>=0.19839505851268768\n",
      "--------------\n",
      "   -4.8425 if cv>=-0.5487690806388853\n",
      "   -0.4382 if cv>=-0.4027028322219849\n",
      "   +0.9950 if cv<=-0.5740789890289306\n",
      "   +0.1303 if cp>=0.01348829977214337 & cv<=-0.4179383933544159\n",
      "   -4.3861 if pa>=0.19839505851268768\n",
      "Run episode 555 with rewards 13.0\n",
      "============ 556 ===========\n",
      "15 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -2.1777 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   +0.2120 if cp>=-0.10472514629364013 & cv>=-0.25245015025138856\n",
      "   +0.2120 if cv>=-0.3799165904521942\n",
      "   -0.0004 if pa>=0.19839505851268768\n",
      "   -0.0935 if cp<=-0.07672685980796813 & cv<=-0.6172473788261413\n",
      "--------------\n",
      "   -3.2355 if cv>=-0.5487690806388853\n",
      "   -0.3993 if cv>=-0.4027028322219849\n",
      "   +2.3362 if cv<=-0.5740789890289306\n",
      "   +0.0022 if pa>=0.19839505851268768\n",
      "   +0.0997 if cp<=-0.07672685980796813 & cv<=-0.6172473788261413\n",
      "Run episode 556 with rewards 15.0\n",
      "============ 557 ===========\n",
      "14 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1]\n",
      "   -1.5946 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   +0.3779 if cp>=-0.10472514629364013 & cv>=-0.25245015025138856\n",
      "   +0.3779 if cv>=-0.3799165904521942\n",
      "   -0.0395 if cp<=-0.07672685980796813 & cv<=-0.6172473788261413\n",
      "   +0.9000 if cp>=-0.05364058390259742\n",
      "--------------\n",
      "   -2.3795 if cv>=-0.5487690806388853\n",
      "   -0.4544 if cv>=-0.4027028322219849\n",
      "   +1.6924 if cv<=-0.5740789890289306\n",
      "   +0.0421 if cp<=-0.07672685980796813 & cv<=-0.6172473788261413\n",
      "   -1.8471 if cv>=-0.42066980600357057\n",
      "Run episode 557 with rewards 14.0\n",
      "============ 558 ===========\n",
      "16 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0]\n",
      "   +0.1366 if cv<=-0.5637408256530761 & pav>=-0.004294549860060111\n",
      "   +0.3689 if cp>=-0.10472514629364013 & cv>=-0.25245015025138856\n",
      "   +0.3689 if cv>=-0.3799165904521942\n",
      "   -0.1861 if cp>=-0.05364058390259742\n",
      "   +9.1720 if cp<=-0.028132556006312367 & cv<=-0.6323006510734558\n",
      "--------------\n",
      "   -2.6837 if cv>=-0.5487690806388853\n",
      "   -0.4026 if cv>=-0.4027028322219849\n",
      "   +1.6612 if cv<=-0.5740789890289306\n",
      "   -0.4026 if cv>=-0.42066980600357057\n",
      "   -3.2576 if cp<=-0.028132556006312367 & cp>=-0.058773454278707504 & cv<=-0.6323006510734558\n",
      "Run episode 558 with rewards 16.0\n",
      "============ 559 ===========\n",
      "15 actions [0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1]\n",
      "   +0.7627 if cp>=-0.10472514629364013 & cv>=-0.25245015025138856\n",
      "   +0.7627 if cv>=-0.3799165904521942\n",
      "   -0.3632 if cp>=-0.05364058390259742\n",
      "   -3.2152 if cp<=-0.028132556006312367 & cv<=-0.6323006510734558\n",
      "   -9.2670 if pa>=0.19010968506336212\n",
      "--------------\n",
      "   -3.8790 if cv>=-0.5487690806388853\n",
      "   +2.6548 if cv<=-0.5740789890289306\n",
      "   -0.5499 if cv>=-0.42066980600357057\n",
      "   -0.0000 if cp<=-0.028132556006312367 & cp>=-0.058773454278707504 & cv<=-0.6323006510734558\n",
      "   +1.0755 if cv<=-0.4363577663898468 & cv>=-0.6303159594535828\n",
      "Run episode 559 with rewards 15.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 560 ===========\n",
      "15 actions [0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.3163 if cp>=-0.10472514629364013 & cv>=-0.25245015025138856\n",
      "   +0.7317 if cv>=-0.3799165904521942\n",
      "   -0.9023 if cp<=-0.028132556006312367 & cv<=-0.6323006510734558\n",
      "   +4.3590 if pa>=0.19010968506336212\n",
      "   +1.5205 if cv<=-0.3822151839733124 & cv>=-0.567147719860077\n",
      "--------------\n",
      "   -1.7863 if cv>=-0.5487690806388853\n",
      "   -0.1463 if cv<=-0.5740789890289306\n",
      "   -1.7863 if cv>=-0.42066980600357057\n",
      "   -0.4321 if cv<=-0.4363577663898468 & cv>=-0.6303159594535828\n",
      "   +2.3072 if cp<=-0.07542093992233274 & cp>=-0.10174219012260437 & cv<=-0.567147719860077\n",
      "Run episode 560 with rewards 15.0\n",
      "============ 561 ===========\n",
      "15 actions [0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1]\n",
      "   +1.8669 if cv>=-0.3799165904521942\n",
      "   -2.1125 if cp<=-0.028132556006312367 & cv<=-0.6323006510734558\n",
      "   -0.1326 if pa>=0.19010968506336212\n",
      "   +3.1929 if cv<=-0.3822151839733124 & cv>=-0.567147719860077\n",
      "   -1.7697 if cv>=-0.6228690624237061\n",
      "--------------\n",
      "   -3.4364 if cv>=-0.5487690806388853\n",
      "   -1.0967 if cv>=-0.42066980600357057\n",
      "   +0.2606 if cv<=-0.4363577663898468 & cv>=-0.6303159594535828\n",
      "   +1.8278 if cp<=-0.07542093992233274 & cp>=-0.10174219012260437 & cv<=-0.567147719860077\n",
      "   +1.3686 if cv>=-0.6228690624237061\n",
      "Run episode 561 with rewards 15.0\n",
      "============ 562 ===========\n",
      "14 actions [0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +0.2763 if cv>=-0.3799165904521942\n",
      "   -1.6867 if cp<=-0.028132556006312367 & cv<=-0.6323006510734558\n",
      "   +2.2712 if cv<=-0.3822151839733124 & cv>=-0.567147719860077\n",
      "   +2.5476 if cv>=-0.6228690624237061\n",
      "   -1.4996 if cv<=-0.5510812044143677\n",
      "--------------\n",
      "   -0.9996 if cv>=-0.5487690806388853\n",
      "   -0.9996 if cv>=-0.42066980600357057\n",
      "   +0.9052 if cp<=-0.07542093992233274 & cp>=-0.10174219012260437 & cv<=-0.567147719860077\n",
      "   -0.6731 if cv>=-0.6228690624237061\n",
      "   -1.9263 if cv>=-0.5510812044143677\n",
      "Run episode 562 with rewards 14.0\n",
      "============ 563 ===========\n",
      "11 actions [0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0]\n",
      "   -0.9235 if cp<=-0.028132556006312367 & cv<=-0.6323006510734558\n",
      "   +0.0015 if cv<=-0.3822151839733124 & cv>=-0.567147719860077\n",
      "   +5.2152 if cv>=-0.6228690624237061\n",
      "   -1.6973 if cv<=-0.5510812044143677\n",
      "   +5.4306 if pa>=0.20458000898361206\n",
      "--------------\n",
      "   -0.3909 if cv>=-0.5487690806388853\n",
      "   -0.3909 if cv>=-0.42066980600357057\n",
      "   -4.1352 if cp<=-0.07542093992233274 & cp>=-0.10174219012260437 & cv<=-0.567147719860077\n",
      "   -0.3909 if cv>=-0.5510812044143677\n",
      "   -1.2299 if cv>=-0.7991953253746032\n",
      "Run episode 563 with rewards 11.0\n",
      "============ 564 ===========\n",
      "13 actions [1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0]\n",
      "   -7.4145 if cp<=-0.028132556006312367 & cv<=-0.6323006510734558\n",
      "   +2.3583 if cv>=-0.6228690624237061\n",
      "   -7.1638 if cv<=-0.5510812044143677\n",
      "   +1.7597 if pa>=0.20458000898361206\n",
      "   +1.0000 if cp>=-0.0802658274769783 & cv<=-0.7389729619026184\n",
      "--------------\n",
      "   -1.4706 if cv>=-0.42066980600357057\n",
      "   +3.4555 if cp<=-0.07542093992233274 & cp>=-0.10174219012260437 & cv<=-0.567147719860077\n",
      "   -2.9258 if cv>=-0.5510812044143677\n",
      "   -3.1911 if cv>=-0.7991953253746032\n",
      "   +8.4750 if \n",
      "Run episode 564 with rewards 13.0\n",
      "============ 565 ===========\n",
      "20 actions [0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1]\n",
      "   +0.0000 if cp<=-0.028132556006312367 & cv<=-0.6323006510734558\n",
      "   +1.4430 if cv>=-0.6228690624237061\n",
      "   -0.1386 if cv<=-0.5510812044143677\n",
      "   +0.0000 if pa>=0.20458000898361206\n",
      "   +2.7052 if cp>=0.01540307812392712\n",
      "--------------\n",
      "   +0.0000 if cp<=-0.07542093992233274 & cp>=-0.10174219012260437 & cv<=-0.567147719860077\n",
      "   +0.3913 if cv>=-0.5510812044143677\n",
      "   +0.3939 if cv>=-0.7991953253746032\n",
      "   +0.3939 if \n",
      "   +2.4282 if cv<=-0.5502384185791016\n",
      "Run episode 565 with rewards 20.0\n",
      "============ 566 ===========\n",
      "21 actions [0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1]\n",
      "   -0.0000 if cp<=-0.028132556006312367 & cv<=-0.6323006510734558\n",
      "   +0.9586 if cv>=-0.6228690624237061\n",
      "   -1.2603 if cv<=-0.5510812044143677\n",
      "   -0.0000 if cp>=0.01540307812392712\n",
      "   +3.8610 if cp>=-0.015105414018034922 & pav<=0.5829270958900452\n",
      "--------------\n",
      "   -1.7775 if cv>=-0.5510812044143677\n",
      "   +1.5464 if cv>=-0.7991953253746032\n",
      "   +1.5464 if \n",
      "   +3.3238 if cv<=-0.5502384185791016\n",
      "   -2.6140 if cp>=-0.015105414018034922 & cv<=-0.04402178898453712\n",
      "Run episode 566 with rewards 21.0\n",
      "============ 567 ===========\n",
      "16 actions [0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1]\n",
      "   +0.7226 if cv>=-0.6228690624237061\n",
      "   -1.4895 if cv<=-0.5510812044143677\n",
      "   +1.8192 if cp>=0.01540307812392712\n",
      "   +2.1297 if cp>=-0.015105414018034922 & pav<=0.5829270958900452\n",
      "   +3.0499 if cp<=0.021777350455522537 & cv>=-0.5368143320083618 & pa<=0.06500580906867981\n",
      "--------------\n",
      "   -2.1014 if cv>=-0.5510812044143677\n",
      "   +0.3692 if cv>=-0.7991953253746032\n",
      "   +2.4706 if cv<=-0.5502384185791016\n",
      "   -0.6438 if cp>=-0.015105414018034922 & cv<=-0.04402178898453712\n",
      "   +3.3407 if cp<=-0.028944363817572576\n",
      "Run episode 567 with rewards 16.0\n",
      "============ 568 ===========\n",
      "27 actions [0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0]\n",
      "   -0.4394 if cv<=-0.5510812044143677\n",
      "   +0.4234 if cp>=0.01540307812392712\n",
      "   +1.5296 if cp>=-0.015105414018034922 & pav<=0.5829270958900452\n",
      "   +1.3191 if cp<=0.021777350455522537 & cv>=-0.5368143320083618 & pa<=0.06500580906867981\n",
      "   +4.5211 if cv<=-0.603090763092041 & cv>=-0.603090763092041\n",
      "--------------\n",
      "   -2.8292 if cv>=-0.5510812044143677\n",
      "   -0.9220 if cv<=-0.5502384185791016\n",
      "   +1.6894 if cp>=-0.015105414018034922 & cv<=-0.04402178898453712\n",
      "   +3.9773 if cp<=-0.028944363817572576\n",
      "   +1.5781 if pa<=0.06492841243743896\n",
      "Run episode 568 with rewards 27.0\n",
      "============ 569 ===========\n",
      "20 actions [0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0]\n",
      "   -2.5804 if cv<=-0.5510812044143677\n",
      "   +4.1768 if cp>=-0.015105414018034922 & pav<=0.5829270958900452\n",
      "   +0.7085 if cp<=0.021777350455522537 & cv>=-0.5368143320083618 & pa<=0.06500580906867981\n",
      "   +0.0000 if cv<=-0.603090763092041 & cv>=-0.603090763092041\n",
      "   +6.9168 if pa<=0.03521315157413483 & pav>=0.8671541690826416\n",
      "--------------\n",
      "   -3.2038 if cv>=-0.5510812044143677\n",
      "   +0.3940 if cp>=-0.015105414018034922 & cv<=-0.04402178898453712\n",
      "   +3.1226 if cp<=-0.028944363817572576\n",
      "   -0.0103 if pa<=0.06492841243743896\n",
      "   +3.6804 if cp<=-0.040692998468875884 & cv<=0.02017902433872225 & cv>=-0.522035676240921 & pa>=0.12731001973152162\n",
      "Run episode 569 with rewards 20.0\n",
      "============ 570 ===========\n",
      "17 actions [0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -2.4492 if cv<=-0.5510812044143677\n",
      "   +1.2076 if cp>=-0.015105414018034922 & pav<=0.5829270958900452\n",
      "   +1.1539 if cp<=0.021777350455522537 & cv>=-0.5368143320083618 & pa<=0.06500580906867981\n",
      "   +3.0140 if pa<=0.03521315157413483 & pav>=0.8671541690826416\n",
      "   +2.4165 if cv<=-0.43731397986412046 & cv>=-0.6319775462150574\n",
      "--------------\n",
      "   -3.2933 if cv>=-0.5510812044143677\n",
      "   -0.2594 if cp>=-0.015105414018034922 & cv<=-0.04402178898453712\n",
      "   +1.2782 if cp<=-0.028944363817572576\n",
      "   +4.0251 if cp<=-0.040692998468875884 & cv<=0.02017902433872225 & cv>=-0.522035676240921 & pa>=0.12731001973152162\n",
      "   +1.6379 if cv>=-0.43731397986412046\n",
      "Run episode 570 with rewards 17.0\n",
      "============ 571 ===========\n",
      "15 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -1.9087 if cv<=-0.5510812044143677\n",
      "   +0.0000 if cp>=-0.015105414018034922 & pav<=0.5829270958900452\n",
      "   -0.5763 if pa<=0.03521315157413483 & pav>=0.8671541690826416\n",
      "   +1.8033 if cv<=-0.43731397986412046 & cv>=-0.6319775462150574\n",
      "   +3.4170 if cv>=-0.34476134181022644\n",
      "--------------\n",
      "   -3.3025 if cv>=-0.5510812044143677\n",
      "   -1.3745 if cp<=-0.028944363817572576\n",
      "   -0.0000 if cp<=-0.040692998468875884 & cv<=0.02017902433872225 & cv>=-0.522035676240921 & pa>=0.12731001973152162\n",
      "   +2.5971 if cv>=-0.43731397986412046\n",
      "   +4.5116 if cv<=-0.34476134181022644\n",
      "Run episode 571 with rewards 15.0\n",
      "============ 572 ===========\n",
      "20 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -0.0000 if cv<=-0.5510812044143677\n",
      "   -0.0000 if pa<=0.03521315157413483 & pav>=0.8671541690826416\n",
      "   -0.0000 if cv<=-0.43731397986412046 & cv>=-0.6319775462150574\n",
      "   +3.2148 if cv>=-0.34476134181022644\n",
      "   -0.5647 if cv<=-0.16249298453330993 & cv>=-0.3620862901210785\n",
      "--------------\n",
      "   +0.0854 if cv>=-0.5510812044143677\n",
      "   -0.2673 if cp<=-0.028944363817572576\n",
      "   +0.0854 if cv>=-0.43731397986412046\n",
      "   +3.2837 if cv<=-0.34476134181022644\n",
      "   -1.2128 if cv>=-0.16249298453330993\n",
      "Run episode 572 with rewards 20.0\n",
      "============ 573 ===========\n",
      "20 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.0000 if cv<=-0.5510812044143677\n",
      "   +0.0000 if cv<=-0.43731397986412046 & cv>=-0.6319775462150574\n",
      "   +3.1873 if cv>=-0.34476134181022644\n",
      "   +2.0939 if cv<=-0.16249298453330993 & cv>=-0.3620862901210785\n",
      "   -0.6401 if cv>=-0.36897230744361875\n",
      "--------------\n",
      "   -0.5232 if cv>=-0.5510812044143677\n",
      "   -0.5232 if cp<=-0.028944363817572576\n",
      "   +4.8125 if cv<=-0.34476134181022644\n",
      "   -0.4642 if cv>=-0.16249298453330993\n",
      "   -0.8032 if cp<=-0.08342123925685882 & cv>=-0.36441707611083984\n",
      "Run episode 573 with rewards 20.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 574 ===========\n",
      "24 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.0000 if cv<=-0.5510812044143677\n",
      "   +2.9897 if cv>=-0.34476134181022644\n",
      "   +0.1921 if cv<=-0.16249298453330993 & cv>=-0.3620862901210785\n",
      "   +1.0149 if cv>=-0.36897230744361875\n",
      "   -0.9443 if cp<=-0.026961584389209738 & pav<=0.8807593703269958\n",
      "--------------\n",
      "   -0.4192 if cv>=-0.5510812044143677\n",
      "   +0.3735 if cp<=-0.028944363817572576\n",
      "   +4.3263 if cv<=-0.34476134181022644\n",
      "   -0.0077 if cp<=-0.08342123925685882 & cv>=-0.36441707611083984\n",
      "   -1.3525 if cp>=-0.026961584389209738 & cv>=-0.16068916022777557\n",
      "Run episode 574 with rewards 24.0\n",
      "============ 575 ===========\n",
      "19 actions [0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1]\n",
      "   +1.2749 if cv>=-0.34476134181022644\n",
      "   +1.1195 if cv<=-0.16249298453330993 & cv>=-0.3620862901210785\n",
      "   +2.9619 if cv>=-0.36897230744361875\n",
      "   -0.1630 if cp<=-0.026961584389209738 & pav<=0.8807593703269958\n",
      "   -3.1812 if cp>=0.006239661946892747 & cv<=-0.17970661222934722\n",
      "--------------\n",
      "   -1.0611 if cv>=-0.5510812044143677\n",
      "   +0.3741 if cp<=-0.028944363817572576\n",
      "   +2.9168 if cv<=-0.34476134181022644\n",
      "   -0.2961 if cp>=-0.026961584389209738 & cv>=-0.16068916022777557\n",
      "   +3.2605 if cp>=0.006239661946892747 & cv<=-0.17970661222934722\n",
      "Run episode 575 with rewards 19.0\n",
      "============ 576 ===========\n",
      "25 actions [0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.2396 if cv>=-0.34476134181022644\n",
      "   +0.1809 if cv<=-0.16249298453330993 & cv>=-0.3620862901210785\n",
      "   +1.9200 if cv>=-0.36897230744361875\n",
      "   +0.0000 if cp>=0.006239661946892747 & cv<=-0.17970661222934722\n",
      "   +3.2279 if cv>=-0.3632604777812958\n",
      "--------------\n",
      "   -3.0977 if cv>=-0.5510812044143677\n",
      "   +1.1478 if cp<=-0.028944363817572576\n",
      "   +2.7018 if cv<=-0.34476134181022644\n",
      "   -0.0000 if cp>=0.006239661946892747 & cv<=-0.17970661222934722\n",
      "   +3.7581 if cp<=-0.055467529594898216 & cv>=-0.4518553853034973\n",
      "Run episode 576 with rewards 25.0\n",
      "============ 577 ===========\n",
      "15 actions [0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0]\n",
      "   +1.0712 if cv>=-0.34476134181022644\n",
      "   +1.0623 if cv<=-0.16249298453330993 & cv>=-0.3620862901210785\n",
      "   +1.0712 if cv>=-0.36897230744361875\n",
      "   +1.0712 if cv>=-0.3632604777812958\n",
      "   +2.6031 if cv>=-0.42012333273887636\n",
      "--------------\n",
      "   -5.8946 if cv>=-0.5510812044143677\n",
      "   +0.8630 if cp<=-0.028944363817572576\n",
      "   +2.2917 if cv<=-0.34476134181022644\n",
      "   +5.3321 if cp<=-0.055467529594898216 & cv>=-0.4518553853034973\n",
      "   +0.6420 if \n",
      "Run episode 577 with rewards 15.0\n",
      "============ 578 ===========\n",
      "27 actions [0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1]\n",
      "   +1.1689 if cv>=-0.34476134181022644\n",
      "   +1.1689 if cv>=-0.36897230744361875\n",
      "   +1.1689 if cv>=-0.3632604777812958\n",
      "   +0.0468 if cv>=-0.42012333273887636\n",
      "   +0.0468 if cv>=-0.4477526426315307\n",
      "--------------\n",
      "   -2.2296 if cv>=-0.5510812044143677\n",
      "   +1.2570 if cp<=-0.028944363817572576\n",
      "   +2.0423 if cv<=-0.34476134181022644\n",
      "   +4.9574 if cp<=-0.055467529594898216 & cv>=-0.4518553853034973\n",
      "   +5.1193 if pav>=0.9306615114212037\n",
      "Run episode 578 with rewards 27.0\n",
      "============ 579 ===========\n",
      "12 actions [0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1]\n",
      "   +1.3780 if cv>=-0.34476134181022644\n",
      "   +1.3780 if cv>=-0.36897230744361875\n",
      "   +1.3780 if cv>=-0.3632604777812958\n",
      "   -1.3296 if cv>=-0.4477526426315307\n",
      "   +1.6555 if cp>=-0.13273919224739075\n",
      "--------------\n",
      "   -0.3519 if cv>=-0.5510812044143677\n",
      "   +0.5081 if cv<=-0.34476134181022644\n",
      "   +2.7875 if cp<=-0.055467529594898216 & cv>=-0.4518553853034973\n",
      "   +2.3281 if pav>=0.9306615114212037\n",
      "   +1.9156 if cp<=-0.08197017759084699 & pa<=0.14847938120365142 & pav>=0.2090885877609253\n",
      "Run episode 579 with rewards 12.0\n",
      "============ 580 ===========\n",
      "12 actions [0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0]\n",
      "   +0.3075 if cv>=-0.34476134181022644\n",
      "   +0.3075 if cv>=-0.36897230744361875\n",
      "   +0.3075 if cv>=-0.3632604777812958\n",
      "   +2.0450 if cp>=-0.13273919224739075\n",
      "   +1.8968 if cv>=-0.5724661588668823\n",
      "--------------\n",
      "   -1.4122 if cv<=-0.34476134181022644\n",
      "   +0.0000 if cp<=-0.055467529594898216 & cv>=-0.4518553853034973\n",
      "   +3.6800 if pav>=0.9306615114212037\n",
      "   -0.5635 if cp<=-0.08197017759084699 & pa<=0.14847938120365142 & pav>=0.2090885877609253\n",
      "   -1.3382 if cv<=-0.766245985031128\n",
      "Run episode 580 with rewards 12.0\n",
      "============ 581 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.5634 if cv>=-0.36897230744361875\n",
      "   +0.5634 if cv>=-0.3632604777812958\n",
      "   +2.7350 if cp>=-0.13273919224739075\n",
      "   +0.7421 if cv>=-0.5724661588668823\n",
      "   -3.1828 if cp>=0.018273039534688017 & cv<=-0.6724956154823301\n",
      "--------------\n",
      "   -0.6853 if cv<=-0.34476134181022644\n",
      "   +1.6069 if pav>=0.9306615114212037\n",
      "   +0.0000 if cp<=-0.08197017759084699 & pa<=0.14847938120365142 & pav>=0.2090885877609253\n",
      "   +1.6069 if cv<=-0.766245985031128\n",
      "   -4.4196 if cp<=0.018273039534688017 & cv<=-0.6724956154823301\n",
      "Run episode 581 with rewards 10.0\n",
      "============ 582 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8008 if cv>=-0.3632604777812958\n",
      "   +2.0555 if cp>=-0.13273919224739075\n",
      "   +1.1535 if cv>=-0.5724661588668823\n",
      "   +0.0000 if cp>=0.018273039534688017 & cv<=-0.6724956154823301\n",
      "  +12.2970 if pa>=0.20933806896209717\n",
      "--------------\n",
      "   -2.6440 if cv<=-0.34476134181022644\n",
      "   -4.5253 if pav>=0.9306615114212037\n",
      "   -4.5253 if cv<=-0.766245985031128\n",
      "   -4.6075 if cp<=0.018273039534688017 & cv<=-0.6724956154823301\n",
      "   +0.3932 if pa>=0.20933806896209717\n",
      "Run episode 582 with rewards 9.0\n",
      "============ 583 ===========\n",
      "19 actions [0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1]\n",
      "   +0.8591 if cv>=-0.3632604777812958\n",
      "   +1.0106 if cp>=-0.13273919224739075\n",
      "   +0.9138 if cv>=-0.5724661588668823\n",
      "   +0.0000 if pa>=0.20933806896209717\n",
      "   +1.0105 if cp>=-0.05476180911064147\n",
      "--------------\n",
      "   +2.3636 if cv<=-0.34476134181022644\n",
      "   +5.1351 if pav>=0.9306615114212037\n",
      "   +5.1351 if cv<=-0.766245985031128\n",
      "   +5.2110 if cp<=0.018273039534688017 & cv<=-0.6724956154823301\n",
      "   -0.2018 if cp>=-0.05476180911064147\n",
      "Run episode 583 with rewards 19.0\n",
      "============ 584 ===========\n",
      "13 actions [0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0]\n",
      "   +0.6052 if cv>=-0.3632604777812958\n",
      "   -0.9103 if cp>=-0.13273919224739075\n",
      "   +3.7368 if cv>=-0.5724661588668823\n",
      "   +1.7944 if cp>=-0.05476180911064147\n",
      "   -4.6129 if cp>=-0.023984786123037338 & cv<=-0.36364597678184507\n",
      "--------------\n",
      "   +4.6002 if cv<=-0.34476134181022644\n",
      "   -0.0405 if pav>=0.9306615114212037\n",
      "   -0.0000 if cv<=-0.766245985031128\n",
      "   +1.0174 if cp<=0.018273039534688017 & cv<=-0.6724956154823301\n",
      "   -3.4734 if cp<=-0.023984786123037338 & cv>=-0.6429487109184265\n",
      "Run episode 584 with rewards 13.0\n",
      "============ 585 ===========\n",
      "16 actions [0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1]\n",
      "   +0.5506 if cp>=-0.13273919224739075\n",
      "   +1.4701 if cv>=-0.5724661588668823\n",
      "   +2.4712 if cp>=-0.05476180911064147\n",
      "   -1.9977 if cp>=-0.023984786123037338 & cv<=-0.36364597678184507\n",
      "   -0.4143 if cp>=-0.07049536406993866\n",
      "--------------\n",
      "   +2.1240 if cv<=-0.34476134181022644\n",
      "   -0.2348 if pav>=0.9306615114212037\n",
      "   +1.2164 if cp<=0.018273039534688017 & cv<=-0.6724956154823301\n",
      "   -1.9962 if cp<=-0.023984786123037338 & cv>=-0.6429487109184265\n",
      "   +0.7029 if cp<=-0.07049536406993866 & cp>=-0.09681049138307571 & cv<=-0.6299632310867309\n",
      "Run episode 585 with rewards 16.0\n",
      "============ 586 ===========\n",
      "19 actions [0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0]\n",
      "   -0.4927 if cp>=-0.13273919224739075\n",
      "   +2.4233 if cv>=-0.5724661588668823\n",
      "   +1.9100 if cp>=-0.05476180911064147\n",
      "   -2.6591 if cp>=-0.023984786123037338 & cv<=-0.36364597678184507\n",
      "   +0.0791 if cp>=-0.023174965754151337\n",
      "--------------\n",
      "   +3.8820 if cv<=-0.34476134181022644\n",
      "   +1.1884 if cp<=0.018273039534688017 & cv<=-0.6724956154823301\n",
      "   -3.0466 if cp<=-0.023984786123037338 & cv>=-0.6429487109184265\n",
      "   +0.0000 if cp<=-0.07049536406993866 & cp>=-0.09681049138307571 & cv<=-0.6299632310867309\n",
      "   -3.5481 if cp<=-0.023174965754151337 & cv>=-0.3878459632396698\n",
      "Run episode 586 with rewards 19.0\n",
      "============ 587 ===========\n",
      "14 actions [0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1]\n",
      "   +1.0368 if cp>=-0.13273919224739075\n",
      "   +2.6247 if cv>=-0.5724661588668823\n",
      "   +1.9279 if cp>=-0.05476180911064147\n",
      "   -1.8756 if cp>=-0.023984786123037338 & cv<=-0.36364597678184507\n",
      "   -2.8137 if cp>=0.0027383690699934985 & cv<=-0.1834866613149643\n",
      "--------------\n",
      "   +3.7662 if cv<=-0.34476134181022644\n",
      "   +0.3768 if cp<=0.018273039534688017 & cv<=-0.6724956154823301\n",
      "   -2.9811 if cp<=-0.023984786123037338 & cv>=-0.6429487109184265\n",
      "   -0.4426 if cp<=-0.023174965754151337 & cv>=-0.3878459632396698\n",
      "   -2.5458 if cp<=0.0027383690699934985 & cv<=-0.37825884819030764 & cv>=-0.381545352935791\n",
      "Run episode 587 with rewards 14.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 588 ===========\n",
      "14 actions [0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1]\n",
      "   -1.3396 if cv>=-0.5724661588668823\n",
      "   +4.9901 if cp>=-0.05476180911064147\n",
      "   -2.5714 if cp>=-0.023984786123037338 & cv<=-0.36364597678184507\n",
      "   -0.0000 if cp>=0.0027383690699934985 & cv<=-0.1834866613149643\n",
      "   +0.3297 if cp>=-0.03651637285947799\n",
      "--------------\n",
      "   +4.7921 if cv<=-0.34476134181022644\n",
      "   -2.3634 if cp<=-0.023984786123037338 & cv>=-0.6429487109184265\n",
      "   -0.0000 if cp<=-0.023174965754151337 & cv>=-0.3878459632396698\n",
      "   -0.0000 if cp<=0.0027383690699934985 & cv<=-0.37825884819030764 & cv>=-0.381545352935791\n",
      "   -2.5274 if cv<=-0.48592911958694446\n",
      "Run episode 588 with rewards 14.0\n",
      "============ 589 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8301 if cv>=-0.5724661588668823\n",
      "   +2.5178 if cp>=-0.05476180911064147\n",
      "   -2.6420 if cp>=-0.023984786123037338 & cv<=-0.36364597678184507\n",
      "   +0.8301 if cp>=-0.03651637285947799\n",
      "   +6.0836 if pa>=0.19724588096141815\n",
      "--------------\n",
      "   +3.2029 if cv<=-0.34476134181022644\n",
      "   -5.8813 if cp<=-0.023984786123037338 & cv>=-0.6429487109184265\n",
      "   -0.0000 if cp<=0.0027383690699934985 & cv<=-0.37825884819030764 & cv>=-0.381545352935791\n",
      "  -11.4848 if cv<=-0.48592911958694446\n",
      "   -5.6547 if cp<=-0.05965327396988868\n",
      "Run episode 589 with rewards 10.0\n",
      "============ 590 ===========\n",
      "25 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +2.5468 if cp>=-0.05476180911064147\n",
      "   +0.0000 if cp>=-0.023984786123037338 & cv<=-0.36364597678184507\n",
      "   +2.5468 if cp>=-0.03651637285947799\n",
      "   +0.0000 if pa>=0.19724588096141815\n",
      "   +0.2185 if cp>=0.00035197040560888167\n",
      "--------------\n",
      "   -0.3304 if cv<=-0.34476134181022644\n",
      "   +2.4467 if cp<=-0.023984786123037338 & cv>=-0.6429487109184265\n",
      "   +1.2274 if cv<=-0.48592911958694446\n",
      "  +15.9855 if cp<=-0.05965327396988868\n",
      "   +1.0000 if pa>=0.17266440391540527\n",
      "Run episode 590 with rewards 25.0\n",
      "============ 591 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.1833 if cp>=-0.05476180911064147\n",
      "   +0.0687 if cp>=-0.023984786123037338 & cv<=-0.36364597678184507\n",
      "   +0.3073 if cp>=-0.03651637285947799\n",
      "   +0.1782 if cp>=0.00035197040560888167\n",
      "   +5.8451 if cp>=-0.047620078921318046\n",
      "--------------\n",
      "   -0.0186 if cp<=-0.023984786123037338 & cv>=-0.6429487109184265\n",
      "   +4.5145 if cv<=-0.48592911958694446\n",
      "   +4.2297 if cp<=-0.05965327396988868\n",
      "   -0.0016 if pa>=0.17266440391540527\n",
      "   +4.4963 if cp<=-0.047620078921318046 & cv>=0.40846053361892753 & pa<=0.07298430651426316\n",
      "Run episode 591 with rewards 9.0\n",
      "============ 592 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -2.7614 if cp>=-0.05476180911064147\n",
      "   +4.2075 if cp>=-0.03651637285947799\n",
      "   +6.7221 if cp>=0.00035197040560888167\n",
      "   -2.7614 if cp>=-0.047620078921318046\n",
      "   -6.9913 if cp<=-0.02539630942046642\n",
      "--------------\n",
      "   -0.0118 if cp<=-0.023984786123037338 & cv>=-0.6429487109184265\n",
      "  -10.4336 if cv<=-0.48592911958694446\n",
      "  -11.4207 if cp<=-0.05965327396988868\n",
      "   -2.8446 if cp<=-0.047620078921318046 & cv>=0.40846053361892753 & pa<=0.07298430651426316\n",
      "   -0.7000 if \n",
      "Run episode 592 with rewards 11.0\n",
      "============ 593 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +1.1206 if cp>=-0.03651637285947799\n",
      "   +1.1205 if cp>=0.00035197040560888167\n",
      "   +1.1206 if cp>=-0.047620078921318046\n",
      "   +0.0001 if cp<=-0.02539630942046642\n",
      "   +0.2687 if cp<=0.0023578389082103968 & cp>=-0.05450810119509697\n",
      "--------------\n",
      "   -1.7811 if cv<=-0.48592911958694446\n",
      "  +19.6301 if cp<=-0.05965327396988868\n",
      "   +1.3998 if cp<=-0.047620078921318046 & cv>=0.40846053361892753 & pa<=0.07298430651426316\n",
      "   -5.5158 if \n",
      "   +1.0000 if cp>=-0.10635128617286682\n",
      "Run episode 593 with rewards 10.0\n",
      "============ 594 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.2632 if cp>=-0.03651637285947799\n",
      "   +0.0000 if cp>=0.00035197040560888167\n",
      "   +0.2772 if cp>=-0.047620078921318046\n",
      "   +0.2899 if cp<=0.0023578389082103968 & cp>=-0.05450810119509697\n",
      "   +0.1795 if cp>=-0.03469414860010147\n",
      "--------------\n",
      "   +2.4133 if cv<=-0.48592911958694446\n",
      "   +0.1670 if cp<=-0.05965327396988868\n",
      "   +0.0000 if cp<=-0.047620078921318046 & cv>=0.40846053361892753 & pa<=0.07298430651426316\n",
      "   -3.3458 if \n",
      "   -5.5790 if cp<=-0.10460600703954696\n",
      "Run episode 594 with rewards 9.0\n",
      "============ 595 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   +0.3077 if cp>=-0.03651637285947799\n",
      "   +5.4928 if cp>=-0.047620078921318046\n",
      "   +5.4928 if cp<=0.0023578389082103968 & cp>=-0.05450810119509697\n",
      "   +0.3077 if cp>=-0.03469414860010147\n",
      "  -13.8000 if cp<=-0.03481278121471404\n",
      "--------------\n",
      "   +4.9243 if cv<=-0.48592911958694446\n",
      "  +11.5296 if cp<=-0.05965327396988868\n",
      "   -1.3654 if \n",
      "   +8.8034 if cp<=-0.10460600703954696\n",
      "   -2.4544 if cp>=-0.08579383045434952\n",
      "Run episode 595 with rewards 10.0\n",
      "============ 596 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +1.5920 if cp>=-0.047620078921318046\n",
      "   +0.4451 if cp<=0.0023578389082103968 & cp>=-0.05450810119509697\n",
      "   +1.9128 if cp>=-0.03469414860010147\n",
      "   -0.3208 if cp<=-0.03481278121471404\n",
      "   +0.0287 if cp>=0.016768505424261095\n",
      "--------------\n",
      "   +0.0070 if cv<=-0.48592911958694446\n",
      "   -0.0000 if cp<=-0.05965327396988868\n",
      "   +0.0000 if cp<=-0.10460600703954696\n",
      "   -0.1024 if cp>=-0.08579383045434952\n",
      "   -0.1330 if cp>=-0.028109125420451162\n",
      "Run episode 596 with rewards 9.0\n",
      "============ 597 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.7453 if cp>=-0.047620078921318046\n",
      "   -0.2052 if cp<=0.0023578389082103968 & cp>=-0.05450810119509697\n",
      "   +1.6341 if cp>=-0.03469414860010147\n",
      "  +11.3893 if cp<=-0.03481278121471404\n",
      "   +5.9949 if pa>=0.16410782933235168\n",
      "--------------\n",
      "   -3.9027 if cv<=-0.48592911958694446\n",
      "  -10.3252 if cp<=-0.05965327396988868\n",
      "   +3.3347 if cp>=-0.08579383045434952\n",
      "   -3.7867 if cp>=-0.028109125420451162\n",
      "   +0.2775 if cp>=-0.04316165372729301\n",
      "Run episode 597 with rewards 9.0\n",
      "============ 598 ===========\n",
      "76 actions [1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.2557 if cp>=-0.047620078921318046\n",
      "   +2.8740 if cp>=-0.03469414860010147\n",
      "   -2.6202 if cp<=-0.03481278121471404\n",
      "   -0.0001 if pa>=0.16410782933235168\n",
      "   -1.1192 if cp<=0.013620760291814806 & cp>=-0.049213089793920514\n",
      "--------------\n",
      "   -0.1550 if cv<=-0.48592911958694446\n",
      "   +0.0000 if cp<=-0.05965327396988868\n",
      "   -0.6474 if cp>=-0.08579383045434952\n",
      "   -0.6474 if cp>=-0.028109125420451162\n",
      "   +0.0000 if pa>=0.18647193908691406\n",
      "Run episode 598 with rewards 76.0\n",
      "============ 599 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +1.2012 if cp>=-0.047620078921318046\n",
      "   +3.5808 if cp>=-0.03469414860010147\n",
      "   -3.2536 if cp<=-0.03481278121471404\n",
      "   -3.4930 if cp<=0.013620760291814806 & cp>=-0.049213089793920514\n",
      "   -5.9067 if cv<=0.7587981224060059 & pa<=-0.04109515622258186 & pa>=-0.04109515622258186\n",
      "--------------\n",
      "   +2.5840 if cv<=-0.48592911958694446\n",
      "   +0.5498 if cp<=-0.05965327396988868\n",
      "   -2.1031 if cp>=-0.08579383045434952\n",
      "   -0.1624 if cp>=-0.028109125420451162\n",
      "   +7.3688 if pa<=-0.04109515622258186 & pa>=-0.04109515622258186\n",
      "Run episode 599 with rewards 12.0\n",
      "============ 600 ===========\n",
      "10 actions [0, 0, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.3351 if cp>=-0.03469414860010147\n",
      "   -0.5429 if cp<=-0.03481278121471404\n",
      "   -0.1075 if cp<=0.013620760291814806 & cp>=-0.049213089793920514\n",
      "   +0.0000 if cv<=0.7587981224060059 & pa<=-0.04109515622258186 & pa>=-0.04109515622258186\n",
      "   +1.5402 if cp<=0.032041883841156964 & cp>=-0.03530169650912284\n",
      "--------------\n",
      "   -7.7952 if cv<=-0.48592911958694446\n",
      "   -9.9355 if cp<=-0.05965327396988868\n",
      "   +1.0336 if cp>=-0.08579383045434952\n",
      "   +0.0111 if pa<=-0.04109515622258186 & pa>=-0.04109515622258186\n",
      "   -3.9999 if cp<=-0.09085370600223541 & cv>=-0.9018606424331664\n",
      "Run episode 600 with rewards 10.0\n",
      "============ 601 ===========\n",
      "45 actions [0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +0.5359 if cp>=-0.03469414860010147\n",
      "   -0.0019 if cp<=-0.03481278121471404\n",
      "   +0.5359 if cp<=0.013620760291814806 & cp>=-0.049213089793920514\n",
      "   +0.5359 if cp<=0.032041883841156964 & cp>=-0.03530169650912284\n",
      "   +2.3290 if cp>=-0.0022452570963650935\n",
      "--------------\n",
      "   +7.8567 if cv<=-0.48592911958694446\n",
      "  +10.3754 if cp<=-0.05965327396988868\n",
      "   +1.4429 if cp>=-0.08579383045434952\n",
      "   +3.7420 if cp<=-0.09085370600223541 & cv>=-0.9018606424331664\n",
      "   +1.7541 if cp<=-0.0022452570963650935 & cp>=-0.013248843140900133\n",
      "Run episode 601 with rewards 45.0\n",
      "============ 602 ===========\n",
      "31 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0]\n",
      "   -1.6618 if cp>=-0.03469414860010147\n",
      "   -1.7915 if cp<=0.013620760291814806 & cp>=-0.049213089793920514\n",
      "   +4.5387 if cp<=0.032041883841156964 & cp>=-0.03530169650912284\n",
      "   +3.8552 if cp>=-0.0022452570963650935\n",
      "   +2.5906 if cp<=-0.010153554938733562 & pa<=0.15080216526985168 & pav<=0.3774047851562505\n",
      "--------------\n",
      "   +1.2021 if cv<=-0.48592911958694446\n",
      "   +3.2010 if cp<=-0.05965327396988868\n",
      "   -0.0000 if cp<=-0.09085370600223541 & cv>=-0.9018606424331664\n",
      "   +4.5421 if cp<=-0.0022452570963650935 & cp>=-0.013248843140900133\n",
      "   +2.4007 if cp<=-0.010153554938733562 & pav>=0.3774047851562505\n",
      "Run episode 602 with rewards 31.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 603 ===========\n",
      "64 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2185 if cp<=0.013620760291814806 & cp>=-0.049213089793920514\n",
      "   +1.9664 if cp<=0.032041883841156964 & cp>=-0.03530169650912284\n",
      "   +4.4917 if cp>=-0.0022452570963650935\n",
      "   +2.7836 if cp<=-0.010153554938733562 & pa<=0.15080216526985168 & pav<=0.3774047851562505\n",
      "   -1.4716 if cv>=-0.5812749862670898 & pa>=0.06490002572536469\n",
      "--------------\n",
      "   +1.0952 if cv<=-0.48592911958694446\n",
      "   +4.1316 if cp<=-0.05965327396988868\n",
      "   +0.0000 if cp<=-0.0022452570963650935 & cp>=-0.013248843140900133\n",
      "   +3.0422 if cp<=-0.010153554938733562 & pav>=0.3774047851562505\n",
      "   -2.3879 if cp>=0.029278839007020024 & pa<=0.06490002572536469\n",
      "Run episode 603 with rewards 64.0\n",
      "============ 604 ===========\n",
      "14 actions [0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1]\n",
      "   +0.6190 if cp<=0.032041883841156964 & cp>=-0.03530169650912284\n",
      "   +4.0205 if cp>=-0.0022452570963650935\n",
      "   +3.1587 if cp<=-0.010153554938733562 & pa<=0.15080216526985168 & pav<=0.3774047851562505\n",
      "   +0.0000 if cv>=-0.5812749862670898 & pa>=0.06490002572536469\n",
      "   +4.3339 if pa>=0.04364911839365959\n",
      "--------------\n",
      "   +3.9302 if cv<=-0.48592911958694446\n",
      "   +3.9488 if cp<=-0.05965327396988868\n",
      "   +4.8743 if cp<=-0.010153554938733562 & pav>=0.3774047851562505\n",
      "   +0.0001 if cp>=0.029278839007020024 & pa<=0.06490002572536469\n",
      "   -4.4897 if pa>=0.04364911839365959\n",
      "Run episode 604 with rewards 14.0\n",
      "============ 605 ===========\n",
      "36 actions [1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0]\n",
      "   +0.0634 if cp<=0.032041883841156964 & cp>=-0.03530169650912284\n",
      "   +2.3431 if cp>=-0.0022452570963650935\n",
      "   -0.0000 if cp<=-0.010153554938733562 & pa<=0.15080216526985168 & pav<=0.3774047851562505\n",
      "   +0.5908 if pa>=0.04364911839365959\n",
      "   -4.0006 if cp<=0.035833798348903656 & cp>=0.014669831842184069 & cv<=-0.26903582811355586 & cv>=-0.3494704008102417\n",
      "--------------\n",
      "   +5.0538 if cv<=-0.48592911958694446\n",
      "   -6.2348 if cp<=-0.05965327396988868\n",
      "   -0.0260 if cp<=-0.010153554938733562 & pav>=0.3774047851562505\n",
      "   -1.6548 if pa>=0.04364911839365959\n",
      "   +5.7727 if cp<=0.035833798348903656 & cp>=0.014669831842184069 & cv<=-0.26903582811355586 & cv>=-0.3494704008102417\n",
      "Run episode 605 with rewards 36.0\n",
      "============ 606 ===========\n",
      "33 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0]\n",
      "   +0.1890 if cp<=0.032041883841156964 & cp>=-0.03530169650912284\n",
      "   +1.7732 if cp>=-0.0022452570963650935\n",
      "   -0.0000 if pa>=0.04364911839365959\n",
      "   -0.0000 if cp<=0.035833798348903656 & cp>=0.014669831842184069 & cv<=-0.26903582811355586 & cv>=-0.3494704008102417\n",
      "   -4.3144 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "--------------\n",
      "   +4.0863 if cv<=-0.48592911958694446\n",
      "   -0.0000 if cp<=-0.05965327396988868\n",
      "   -0.0000 if pa>=0.04364911839365959\n",
      "   -0.0000 if cp<=0.035833798348903656 & cp>=0.014669831842184069 & cv<=-0.26903582811355586 & cv>=-0.3494704008102417\n",
      "   +4.2909 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "Run episode 606 with rewards 33.0\n",
      "============ 607 ===========\n",
      "36 actions [0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   +1.5752 if cp<=0.032041883841156964 & cp>=-0.03530169650912284\n",
      "   +0.0000 if cp>=-0.0022452570963650935\n",
      "   +0.0000 if cp<=0.035833798348903656 & cp>=0.014669831842184069 & cv<=-0.26903582811355586 & cv>=-0.3494704008102417\n",
      "   -1.4964 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   +4.0386 if cv>=-0.02298504672944544 & pa>=-0.05069269686937332\n",
      "--------------\n",
      "   +5.5856 if cv<=-0.48592911958694446\n",
      "   +3.5266 if cp<=-0.05965327396988868\n",
      "   +0.0000 if cp<=0.035833798348903656 & cp>=0.014669831842184069 & cv<=-0.26903582811355586 & cv>=-0.3494704008102417\n",
      "   +4.0188 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   -3.5660 if cv<=0.15306578874588012\n",
      "Run episode 607 with rewards 36.0\n",
      "============ 608 ===========\n",
      "25 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +4.8324 if cp<=0.032041883841156964 & cp>=-0.03530169650912284\n",
      "   -0.0009 if cp>=-0.0022452570963650935\n",
      "   +0.7813 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   +3.4829 if cv>=-0.02298504672944544 & pa>=-0.05069269686937332\n",
      "   -6.3067 if cp<=-0.034411467611789696 & pav>=0.09288948774337769\n",
      "--------------\n",
      "   +0.2885 if cv<=-0.48592911958694446\n",
      "   +3.6128 if cp<=-0.05965327396988868\n",
      "   +2.7559 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   -5.4086 if cv<=0.15306578874588012\n",
      "   +7.5280 if cp<=-0.034411467611789696 & pav>=0.09288948774337769\n",
      "Run episode 608 with rewards 25.0\n",
      "============ 609 ===========\n",
      "25 actions [0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0]\n",
      "   +0.6499 if cp<=0.032041883841156964 & cp>=-0.03530169650912284\n",
      "   +1.8721 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   +2.1542 if cv>=-0.02298504672944544 & pa>=-0.05069269686937332\n",
      "   -2.2772 if cp<=-0.034411467611789696 & pav>=0.09288948774337769\n",
      "   +3.5953 if cv>=0.5439275503158569\n",
      "--------------\n",
      "   +5.2224 if cp<=-0.05965327396988868\n",
      "   +1.4788 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   -0.7664 if cv<=0.15306578874588012\n",
      "   +1.0266 if cp<=-0.034411467611789696 & pav>=0.09288948774337769\n",
      "   -3.8109 if cv>=0.5439275503158569\n",
      "Run episode 609 with rewards 25.0\n",
      "============ 610 ===========\n",
      "26 actions [0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   -1.8358 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   +1.8784 if cv>=-0.02298504672944544 & pa>=-0.05069269686937332\n",
      "   -3.3886 if cp<=-0.034411467611789696 & pav>=0.09288948774337769\n",
      "   -1.7374 if cv>=0.5439275503158569\n",
      "   +3.5629 if cp<=-0.009111440367996685 & pa<=0.187040513753891\n",
      "--------------\n",
      "   +4.0001 if cp<=-0.05965327396988868\n",
      "   +3.9045 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   +3.2028 if cp<=-0.034411467611789696 & pav>=0.09288948774337769\n",
      "   +2.7815 if cv>=0.5439275503158569\n",
      "   -3.3385 if cp<=-0.009111440367996685 & pa<=0.187040513753891\n",
      "Run episode 610 with rewards 26.0\n",
      "============ 611 ===========\n",
      "76 actions [1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0]\n",
      "   -2.1452 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   +0.1054 if cv>=-0.02298504672944544 & pa>=-0.05069269686937332\n",
      "   -0.9811 if cp<=-0.034411467611789696 & pav>=0.09288948774337769\n",
      "   +1.2032 if cp<=-0.009111440367996685 & pa<=0.187040513753891\n",
      "   +4.5849 if cp<=-0.03587022423744202 & cv>=0.2077135443687439 & pa<=0.06390629708766937\n",
      "--------------\n",
      "   +5.1744 if cp<=-0.05965327396988868\n",
      "   +4.5778 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   +2.7286 if cp<=-0.034411467611789696 & pav>=0.09288948774337769\n",
      "   -0.0671 if cp<=-0.009111440367996685 & pa<=0.187040513753891\n",
      "   -3.1483 if cp<=-0.03587022423744202\n",
      "Run episode 611 with rewards 76.0\n",
      "============ 612 ===========\n",
      "54 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1]\n",
      "   -6.2399 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   -0.1929 if cp<=-0.034411467611789696 & pav>=0.09288948774337769\n",
      "   +2.0023 if cp<=-0.009111440367996685 & pa<=0.187040513753891\n",
      "   +1.1538 if cp<=-0.03587022423744202 & cv>=0.2077135443687439 & pa<=0.06390629708766937\n",
      "   -5.4220 if cp<=-0.030882379040122032 & cp>=-0.030882379040122032 & pa<=0.010370077565312386 & pav>=0.5240278244018555\n",
      "--------------\n",
      "   +0.0194 if cp<=-0.05965327396988868\n",
      "   +7.6998 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   +0.1639 if cp<=-0.034411467611789696 & pav>=0.09288948774337769\n",
      "   -0.8499 if cp<=-0.03587022423744202\n",
      "   -3.6692 if cp>=-0.03719917684793472 & cv<=0.025820722803473473 & pav<=0.5240278244018555\n",
      "Run episode 612 with rewards 54.0\n",
      "============ 613 ===========\n",
      "11 actions [0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1]\n",
      "   -3.4815 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   +4.1471 if cp<=-0.009111440367996685 & pa<=0.187040513753891\n",
      "   +1.1675 if cp<=-0.03587022423744202 & cv>=0.2077135443687439 & pa<=0.06390629708766937\n",
      "   -0.0000 if cp<=-0.030882379040122032 & cp>=-0.030882379040122032 & pa<=0.010370077565312386 & pav>=0.5240278244018555\n",
      "   -6.4747 if pa<=0.03343319296836854 & pa>=0.018497720733284952 & pav>=0.644528722763062\n",
      "--------------\n",
      "   +3.5547 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   +0.8139 if cp<=-0.034411467611789696 & pav>=0.09288948774337769\n",
      "   -1.9077 if cp<=-0.03587022423744202\n",
      "   -1.6459 if cp>=-0.03719917684793472 & cv<=0.025820722803473473 & pav<=0.5240278244018555\n",
      "   -3.0808 if cp>=-0.033374309539794915 & pa<=0.018497720733284952\n",
      "Run episode 613 with rewards 11.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 614 ===========\n",
      "12 actions [0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +7.9472 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   +7.9908 if cp<=-0.009111440367996685 & pa<=0.187040513753891\n",
      "   +0.0681 if cp<=-0.03587022423744202 & cv>=0.2077135443687439 & pa<=0.06390629708766937\n",
      "   -2.2324 if pa<=0.03343319296836854 & pa>=0.018497720733284952 & pav>=0.644528722763062\n",
      "   +1.9523 if cp<=0.0007613603374920785 & cp>=0.0007613603374920785\n",
      "--------------\n",
      "   -7.6333 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   -8.0171 if cp<=-0.03587022423744202\n",
      "   -1.8107 if cp>=-0.03719917684793472 & cv<=0.025820722803473473 & pav<=0.5240278244018555\n",
      "   -1.4764 if cp>=-0.033374309539794915 & pa<=0.018497720733284952\n",
      "   -1.9057 if cp>=0.0007613603374920785\n",
      "Run episode 614 with rewards 12.0\n",
      "============ 615 ===========\n",
      "27 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   +1.4547 if cp<=-0.009111440367996685 & pa<=0.187040513753891\n",
      "   +0.8050 if pa<=0.03343319296836854 & pa>=0.018497720733284952 & pav>=0.644528722763062\n",
      "   +0.0000 if cp<=0.0007613603374920785 & cp>=0.0007613603374920785\n",
      "   -2.8845 if cp>=-0.00776861871127037 & cv<=-0.6317243456840512\n",
      "--------------\n",
      "  +13.4198 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "  +13.6557 if cp<=-0.03587022423744202\n",
      "   -1.5681 if cp>=-0.03719917684793472 & cv<=0.025820722803473473 & pav<=0.5240278244018555\n",
      "   -4.9034 if cp>=0.0007613603374920785\n",
      "   +3.5870 if cp<=-0.00776861871127037\n",
      "Run episode 615 with rewards 27.0\n",
      "============ 616 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   -0.0000 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   +1.7892 if cp<=-0.009111440367996685 & pa<=0.187040513753891\n",
      "   -0.0000 if pa<=0.03343319296836854 & pa>=0.018497720733284952 & pav>=0.644528722763062\n",
      "   -1.6318 if cp>=-0.00776861871127037 & cv<=-0.6317243456840512\n",
      "   +2.8388 if cv>=0.9835466742515564\n",
      "--------------\n",
      "   +0.8140 if cp<=-0.03322482854127884 & pav>=-0.18702502548694577\n",
      "   +2.5592 if cp<=-0.03587022423744202\n",
      "   -5.4694 if cp>=0.0007613603374920785\n",
      "   +3.1180 if cp<=-0.00776861871127037\n",
      "   -2.8390 if cv>=0.9835466742515564\n",
      "Run episode 616 with rewards 9.0\n",
      "============ 617 ===========\n",
      "11 actions [0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0]\n",
      "   +0.3960 if cp<=-0.009111440367996685 & pa<=0.187040513753891\n",
      "   -0.0000 if pa<=0.03343319296836854 & pa>=0.018497720733284952 & pav>=0.644528722763062\n",
      "   +0.0142 if cp>=-0.00776861871127037 & cv<=-0.6317243456840512\n",
      "   -0.0000 if cv>=0.9835466742515564\n",
      "   +0.5460 if cp>=-0.026930531114339826\n",
      "--------------\n",
      "   -6.1226 if cp<=-0.03587022423744202\n",
      "   -2.6507 if cp>=0.0007613603374920785\n",
      "   -9.8968 if cp<=-0.00776861871127037\n",
      "   -1.4238 if cv>=0.9835466742515564\n",
      "   +0.2966 if cv<=-0.936708664894104\n",
      "Run episode 617 with rewards 11.0\n",
      "============ 618 ===========\n",
      "32 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0006 if cp<=-0.009111440367996685 & pa<=0.187040513753891\n",
      "   -2.2093 if cp>=-0.00776861871127037 & cv<=-0.6317243456840512\n",
      "   -0.0000 if cv>=0.9835466742515564\n",
      "   +0.3994 if cp>=-0.026930531114339826\n",
      "   +0.3991 if cp>=-0.006431763526052225\n",
      "--------------\n",
      "   +9.1387 if cp<=-0.03587022423744202\n",
      "   -3.7790 if cp>=0.0007613603374920785\n",
      "  +10.0354 if cp<=-0.00776861871127037\n",
      "   +1.1978 if cv>=0.9835466742515564\n",
      "   +1.0000 if pa>=0.204343780875206\n",
      "Run episode 618 with rewards 32.0\n",
      "============ 619 ===========\n",
      "26 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0254 if cp<=-0.009111440367996685 & pa<=0.187040513753891\n",
      "   +0.1920 if cp>=-0.00776861871127037 & cv<=-0.6317243456840512\n",
      "   +1.2276 if cp>=-0.026930531114339826\n",
      "   +1.2533 if cp>=-0.006431763526052225\n",
      "   +0.4148 if cp>=0.04448941871523857 & cv>=-0.7084046483039855\n",
      "--------------\n",
      "   +0.6979 if cp<=-0.03587022423744202\n",
      "   -4.3380 if cp>=0.0007613603374920785\n",
      "   +4.7445 if cp<=-0.00776861871127037\n",
      "   -0.6019 if cv>=0.9835466742515564\n",
      "   -1.4752 if cp>=-0.010048963874578471 & cv<=-0.7084046483039855\n",
      "Run episode 619 with rewards 26.0\n",
      "============ 620 ===========\n",
      "28 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0020 if cp>=-0.00776861871127037 & cv<=-0.6317243456840512\n",
      "   +1.0115 if cp>=-0.026930531114339826\n",
      "   +2.2778 if cp>=-0.006431763526052225\n",
      "   +0.0424 if cp>=0.04448941871523857 & cv>=-0.7084046483039855\n",
      "   -0.7720 if cp<=0.026039887219667466 & pa<=0.09933845698833468 & pa>=0.07330677658319473\n",
      "--------------\n",
      "   +0.9936 if cp<=-0.03587022423744202\n",
      "   -2.3259 if cp>=0.0007613603374920785\n",
      "   +4.5745 if cp<=-0.00776861871127037\n",
      "   +0.1339 if cp>=-0.010048963874578471 & cv<=-0.7084046483039855\n",
      "   +0.0106 if cp<=-0.006269068922847509\n",
      "Run episode 620 with rewards 28.0\n",
      "============ 621 ===========\n",
      "33 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   +0.8397 if cp>=-0.026930531114339826\n",
      "   +2.5960 if cp>=-0.006431763526052225\n",
      "   +0.1962 if cp>=0.04448941871523857 & cv>=-0.7084046483039855\n",
      "   -0.7542 if cp<=0.026039887219667466 & pa<=0.09933845698833468 & pa>=0.07330677658319473\n",
      "   +0.6075 if cp>=0.0008335401071235553\n",
      "--------------\n",
      "   +1.0966 if cp<=-0.03587022423744202\n",
      "   -1.9570 if cp>=0.0007613603374920785\n",
      "   +4.3826 if cp<=-0.00776861871127037\n",
      "   +0.1539 if cp>=-0.010048963874578471 & cv<=-0.7084046483039855\n",
      "   +0.0316 if cp<=0.0008335401071235553 & cv>=-0.5956482529640198\n",
      "Run episode 621 with rewards 33.0\n",
      "============ 622 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   +1.0326 if cp>=-0.026930531114339826\n",
      "   +2.6306 if cp>=-0.006431763526052225\n",
      "   +0.0000 if cp<=0.026039887219667466 & pa<=0.09933845698833468 & pa>=0.07330677658319473\n",
      "   +0.8985 if cp>=0.0008335401071235553\n",
      "   -1.0987 if cp<=-0.013207717612385723 & cv>=0.43865622878074645 & pa<=0.022167965024709715 & pav>=-1.2190670013427733\n",
      "--------------\n",
      "   +1.3207 if cp<=-0.03587022423744202\n",
      "   -1.7656 if cp>=0.0007613603374920785\n",
      "   +4.3806 if cp<=-0.00776861871127037\n",
      "   -0.3293 if cp>=-0.010048963874578471 & cv<=-0.7084046483039855\n",
      "   +0.1628 if \n",
      "Run episode 622 with rewards 10.0\n",
      "============ 623 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8242 if cp>=-0.026930531114339826\n",
      "   +0.8034 if cp>=-0.006431763526052225\n",
      "   +0.8034 if cp>=0.0008335401071235553\n",
      "   +0.0000 if cp<=-0.013207717612385723 & cv>=0.43865622878074645 & pa<=0.022167965024709715 & pav>=-1.2190670013427733\n",
      "   +0.6577 if cp>=0.02538983076810837\n",
      "--------------\n",
      "   -8.0273 if cp<=-0.03587022423744202\n",
      "   -4.4539 if cp>=0.0007613603374920785\n",
      "  -16.2074 if cp<=-0.00776861871127037\n",
      "   -0.7785 if cp>=-0.010048963874578471 & cv<=-0.7084046483039855\n",
      "   +0.6977 if pa>=0.20430512726306915\n",
      "Run episode 623 with rewards 10.0\n",
      "============ 624 ===========\n",
      "36 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   +0.2824 if cp>=-0.026930531114339826\n",
      "   +0.2824 if cp>=-0.006431763526052225\n",
      "   +0.2824 if cp>=0.0008335401071235553\n",
      "   +0.2554 if cp>=0.02538983076810837\n",
      "   +0.1431 if cp>=0.03705778121948242\n",
      "--------------\n",
      "  +10.8426 if cp<=-0.03587022423744202\n",
      "   -0.3615 if cp>=0.0007613603374920785\n",
      "  +18.0553 if cp<=-0.00776861871127037\n",
      "   -0.4130 if cp>=-0.010048963874578471 & cv<=-0.7084046483039855\n",
      "   +1.0000 if pa>=0.20098604261875153\n",
      "Run episode 624 with rewards 36.0\n",
      "============ 625 ===========\n",
      "39 actions [1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +1.8847 if cp>=-0.026930531114339826\n",
      "   +1.8847 if cp>=-0.006431763526052225\n",
      "   +1.4673 if cp>=0.0008335401071235553\n",
      "   +0.7942 if cp>=0.02538983076810837\n",
      "   -0.2911 if cv>=1.7185720205307007\n",
      "--------------\n",
      "   +0.9702 if cp<=-0.03587022423744202\n",
      "   +4.9037 if cp<=-0.00776861871127037\n",
      "   -3.0622 if cp>=-0.010048963874578471 & cv<=-0.7084046483039855\n",
      "   -0.0000 if pa>=0.20098604261875153\n",
      "   -3.7733 if cp>=-0.003743463428691022 & cv<=0.938897430896759 & cv>=-0.6107020974159241\n",
      "Run episode 625 with rewards 39.0\n",
      "============ 626 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   +4.1523 if cp>=-0.026930531114339826\n",
      "   +2.2208 if cp>=-0.006431763526052225\n",
      "   +0.4611 if cp>=0.0008335401071235553\n",
      "   +0.0363 if cp>=0.02538983076810837\n",
      "   -2.1955 if cp>=-0.013318288326263427\n",
      "--------------\n",
      "   +3.4530 if cp<=-0.03587022423744202\n",
      "   +1.3390 if cp<=-0.00776861871127037\n",
      "   -1.5415 if cp>=-0.010048963874578471 & cv<=-0.7084046483039855\n",
      "   -3.6431 if cp>=-0.003743463428691022 & cv<=0.938897430896759 & cv>=-0.6107020974159241\n",
      "   +3.9046 if cp>=-0.036233464628458015 & pav>=-0.5417560815811158\n",
      "Run episode 626 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 627 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.5219 if cp>=-0.026930531114339826\n",
      "   +1.1707 if cp>=-0.006431763526052225\n",
      "   +0.6724 if cp>=0.0008335401071235553\n",
      "   +1.1707 if cp>=-0.013318288326263427\n",
      "   +0.6617 if cp<=0.01535042803734541 & cp>=-0.015208255313336846\n",
      "--------------\n",
      "  -15.4411 if cp<=-0.03587022423744202\n",
      "   -2.4513 if cp>=-0.010048963874578471 & cv<=-0.7084046483039855\n",
      "   -1.2087 if cp>=-0.003743463428691022 & cv<=0.938897430896759 & cv>=-0.6107020974159241\n",
      "   -1.6591 if cp>=-0.036233464628458015 & pav>=-0.5417560815811158\n",
      "   +0.1160 if cv>=-0.9367234826087951\n",
      "Run episode 627 with rewards 9.0\n",
      "============ 628 ===========\n",
      "24 actions [1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +1.1587 if cp>=-0.026930531114339826\n",
      "   +0.3878 if cp>=-0.006431763526052225\n",
      "   +0.0000 if cp>=0.0008335401071235553\n",
      "   +0.5983 if cp>=-0.013318288326263427\n",
      "   +0.8550 if cp>=-0.017564947903156273\n",
      "--------------\n",
      "  +16.0540 if cp<=-0.03587022423744202\n",
      "   +2.3085 if cp>=-0.010048963874578471 & cv<=-0.7084046483039855\n",
      "   +1.1383 if cp>=-0.003743463428691022 & cv<=0.938897430896759 & cv>=-0.6107020974159241\n",
      "   +0.8852 if cp>=-0.036233464628458015 & pav>=-0.5417560815811158\n",
      "   +1.0000 if cp<=-0.06984694600105286\n",
      "Run episode 628 with rewards 24.0\n",
      "============ 629 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0]\n",
      "   +2.3860 if cp>=-0.026930531114339826\n",
      "   +2.3716 if cp>=-0.006431763526052225\n",
      "   +3.2695 if cp>=-0.013318288326263427\n",
      "   -1.7898 if cp>=-0.017564947903156273\n",
      "   +2.8352 if cv>=0.4276161670684815 & pa>=-0.07842590808868406\n",
      "--------------\n",
      "   +5.4544 if cp<=-0.03587022423744202\n",
      "   +0.0000 if cp>=-0.010048963874578471 & cv<=-0.7084046483039855\n",
      "   -1.5684 if cp>=-0.003743463428691022 & cv<=0.938897430896759 & cv>=-0.6107020974159241\n",
      "   +0.5698 if cp<=-0.06984694600105286\n",
      "   -1.7997 if cp<=-0.03214076533913612\n",
      "Run episode 629 with rewards 11.0\n",
      "============ 630 ===========\n",
      "40 actions [0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +1.5726 if cp>=-0.026930531114339826\n",
      "   +0.7958 if cp>=-0.006431763526052225\n",
      "   +1.1892 if cp>=-0.013318288326263427\n",
      "   +0.0000 if cv>=0.4276161670684815 & pa>=-0.07842590808868406\n",
      "   -8.3202 if pa>=0.19240222871303558\n",
      "--------------\n",
      "   +6.7806 if cp<=-0.03587022423744202\n",
      "   +0.4808 if cp>=-0.003743463428691022 & cv<=0.938897430896759 & cv>=-0.6107020974159241\n",
      "   +4.1644 if cp<=-0.06984694600105286\n",
      "   +4.8226 if cp<=-0.03214076533913612\n",
      "   +1.0000 if pa>=0.19240222871303558\n",
      "Run episode 630 with rewards 40.0\n",
      "============ 631 ===========\n",
      "30 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.3889 if cp>=-0.026930531114339826\n",
      "   +2.2495 if cp>=-0.006431763526052225\n",
      "   +2.2495 if cp>=-0.013318288326263427\n",
      "   -0.0000 if pa>=0.19240222871303558\n",
      "   +3.2919 if cp<=-0.026950085535645478 & cp>=-0.05606635883450508 & cv<=-0.18724162876605988 & pa<=-0.02351783290505409 & pa>=-0.048780073970556254\n",
      "--------------\n",
      "   +2.5381 if cp<=-0.03587022423744202\n",
      "   +0.3527 if cp<=-0.06984694600105286\n",
      "   +5.4741 if cp<=-0.03214076533913612\n",
      "   +0.0000 if pa>=0.19240222871303558\n",
      "   -2.3708 if cp<=-0.026950085535645478\n",
      "Run episode 631 with rewards 30.0\n",
      "============ 632 ===========\n",
      "49 actions [1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +3.5554 if cp>=-0.026930531114339826\n",
      "   +0.4169 if cp>=-0.006431763526052225\n",
      "   +1.6490 if cp>=-0.013318288326263427\n",
      "   +0.0000 if cp<=-0.026950085535645478 & cp>=-0.05606635883450508 & cv<=-0.18724162876605988 & pa<=-0.02351783290505409 & pa>=-0.048780073970556254\n",
      "   +1.4245 if cp<=-0.0049789028242230296 & cp>=-0.037420854717493034 & cv<=-0.6027088642120361\n",
      "--------------\n",
      "   +3.3385 if cp<=-0.03587022423744202\n",
      "   +0.8776 if cp<=-0.06984694600105286\n",
      "   +3.3385 if cp<=-0.03214076533913612\n",
      "   -2.6534 if cp<=-0.026950085535645478\n",
      "   +1.2199 if cp<=-0.0049789028242230296 & pa>=0.12957899868488312\n",
      "Run episode 632 with rewards 49.0\n",
      "============ 633 ===========\n",
      "43 actions [0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +5.6283 if cp>=-0.026930531114339826\n",
      "   -3.0815 if cp>=-0.006431763526052225\n",
      "   -0.3382 if cp>=-0.013318288326263427\n",
      "   +1.2417 if cp<=-0.0049789028242230296 & cp>=-0.037420854717493034 & cv<=-0.6027088642120361\n",
      "   -1.6292 if cp>=-0.040861565619707094 & pa<=0.018070582859218143 & pa>=-0.0317732412368059\n",
      "--------------\n",
      "   +2.1131 if cp<=-0.03587022423744202\n",
      "   +3.8016 if cp<=-0.03214076533913612\n",
      "   +0.4042 if cp<=-0.026950085535645478\n",
      "   -0.0146 if cp<=-0.0049789028242230296 & pa>=0.12957899868488312\n",
      "   +4.9100 if cp<=0.03184648863971242 & cp>=-0.00874204467982051 & cv<=-0.01927787512540817 & cv>=-0.4080519378185272\n",
      "Run episode 633 with rewards 43.0\n",
      "============ 634 ===========\n",
      "42 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   +1.1050 if cp>=-0.026930531114339826\n",
      "   +1.1050 if cp>=-0.006431763526052225\n",
      "   +0.0000 if cp<=-0.0049789028242230296 & cp>=-0.037420854717493034 & cv<=-0.6027088642120361\n",
      "   +0.4928 if cp>=-0.040861565619707094 & pa<=0.018070582859218143 & pa>=-0.0317732412368059\n",
      "   -5.5277 if pa>=-0.0286546777933836\n",
      "--------------\n",
      "   +0.0000 if cp<=-0.03587022423744202\n",
      "   +0.0000 if cp<=-0.03214076533913612\n",
      "   +0.0000 if cp<=-0.026950085535645478\n",
      "   +7.1448 if cp<=0.03184648863971242 & cp>=-0.00874204467982051 & cv<=-0.01927787512540817 & cv>=-0.4080519378185272\n",
      "   +3.7980 if pa>=-0.0286546777933836\n",
      "Run episode 634 with rewards 42.0\n",
      "============ 635 ===========\n",
      "36 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   +5.7523 if cp>=-0.026930531114339826\n",
      "   +5.5896 if cp>=-0.006431763526052225\n",
      "   -6.0493 if cp>=-0.040861565619707094 & pa<=0.018070582859218143 & pa>=-0.0317732412368059\n",
      "   -6.4334 if pa>=-0.0286546777933836\n",
      "   +4.2186 if cp>=0.01989547163248062 & cv>=0.9898729920387268 & pa>=-0.11732776761054992\n",
      "--------------\n",
      "   +0.2728 if cp<=-0.03587022423744202\n",
      "   +0.2728 if cp<=-0.03214076533913612\n",
      "   -0.0000 if cp<=0.03184648863971242 & cp>=-0.00874204467982051 & cv<=-0.01927787512540817 & cv>=-0.4080519378185272\n",
      "   +6.9213 if pa>=-0.0286546777933836\n",
      "   -5.4166 if \n",
      "Run episode 635 with rewards 36.0\n",
      "============ 636 ===========\n",
      "14 actions [1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1]\n",
      "   -1.2011 if cp>=-0.026930531114339826\n",
      "   +3.6144 if cp>=-0.006431763526052225\n",
      "   -1.4648 if cp>=-0.040861565619707094 & pa<=0.018070582859218143 & pa>=-0.0317732412368059\n",
      "   -3.3624 if pa>=-0.0286546777933836\n",
      "   +5.3361 if cp<=0.021000906825065634 & cp>=-0.027449455112218857 & cv<=-0.6120274066925049\n",
      "--------------\n",
      "   +0.0411 if cp<=-0.03587022423744202\n",
      "   +0.0411 if cp<=-0.03214076533913612\n",
      "   +1.3822 if pa>=-0.0286546777933836\n",
      "   +1.3520 if \n",
      "   -5.7532 if cp<=0.021000906825065634 & cp>=-0.027449455112218857 & cv<=-0.6120274066925049\n",
      "Run episode 636 with rewards 14.0\n",
      "============ 637 ===========\n",
      "63 actions [0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1]\n",
      "   +2.5296 if cp>=-0.006431763526052225\n",
      "   -0.9251 if cp>=-0.040861565619707094 & pa<=0.018070582859218143 & pa>=-0.0317732412368059\n",
      "   -3.1473 if pa>=-0.0286546777933836\n",
      "   -0.0000 if cp<=0.021000906825065634 & cp>=-0.027449455112218857 & cv<=-0.6120274066925049\n",
      "   +8.0301 if cp>=0.1480809897184372\n",
      "--------------\n",
      "   -0.0000 if cp<=-0.03214076533913612\n",
      "   +2.1347 if pa>=-0.0286546777933836\n",
      "   +0.5076 if \n",
      "   -0.0000 if cp<=0.021000906825065634 & cp>=-0.027449455112218857 & cv<=-0.6120274066925049\n",
      "   -8.0404 if cp>=0.1480809897184372\n",
      "Run episode 637 with rewards 63.0\n",
      "============ 638 ===========\n",
      "41 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +6.4830 if cp>=-0.006431763526052225\n",
      "   -3.6897 if cp>=-0.040861565619707094 & pa<=0.018070582859218143 & pa>=-0.0317732412368059\n",
      "   -4.4484 if pa>=-0.0286546777933836\n",
      "   +0.0001 if cp>=0.1480809897184372\n",
      "   -4.6383 if cp>=-0.04533849507570266 & pa<=-0.026608033478260032 & pav>=-0.32130151391029355\n",
      "--------------\n",
      "   +2.2752 if pa>=-0.0286546777933836\n",
      "   +1.5513 if \n",
      "   -1.2342 if cp<=0.021000906825065634 & cp>=-0.027449455112218857 & cv<=-0.6120274066925049\n",
      "   +0.0000 if cp>=0.1480809897184372\n",
      "   -3.2770 if cv>=-0.32584766745567323 & pa<=-0.026608033478260032 & pav<=-0.32130151391029355\n",
      "Run episode 638 with rewards 41.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 639 ===========\n",
      "37 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0]\n",
      "   +4.0298 if cp>=-0.006431763526052225\n",
      "   -1.6931 if cp>=-0.040861565619707094 & pa<=0.018070582859218143 & pa>=-0.0317732412368059\n",
      "   -2.4417 if pa>=-0.0286546777933836\n",
      "   -1.8516 if cp>=-0.04533849507570266 & pa<=-0.026608033478260032 & pav>=-0.32130151391029355\n",
      "   -3.3975 if pav>=0.7017183303833008\n",
      "--------------\n",
      "   +1.5686 if pa>=-0.0286546777933836\n",
      "   +1.0216 if \n",
      "   +3.2908 if cp<=0.021000906825065634 & cp>=-0.027449455112218857 & cv<=-0.6120274066925049\n",
      "   -3.8706 if cv>=-0.32584766745567323 & pa<=-0.026608033478260032 & pav<=-0.32130151391029355\n",
      "   +3.5477 if pav>=0.7017183303833008\n",
      "Run episode 639 with rewards 37.0\n",
      "============ 640 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +0.0000 if cp>=-0.006431763526052225\n",
      "   +0.0000 if pa>=-0.0286546777933836\n",
      "   -0.8857 if cp>=-0.04533849507570266 & pa<=-0.026608033478260032 & pav>=-0.32130151391029355\n",
      "   +0.0000 if pav>=0.7017183303833008\n",
      "   +4.4903 if cp>=-0.03340458124876022\n",
      "--------------\n",
      "   +0.0000 if pa>=-0.0286546777933836\n",
      "   +0.0000 if cp<=0.021000906825065634 & cp>=-0.027449455112218857 & cv<=-0.6120274066925049\n",
      "   -4.9415 if cv>=-0.32584766745567323 & pa<=-0.026608033478260032 & pav<=-0.32130151391029355\n",
      "   +0.0000 if pav>=0.7017183303833008\n",
      "   -4.4455 if cp>=-0.03340458124876022\n",
      "Run episode 640 with rewards 10.0\n",
      "============ 641 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.3014 if cp>=-0.006431763526052225\n",
      "   -0.8552 if cp>=-0.04533849507570266 & pa<=-0.026608033478260032 & pav>=-0.32130151391029355\n",
      "  +17.0444 if pav>=0.7017183303833008\n",
      "   -2.0335 if cp>=-0.03340458124876022\n",
      "   +1.0000 if cp<=-0.07043810039758683\n",
      "--------------\n",
      "   -0.4796 if cp<=0.021000906825065634 & cp>=-0.027449455112218857 & cv<=-0.6120274066925049\n",
      "   +1.1495 if cv>=-0.32584766745567323 & pa<=-0.026608033478260032 & pav<=-0.32130151391029355\n",
      "  -15.5688 if pav>=0.7017183303833008\n",
      "   -2.6947 if cp>=-0.03340458124876022\n",
      "   -2.5962 if cp<=-0.07043810039758683\n",
      "Run episode 641 with rewards 10.0\n",
      "============ 642 ===========\n",
      "18 actions [0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1]\n",
      "   +0.0000 if cp>=-0.006431763526052225\n",
      "   +0.0000 if pav>=0.7017183303833008\n",
      "   +0.7915 if cp>=-0.03340458124876022\n",
      "   -0.0000 if cp<=-0.07043810039758683\n",
      "   +0.7915 if \n",
      "--------------\n",
      "   +0.4732 if cv>=-0.32584766745567323 & pa<=-0.026608033478260032 & pav<=-0.32130151391029355\n",
      "  +19.0553 if pav>=0.7017183303833008\n",
      "  -12.1190 if cp>=-0.03340458124876022\n",
      "  +14.8659 if cp<=-0.07043810039758683\n",
      "   +1.0000 if cp<=-0.033793761581182476 & cp>=-0.09986886829137802\n",
      "Run episode 642 with rewards 18.0\n",
      "============ 643 ===========\n",
      "39 actions [0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1]\n",
      "   -0.0183 if pav>=0.7017183303833008\n",
      "   -0.0130 if cp>=-0.03340458124876022\n",
      "   -0.0000 if cp<=-0.07043810039758683\n",
      "   -1.6229 if \n",
      "   +3.0871 if cv>=0.41205036640167236\n",
      "--------------\n",
      "   +5.9262 if pav>=0.7017183303833008\n",
      "   -1.5969 if cp>=-0.03340458124876022\n",
      "   +0.0000 if cp<=-0.07043810039758683\n",
      "   +3.6754 if cp<=-0.033793761581182476 & cp>=-0.09986886829137802\n",
      "   -1.5039 if cv>=0.41205036640167236\n",
      "Run episode 643 with rewards 39.0\n",
      "============ 644 ===========\n",
      "17 actions [1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0]\n",
      "   -0.0000 if pav>=0.7017183303833008\n",
      "   -1.2559 if cp>=-0.03340458124876022\n",
      "   -1.2559 if \n",
      "   +3.4780 if cv>=0.41205036640167236\n",
      "   +1.9673 if cv>=0.15242976546287537 & pav>=-0.4133064389228821\n",
      "--------------\n",
      "   -0.0000 if pav>=0.7017183303833008\n",
      "   -1.7313 if cp>=-0.03340458124876022\n",
      "   -0.0000 if cp<=-0.033793761581182476 & cp>=-0.09986886829137802\n",
      "   -1.6433 if cv>=0.41205036640167236\n",
      "   +4.5958 if cp<=0.026310219988226892 & cv<=0.15242976546287537\n",
      "Run episode 644 with rewards 17.0\n",
      "============ 645 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.3570 if cp>=-0.03340458124876022\n",
      "   -2.8002 if \n",
      "   +4.0563 if cv>=0.41205036640167236\n",
      "   +2.3408 if cv>=0.15242976546287537 & pav>=-0.4133064389228821\n",
      "   +4.7031 if cv<=0.16569899916648864 & cv>=0.009062296152114901\n",
      "--------------\n",
      "   +0.0000 if pav>=0.7017183303833008\n",
      "   +2.4168 if cp>=-0.03340458124876022\n",
      "   -3.0690 if cv>=0.41205036640167236\n",
      "   +0.5573 if cp<=0.026310219988226892 & cv<=0.15242976546287537\n",
      "   -5.3270 if cv<=0.16569899916648864 & cv>=0.009062296152114901\n",
      "Run episode 645 with rewards 10.0\n",
      "============ 646 ===========\n",
      "11 actions [1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   +0.0606 if cp>=-0.03340458124876022\n",
      "   -0.2300 if \n",
      "  +16.5583 if cv>=0.41205036640167236\n",
      "   +2.4540 if cv<=0.16569899916648864 & cv>=0.009062296152114901\n",
      "   +1.0000 if cp<=0.023607008159160614\n",
      "--------------\n",
      "   -1.9860 if cp>=-0.03340458124876022\n",
      "  -16.1862 if cv>=0.41205036640167236\n",
      "   +4.6673 if cp<=0.026310219988226892 & cv<=0.15242976546287537\n",
      "   -4.1836 if cv<=0.16569899916648864 & cv>=0.009062296152114901\n",
      "   -0.1242 if cp>=0.06588528156280518\n",
      "Run episode 646 with rewards 11.0\n",
      "============ 647 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -2.2405 if \n",
      "   +0.0024 if cv>=0.41205036640167236\n",
      "   +0.0452 if cv<=0.16569899916648864 & cv>=0.009062296152114901\n",
      "  +15.9887 if cp<=0.023607008159160614\n",
      "   +5.2368 if cv<=-0.050286516547203064\n",
      "--------------\n",
      "   +0.4504 if cp>=-0.03340458124876022\n",
      "   -1.9248 if cv>=0.41205036640167236\n",
      "  -13.9655 if cp<=0.026310219988226892 & cv<=0.15242976546287537\n",
      "   -1.6219 if cv<=0.16569899916648864 & cv>=0.009062296152114901\n",
      "   -3.8804 if cp>=-0.02330021746456623 & cv<=-0.050286516547203064\n",
      "Run episode 647 with rewards 9.0\n",
      "============ 648 ===========\n",
      "16 actions [0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cv<=0.16569899916648864 & cv>=0.009062296152114901\n",
      "   +0.0000 if cp<=0.023607008159160614\n",
      "   -0.0000 if cv<=-0.050286516547203064\n",
      "   +0.0000 if cp<=0.005103253852576026\n",
      "--------------\n",
      "   +0.0000 if cv>=0.41205036640167236\n",
      "   -0.0000 if cp<=0.026310219988226892 & cv<=0.15242976546287537\n",
      "   +0.0000 if cv<=0.16569899916648864 & cv>=0.009062296152114901\n",
      "   -0.0000 if cp>=-0.02330021746456623 & cv<=-0.050286516547203064\n",
      "   -0.0000 if cp>=0.01930469647049904\n",
      "Run episode 648 with rewards 16.0\n",
      "============ 649 ===========\n",
      "17 actions [0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0]\n",
      "   +1.4123 if \n",
      "   +1.4123 if cp<=0.023607008159160614\n",
      "   -2.8230 if cv<=-0.050286516547203064\n",
      "   +2.1546 if cp<=0.005103253852576026\n",
      "   -2.5726 if cv<=-0.1671016663312912\n",
      "--------------\n",
      "   +0.0000 if cv>=0.41205036640167236\n",
      "   -2.0079 if cp<=0.026310219988226892 & cv<=0.15242976546287537\n",
      "   +1.7797 if cp>=-0.02330021746456623 & cv<=-0.050286516547203064\n",
      "   +0.0000 if cp>=0.01930469647049904\n",
      "   +2.7573 if cp>=0.011668125167489052\n",
      "Run episode 649 with rewards 17.0\n",
      "============ 650 ===========\n",
      "29 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.8731 if cp<=0.023607008159160614\n",
      "   -1.5441 if cv<=-0.050286516547203064\n",
      "   +3.4385 if cp<=0.005103253852576026\n",
      "   -1.5441 if cv<=-0.1671016663312912\n",
      "   -3.2343 if cp<=0.0038610774092376265 & cv<=-0.06026184186339365\n",
      "--------------\n",
      "   +0.2343 if cp<=0.026310219988226892 & cv<=0.15242976546287537\n",
      "   +0.8817 if cp>=-0.02330021746456623 & cv<=-0.050286516547203064\n",
      "   +0.0000 if cp>=0.01930469647049904\n",
      "   +0.0000 if cp>=0.011668125167489052\n",
      "   -2.3395 if cp>=0.0038610774092376265 & cv<=-0.06026184186339365\n",
      "Run episode 650 with rewards 29.0\n",
      "============ 651 ===========\n",
      "17 actions [0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1]\n",
      "   -2.7055 if cv<=-0.050286516547203064\n",
      "   +4.4037 if cp<=0.005103253852576026\n",
      "   -2.7055 if cv<=-0.1671016663312912\n",
      "   -2.7055 if cp<=0.0038610774092376265 & cv<=-0.06026184186339365\n",
      "   +3.1620 if cp>=-0.10225586146116257 & cv<=-0.1778705447912216\n",
      "--------------\n",
      "   -1.4874 if cp<=0.026310219988226892 & cv<=0.15242976546287537\n",
      "   -0.0000 if cp>=-0.02330021746456623 & cv<=-0.050286516547203064\n",
      "   -0.0000 if cp>=0.011668125167489052\n",
      "   -0.0000 if cp>=0.0038610774092376265 & cv<=-0.06026184186339365\n",
      "   +3.9605 if cp>=-0.0515497252345085 & cv<=-0.041531393490731004\n",
      "Run episode 651 with rewards 17.0\n",
      "============ 652 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -1.4877 if cv<=-0.050286516547203064\n",
      "   +3.6418 if cp<=0.005103253852576026\n",
      "   -1.4877 if cp<=0.0038610774092376265 & cv<=-0.06026184186339365\n",
      "   +1.3864 if cp>=-0.10225586146116257 & cv<=-0.1778705447912216\n",
      "   -1.8967 if cv>=-0.17740730941295624\n",
      "--------------\n",
      "   -3.7332 if cp<=0.026310219988226892 & cv<=0.15242976546287537\n",
      "   -0.0000 if cp>=-0.02330021746456623 & cv<=-0.050286516547203064\n",
      "   -0.0000 if cp>=0.0038610774092376265 & cv<=-0.06026184186339365\n",
      "   +3.1355 if cp>=-0.0515497252345085 & cv<=-0.041531393490731004\n",
      "   -9.3414 if pa>=0.18627186119556427\n",
      "Run episode 652 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 653 ===========\n",
      "38 actions [1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1]\n",
      "   +0.8670 if cv<=-0.050286516547203064\n",
      "   +1.0102 if cp<=0.005103253852576026\n",
      "   +0.8670 if cp<=0.0038610774092376265 & cv<=-0.06026184186339365\n",
      "   +0.1433 if cv>=-0.17740730941295624\n",
      "   +0.3117 if cp<=-0.04298636168241501\n",
      "--------------\n",
      "   +9.0085 if cp<=0.026310219988226892 & cv<=0.15242976546287537\n",
      "   +0.0000 if cp>=0.0038610774092376265 & cv<=-0.06026184186339365\n",
      "   -2.6589 if cp>=-0.0515497252345085 & cv<=-0.041531393490731004\n",
      "  +13.5254 if pa>=0.18627186119556427\n",
      "   -8.4418 if cp>=-0.07897479236125945\n",
      "Run episode 653 with rewards 38.0\n",
      "============ 654 ===========\n",
      "20 actions [1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1]\n",
      "   +0.7445 if cv<=-0.050286516547203064\n",
      "   +0.3085 if cp<=0.005103253852576026\n",
      "   +0.7445 if cp<=0.0038610774092376265 & cv<=-0.06026184186339365\n",
      "   +1.2887 if cp<=-0.04298636168241501\n",
      "   -2.4186 if cv<=-0.39824419021606444\n",
      "--------------\n",
      "   +6.1599 if cp<=0.026310219988226892 & cv<=0.15242976546287537\n",
      "   -3.8814 if cp>=-0.0515497252345085 & cv<=-0.041531393490731004\n",
      "   +6.7611 if pa>=0.18627186119556427\n",
      "   -4.0797 if cp>=-0.07897479236125945\n",
      "   +3.7844 if pav>=1.7159202098846436\n",
      "Run episode 654 with rewards 20.0\n",
      "============ 655 ===========\n",
      "14 actions [1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0]\n",
      "   +0.7695 if cv<=-0.050286516547203064\n",
      "   -1.0048 if cp<=0.0038610774092376265 & cv<=-0.06026184186339365\n",
      "   +0.0080 if cp<=-0.04298636168241501\n",
      "   +0.7645 if cv<=-0.39824419021606444\n",
      "   -3.7523 if cp>=-0.020270028151571744 & cv<=-0.039606671780347824 & cv<=-0.623085904121399 & pa>=-0.011095964722335335\n",
      "--------------\n",
      "   +0.3032 if cp<=0.026310219988226892 & cv<=0.15242976546287537\n",
      "   -4.8315 if cp>=-0.0515497252345085 & cv<=-0.041531393490731004\n",
      "   -9.0709 if pa>=0.18627186119556427\n",
      "   +2.0610 if cp>=-0.07897479236125945\n",
      "   -5.4080 if cv>=-0.039606671780347824\n",
      "Run episode 655 with rewards 14.0\n",
      "============ 656 ===========\n",
      "18 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1]\n",
      "   +0.5233 if cv<=-0.050286516547203064\n",
      "   +0.5233 if cp<=0.0038610774092376265 & cv<=-0.06026184186339365\n",
      "   -0.2056 if cv<=-0.39824419021606444\n",
      "   -0.0000 if cp>=-0.020270028151571744 & cv<=-0.039606671780347824 & cv<=-0.623085904121399 & pa>=-0.011095964722335335\n",
      "   -3.0599 if cv<=-0.6051307916641235\n",
      "--------------\n",
      "   -4.0564 if cp>=-0.0515497252345085 & cv<=-0.041531393490731004\n",
      "  +11.0487 if pa>=0.18627186119556427\n",
      "   +1.4940 if cp>=-0.07897479236125945\n",
      "   -1.3783 if cv>=-0.039606671780347824\n",
      "   -2.5371 if cv>=0.1791733056306839\n",
      "Run episode 656 with rewards 18.0\n",
      "============ 657 ===========\n",
      "13 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0]\n",
      "   +1.9186 if cv<=-0.050286516547203064\n",
      "   +1.9186 if cp<=0.0038610774092376265 & cv<=-0.06026184186339365\n",
      "   -5.3496 if cv<=-0.39824419021606444\n",
      "   -0.3537 if cv<=-0.6051307916641235\n",
      "   +2.8240 if cp>=-0.04727659374475479\n",
      "--------------\n",
      "   -0.6201 if cp>=-0.0515497252345085 & cv<=-0.041531393490731004\n",
      "   -8.7393 if pa>=0.18627186119556427\n",
      "   +3.1770 if cp>=-0.07897479236125945\n",
      "   +0.0000 if cv>=0.1791733056306839\n",
      "   -5.7244 if cv>=-0.2326713502407074\n",
      "Run episode 657 with rewards 13.0\n",
      "============ 658 ===========\n",
      "40 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1]\n",
      "   +1.9560 if cv<=-0.050286516547203064\n",
      "   -0.1697 if cp<=0.0038610774092376265 & cv<=-0.06026184186339365\n",
      "   -4.8062 if cv<=-0.39824419021606444\n",
      "   +2.7767 if cp>=-0.04727659374475479\n",
      "   +1.4193 if cp<=-0.008235304802656166 & cp>=-0.03152563944458961 & cv<=-0.5641242861747742\n",
      "--------------\n",
      "   -0.3937 if cp>=-0.0515497252345085 & cv<=-0.041531393490731004\n",
      "   +9.1783 if pa>=0.18627186119556427\n",
      "   +2.7404 if cp>=-0.07897479236125945\n",
      "   -2.2348 if cv>=-0.2326713502407074\n",
      "   +1.9295 if cv<=-0.3710662961006165\n",
      "Run episode 658 with rewards 40.0\n",
      "============ 659 ===========\n",
      "28 actions [0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0]\n",
      "   +0.5982 if cv<=-0.050286516547203064\n",
      "   -5.0213 if cv<=-0.39824419021606444\n",
      "   +4.4967 if cp>=-0.04727659374475479\n",
      "   -0.0000 if cp<=-0.008235304802656166 & cp>=-0.03152563944458961 & cv<=-0.5641242861747742\n",
      "   -6.5093 if cv<=0.030752715468406695 & pa>=0.1497717320919037\n",
      "--------------\n",
      "   +5.7607 if pa>=0.18627186119556427\n",
      "   +2.6446 if cp>=-0.07897479236125945\n",
      "   +0.0829 if cv>=-0.2326713502407074\n",
      "   +2.1972 if cv<=-0.3710662961006165\n",
      "   -2.3605 if cv>=0.030752715468406695\n",
      "Run episode 659 with rewards 28.0\n",
      "============ 660 ===========\n",
      "21 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   +0.8696 if cv<=-0.050286516547203064\n",
      "   -5.2427 if cv<=-0.39824419021606444\n",
      "   +8.3122 if cp>=-0.04727659374475479\n",
      "   +0.0086 if cv<=0.030752715468406695 & pa>=0.1497717320919037\n",
      "   -2.8443 if \n",
      "--------------\n",
      "   +5.2640 if pa>=0.18627186119556427\n",
      "   +0.4164 if cp>=-0.07897479236125945\n",
      "   +3.7787 if cv<=-0.3710662961006165\n",
      "   +0.6939 if cv>=0.030752715468406695\n",
      "   +5.3779 if cp<=-0.0413671001791954 & pav<=0.5963305473327637\n",
      "Run episode 660 with rewards 21.0\n",
      "============ 661 ===========\n",
      "27 actions [0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1]\n",
      "   +1.2076 if cv<=-0.050286516547203064\n",
      "   -4.3619 if cv<=-0.39824419021606444\n",
      "   +3.5340 if cp>=-0.04727659374475479\n",
      "   +1.5213 if \n",
      "   -1.7826 if cp<=-0.04550653696060181 & cp>=-0.04550653696060181\n",
      "--------------\n",
      "   +0.0000 if pa>=0.18627186119556427\n",
      "   +2.8248 if cv<=-0.3710662961006165\n",
      "   +2.0858 if cv>=0.030752715468406695\n",
      "   +5.2683 if cp<=-0.0413671001791954 & pav<=0.5963305473327637\n",
      "   +1.2683 if pav>=0.6657417416572571\n",
      "Run episode 661 with rewards 27.0\n",
      "============ 662 ===========\n",
      "14 actions [0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.9651 if cv<=-0.39824419021606444\n",
      "   +5.7845 if cp>=-0.04727659374475479\n",
      "   -0.5460 if \n",
      "   +0.0000 if cp<=-0.04550653696060181 & cp>=-0.04550653696060181\n",
      "   -3.6066 if cp>=-0.02697360776364803 & cv<=-0.4006426572799683 & pa<=0.04895145744085312\n",
      "--------------\n",
      "   +0.4038 if cv<=-0.3710662961006165\n",
      "   +0.6040 if cv>=0.030752715468406695\n",
      "   +5.2732 if cp<=-0.0413671001791954 & pav<=0.5963305473327637\n",
      "   +4.4707 if pav>=0.6657417416572571\n",
      "   -5.1247 if cv<=-0.4006426572799683 & pa>=0.04895145744085312 & pav<=0.9874295115470887 & pav>=0.6849217653274537\n",
      "Run episode 662 with rewards 14.0\n",
      "============ 663 ===========\n",
      "13 actions [0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1]\n",
      "   +0.5360 if cv<=-0.39824419021606444\n",
      "   +2.7468 if cp>=-0.04727659374475479\n",
      "   +1.8860 if \n",
      "   -2.4398 if cp>=-0.02697360776364803 & cv<=-0.4006426572799683 & pa<=0.04895145744085312\n",
      "   -1.6670 if pav>=1.546839952468872\n",
      "--------------\n",
      "   -5.4407 if cv>=0.030752715468406695\n",
      "   -6.9543 if cp<=-0.0413671001791954 & pav<=0.5963305473327637\n",
      "   +2.6101 if pav>=0.6657417416572571\n",
      "   -1.0608 if cv<=-0.4006426572799683 & pa>=0.04895145744085312 & pav<=0.9874295115470887 & pav>=0.6849217653274537\n",
      "   +2.4969 if pav>=1.546839952468872\n",
      "Run episode 663 with rewards 13.0\n",
      "============ 664 ===========\n",
      "11 actions [0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0]\n",
      "   +1.7233 if cp>=-0.04727659374475479\n",
      "   +3.5690 if \n",
      "   -0.0000 if cp>=-0.02697360776364803 & cv<=-0.4006426572799683 & pa<=0.04895145744085312\n",
      "   -0.0000 if pav>=1.546839952468872\n",
      "   -2.5980 if cp>=-0.06647885069251058 & cv<=-0.584407365322113\n",
      "--------------\n",
      "   +0.0000 if cv>=0.030752715468406695\n",
      "   +0.0000 if cp<=-0.0413671001791954 & pav<=0.5963305473327637\n",
      "   -4.3968 if pav>=0.6657417416572571\n",
      "   +0.0000 if pav>=1.546839952468872\n",
      "   +7.6769 if cp>=-0.09897337406873702 & cv<=-0.584407365322113\n",
      "Run episode 664 with rewards 11.0\n",
      "============ 665 ===========\n",
      "29 actions [0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.2361 if cp>=-0.04727659374475479\n",
      "   -3.4403 if \n",
      "   +0.5182 if cp>=-0.02697360776364803 & cv<=-0.4006426572799683 & pa<=0.04895145744085312\n",
      "   +0.5382 if cp>=-0.06647885069251058 & cv<=-0.584407365322113\n",
      "   +3.2362 if cp>=-0.03946101665496825\n",
      "--------------\n",
      "   +0.0000 if cv>=0.030752715468406695\n",
      "   +0.0000 if cp<=-0.0413671001791954 & pav<=0.5963305473327637\n",
      "   +3.6389 if pav>=0.6657417416572571\n",
      "   -1.1269 if cp>=-0.09897337406873702 & cv<=-0.584407365322113\n",
      "  +10.0123 if cp<=-0.03946101665496825\n",
      "Run episode 665 with rewards 29.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 666 ===========\n",
      "24 actions [0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +0.8494 if cp>=-0.04727659374475479\n",
      "   +0.8270 if \n",
      "   -3.8806 if cp>=-0.06647885069251058 & cv<=-0.584407365322113\n",
      "   +0.8494 if cp>=-0.03946101665496825\n",
      "   +3.8758 if cp<=0.03722149133682251 & cp>=-0.03286185450851915 & pa<=0.12440450489521027 & pav>=0.7082181215286261\n",
      "--------------\n",
      "   +0.9706 if cp<=-0.0413671001791954 & pav<=0.5963305473327637\n",
      "   +3.7832 if pav>=0.6657417416572571\n",
      "   +3.1911 if cp>=-0.09897337406873702 & cv<=-0.584407365322113\n",
      "   +0.9834 if cp<=-0.03946101665496825\n",
      "   -3.0940 if cp>=-0.03286185450851915 & cv<=-0.5792052030563355\n",
      "Run episode 666 with rewards 24.0\n",
      "============ 667 ===========\n",
      "38 actions [0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   +1.0790 if cp>=-0.04727659374475479\n",
      "   -2.6607 if cp>=-0.06647885069251058 & cv<=-0.584407365322113\n",
      "   +3.9313 if cp>=-0.03946101665496825\n",
      "   -1.1668 if cp<=0.03722149133682251 & cp>=-0.03286185450851915 & pa<=0.12440450489521027 & pav>=0.7082181215286261\n",
      "   -4.9270 if cp>=0.005543145630508667 & cv<=-0.16304155588150024\n",
      "--------------\n",
      "   +0.5761 if pav>=0.6657417416572571\n",
      "   +0.4754 if cp>=-0.09897337406873702 & cv<=-0.584407365322113\n",
      "   +1.8731 if cp<=-0.03946101665496825\n",
      "   +0.4754 if cp>=-0.03286185450851915 & cv<=-0.5792052030563355\n",
      "   +5.4682 if cv<=-0.355834037065506\n",
      "Run episode 667 with rewards 38.0\n",
      "============ 668 ===========\n",
      "56 actions [0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0]\n",
      "   -1.1132 if cp>=-0.06647885069251058 & cv<=-0.584407365322113\n",
      "   +5.4036 if cp>=-0.03946101665496825\n",
      "   -1.1132 if cp<=0.03722149133682251 & cp>=-0.03286185450851915 & pa<=0.12440450489521027 & pav>=0.7082181215286261\n",
      "   +0.0000 if cp>=0.005543145630508667 & cv<=-0.16304155588150024\n",
      "   +5.4347 if cv<=0.5816660642623901 & cv>=-0.3121891796588897 & pa<=0.016492818668484694 & pa>=-0.0020245578605681555\n",
      "--------------\n",
      "   +0.4574 if pav>=0.6657417416572571\n",
      "   +0.4574 if cp>=-0.09897337406873702 & cv<=-0.584407365322113\n",
      "   -0.5777 if cp<=-0.03946101665496825\n",
      "   +4.9881 if cv<=-0.355834037065506\n",
      "   +5.0029 if pa>=0.016492818668484694\n",
      "Run episode 668 with rewards 56.0\n",
      "============ 669 ===========\n",
      "23 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0]\n",
      "   -0.0000 if cp>=-0.06647885069251058 & cv<=-0.584407365322113\n",
      "   +3.3756 if cp>=-0.03946101665496825\n",
      "   -4.0320 if cp<=0.03722149133682251 & cp>=-0.03286185450851915 & pa<=0.12440450489521027 & pav>=0.7082181215286261\n",
      "   +1.7116 if cv<=0.5816660642623901 & cv>=-0.3121891796588897 & pa<=0.016492818668484694 & pa>=-0.0020245578605681555\n",
      "   +2.4306 if cp>=-0.027155796065926552\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.09897337406873702 & cv<=-0.584407365322113\n",
      "   +1.6950 if cp<=-0.03946101665496825\n",
      "   +5.8466 if cv<=-0.355834037065506\n",
      "   +4.3993 if pa>=0.016492818668484694\n",
      "   +5.0192 if cp<=-0.027155796065926552 & cp>=-0.0379655696451664 & pa<=0.05006180331110958 & pa>=0.024950450286269188 & pav<=0.639930248260498\n",
      "Run episode 669 with rewards 23.0\n",
      "============ 670 ===========\n",
      "38 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   +2.3677 if cp>=-0.03946101665496825\n",
      "   -0.4860 if cp<=0.03722149133682251 & cp>=-0.03286185450851915 & pa<=0.12440450489521027 & pav>=0.7082181215286261\n",
      "   -0.0000 if cv<=0.5816660642623901 & cv>=-0.3121891796588897 & pa<=0.016492818668484694 & pa>=-0.0020245578605681555\n",
      "   +3.2974 if cp>=-0.027155796065926552\n",
      "   +5.6734 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "--------------\n",
      "   +0.8462 if cp<=-0.03946101665496825\n",
      "   +7.3078 if cv<=-0.355834037065506\n",
      "   +3.8781 if pa>=0.016492818668484694\n",
      "   +0.0000 if cp<=-0.027155796065926552 & cp>=-0.0379655696451664 & pa<=0.05006180331110958 & pa>=0.024950450286269188 & pav<=0.639930248260498\n",
      "   -2.7900 if cp>=-0.034614034742116925\n",
      "Run episode 670 with rewards 38.0\n",
      "============ 671 ===========\n",
      "35 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +1.5594 if cp>=-0.03946101665496825\n",
      "   -2.5071 if cp<=0.03722149133682251 & cp>=-0.03286185450851915 & pa<=0.12440450489521027 & pav>=0.7082181215286261\n",
      "   +5.3296 if cp>=-0.027155796065926552\n",
      "   +2.3346 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   +3.3524 if cv<=-0.38871951699256896 & pa<=0.017361655458807947\n",
      "--------------\n",
      "   +0.5417 if cp<=-0.03946101665496825\n",
      "   +2.6514 if cv<=-0.355834037065506\n",
      "   +6.9680 if pa>=0.016492818668484694\n",
      "   -0.7237 if cp>=-0.034614034742116925\n",
      "   -0.9118 if cp<=0.007986146956682205 & cv>=-0.38871951699256896\n",
      "Run episode 671 with rewards 35.0\n",
      "============ 672 ===========\n",
      "30 actions [1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   +0.1607 if cp<=0.03722149133682251 & cp>=-0.03286185450851915 & pa<=0.12440450489521027 & pav>=0.7082181215286261\n",
      "   +4.7744 if cp>=-0.027155796065926552\n",
      "   +4.0245 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   +2.0532 if cv<=-0.38871951699256896 & pa<=0.017361655458807947\n",
      "   +1.5182 if cp>=0.000867682695388821 & cv>=0.5974749445915227\n",
      "--------------\n",
      "   +2.3354 if cv<=-0.355834037065506\n",
      "   +4.1347 if pa>=0.016492818668484694\n",
      "   +0.2143 if cp>=-0.034614034742116925\n",
      "   +1.3404 if cp<=0.007986146956682205 & cv>=-0.38871951699256896\n",
      "   -9.4642 if pa>=0.18278515338897705\n",
      "Run episode 672 with rewards 30.0\n",
      "============ 673 ===========\n",
      "31 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +4.2029 if cp>=-0.027155796065926552\n",
      "   +4.3174 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   +2.9559 if cv<=-0.38871951699256896 & pa<=0.017361655458807947\n",
      "   -0.0080 if cp>=0.000867682695388821 & cv>=0.5974749445915227\n",
      "   +2.6271 if cp>=-0.03595842123031615 & cv<=-0.5351442337036133\n",
      "--------------\n",
      "   -1.0768 if cv<=-0.355834037065506\n",
      "   +2.7093 if pa>=0.016492818668484694\n",
      "   +2.2210 if cp<=0.007986146956682205 & cv>=-0.38871951699256896\n",
      "   +0.0000 if pa>=0.18278515338897705\n",
      "   +3.1521 if cp<=-0.03595842123031615 & cv<=-0.5351442337036133\n",
      "Run episode 673 with rewards 31.0\n",
      "============ 674 ===========\n",
      "39 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +2.1969 if cp>=-0.027155796065926552\n",
      "   +5.1598 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   +3.6862 if cv<=-0.38871951699256896 & pa<=0.017361655458807947\n",
      "   +0.0776 if cp>=-0.03595842123031615 & cv<=-0.5351442337036133\n",
      "   -0.3246 if cp>=-0.0559227429330349 & pa<=0.04258175194263458\n",
      "--------------\n",
      "   -0.7676 if cv<=-0.355834037065506\n",
      "   +4.1622 if pa>=0.016492818668484694\n",
      "   +0.8379 if cp<=0.007986146956682205 & cv>=-0.38871951699256896\n",
      "   +0.1491 if cp<=-0.03595842123031615 & cv<=-0.5351442337036133\n",
      "   +0.9693 if cv<=-0.4304511249065399\n",
      "Run episode 674 with rewards 39.0\n",
      "============ 675 ===========\n",
      "55 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1]\n",
      "   +1.7443 if cp>=-0.027155796065926552\n",
      "   +5.7936 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   +1.7164 if cv<=-0.38871951699256896 & pa<=0.017361655458807947\n",
      "   +1.0665 if cp>=-0.0559227429330349 & pa<=0.04258175194263458\n",
      "   +2.4086 if cv>=0.9960935115814209\n",
      "--------------\n",
      "   -0.5476 if cv<=-0.355834037065506\n",
      "   +5.0310 if pa>=0.016492818668484694\n",
      "   -0.5417 if cp<=0.007986146956682205 & cv>=-0.38871951699256896\n",
      "   +1.3087 if cv<=-0.4304511249065399\n",
      "   -2.4950 if cv>=0.9960935115814209\n",
      "Run episode 675 with rewards 55.0\n",
      "============ 676 ===========\n",
      "45 actions [0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1]\n",
      "   +2.2209 if cp>=-0.027155796065926552\n",
      "   +4.7405 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   +4.3808 if cv<=-0.38871951699256896 & pa<=0.017361655458807947\n",
      "   +4.8620 if cv>=0.9960935115814209\n",
      "   +2.9787 if cp<=-0.02132668569684026 & cv>=0.5395361065864563 & pa<=0.01840092428028584\n",
      "--------------\n",
      "   -0.1477 if cv<=-0.355834037065506\n",
      "   +5.4388 if pa>=0.016492818668484694\n",
      "   -0.1477 if cv<=-0.4304511249065399\n",
      "   -5.4041 if cv>=0.9960935115814209\n",
      "   -2.5954 if cp<=-0.02132668569684026 & cv>=0.5395361065864563 & pa<=0.01840092428028584\n",
      "Run episode 676 with rewards 45.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 677 ===========\n",
      "56 actions [1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +6.0905 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   +2.8589 if cv<=-0.38871951699256896 & pa<=0.017361655458807947\n",
      "   +0.0004 if cv>=0.9960935115814209\n",
      "   +0.0001 if cp<=-0.02132668569684026 & cv>=0.5395361065864563 & pa<=0.01840092428028584\n",
      "   -3.9025 if cp<=-0.027831528335809708 & pa<=0.04310643374919893\n",
      "--------------\n",
      "   +4.2334 if cv<=-0.355834037065506\n",
      "   +5.2928 if pa>=0.016492818668484694\n",
      "   -0.0001 if cv>=0.9960935115814209\n",
      "   +0.0001 if cp<=-0.02132668569684026 & cv>=0.5395361065864563 & pa<=0.01840092428028584\n",
      "   +5.0342 if cp>=-0.013536681979894634 & cv>=0.07957192165777191 & pa>=0.02368280179798603\n",
      "Run episode 677 with rewards 56.0\n",
      "============ 678 ===========\n",
      "500 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +4.4005 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   -1.4219 if cv<=-0.38871951699256896 & pa<=0.017361655458807947\n",
      "   -0.0000 if cv>=0.9960935115814209\n",
      "   -0.0000 if cp<=-0.027831528335809708 & pa<=0.04310643374919893\n",
      "   +3.8268 if cp<=0.04204743355512619 & cp>=0.025603938847780228 & cv>=0.17478539049625397 & pa<=0.032073907554149635 & pa>=0.013494865968823433\n",
      "--------------\n",
      "   +6.9184 if cv<=-0.355834037065506\n",
      "   +7.0150 if pa>=0.016492818668484694\n",
      "   +0.0000 if cv>=0.9960935115814209\n",
      "   +5.6943 if cp>=-0.013536681979894634 & cv>=0.07957192165777191 & pa>=0.02368280179798603\n",
      "   -4.0822 if cp<=0.04204743355512619 & cp>=0.025603938847780228 & cv>=0.17478539049625397 & pa<=0.032073907554149635 & pa>=0.013494865968823433\n",
      "Run episode 678 with rewards 500.0\n",
      "best\n",
      "============ 679 ===========\n",
      "181 actions [1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1]\n",
      "   +5.2844 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   -1.8209 if cv<=-0.38871951699256896 & pa<=0.017361655458807947\n",
      "   +0.0000 if cp<=-0.027831528335809708 & pa<=0.04310643374919893\n",
      "   -1.8171 if cp<=0.04204743355512619 & cp>=0.025603938847780228 & cv>=0.17478539049625397 & pa<=0.032073907554149635 & pa>=0.013494865968823433\n",
      "   -3.3222 if cp<=0.07435744106769562 & cv<=0.18928985595703127 & cv>=-0.19226446449756623\n",
      "--------------\n",
      "   +7.4507 if cv<=-0.355834037065506\n",
      "   +6.2705 if pa>=0.016492818668484694\n",
      "   +6.3014 if cp>=-0.013536681979894634 & cv>=0.07957192165777191 & pa>=0.02368280179798603\n",
      "   +1.2371 if cp<=0.04204743355512619 & cp>=0.025603938847780228 & cv>=0.17478539049625397 & pa<=0.032073907554149635 & pa>=0.013494865968823433\n",
      "   +5.1923 if cp<=0.26750234961509706 & cv<=0.18928985595703127 & cv>=-0.20182600617408752 & pa>=0.030181336030364055\n",
      "Run episode 679 with rewards 181.0\n",
      "============ 680 ===========\n",
      "79 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   +4.6052 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   -0.8493 if cv<=-0.38871951699256896 & pa<=0.017361655458807947\n",
      "   -0.5697 if cp<=0.04204743355512619 & cp>=0.025603938847780228 & cv>=0.17478539049625397 & pa<=0.032073907554149635 & pa>=0.013494865968823433\n",
      "   -0.1296 if cp<=0.07435744106769562 & cv<=0.18928985595703127 & cv>=-0.19226446449756623\n",
      "   -1.9677 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "--------------\n",
      "   +6.2723 if cv<=-0.355834037065506\n",
      "  +10.4352 if pa>=0.016492818668484694\n",
      "   +1.5482 if cp>=-0.013536681979894634 & cv>=0.07957192165777191 & pa>=0.02368280179798603\n",
      "   +6.4288 if cp<=0.26750234961509706 & cv<=0.18928985595703127 & cv>=-0.20182600617408752 & pa>=0.030181336030364055\n",
      "   -7.9491 if cp>=0.006855762097984591 & pa>=0.019812779501080513 & pav<=0.2848671078681946 & pav>=-0.13741451501846313 & pav>=0.21130068600177768\n",
      "Run episode 680 with rewards 79.0\n",
      "============ 681 ===========\n",
      "183 actions [0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +4.2561 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   -0.0000 if cv<=-0.38871951699256896 & pa<=0.017361655458807947\n",
      "   -0.0000 if cp<=0.04204743355512619 & cp>=0.025603938847780228 & cv>=0.17478539049625397 & pa<=0.032073907554149635 & pa>=0.013494865968823433\n",
      "   -1.4885 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   -7.2816 if cp>=0.10262355208396912\n",
      "--------------\n",
      "   +5.7136 if cv<=-0.355834037065506\n",
      "   +9.0263 if pa>=0.016492818668484694\n",
      "   +0.8067 if cp<=0.26750234961509706 & cv<=0.18928985595703127 & cv>=-0.20182600617408752 & pa>=0.030181336030364055\n",
      "   -0.0000 if cp>=0.006855762097984591 & pa>=0.019812779501080513 & pav<=0.2848671078681946 & pav>=-0.13741451501846313 & pav>=0.21130068600177768\n",
      "   +7.5874 if cp>=0.10262355208396912\n",
      "Run episode 681 with rewards 183.0\n",
      "============ 682 ===========\n",
      "215 actions [0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +4.7122 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   +0.0000 if cv<=-0.38871951699256896 & pa<=0.017361655458807947\n",
      "   -1.2752 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "  +12.5151 if cp>=0.10262355208396912\n",
      "   +2.1548 if cp<=-0.012556010484695436 & cv>=0.40120365619659426 & pa<=0.022912210598587987 & pa>=0.007211415097117438\n",
      "--------------\n",
      "   +6.7285 if cv<=-0.355834037065506\n",
      "  +10.2284 if pa>=0.016492818668484694\n",
      "   +0.4193 if cp<=0.26750234961509706 & cv<=0.18928985595703127 & cv>=-0.20182600617408752 & pa>=0.030181336030364055\n",
      "  -12.5150 if cp>=0.10262355208396912\n",
      "   -0.7829 if cp<=0.03829369321465492 & cv>=-0.18413475155830383 & pa<=0.022912210598587987\n",
      "Run episode 682 with rewards 215.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 683 ===========\n",
      "313 actions [1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0]\n",
      "   +4.5979 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   -1.5242 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   -0.0001 if cp>=0.10262355208396912\n",
      "   +0.4302 if cp<=-0.012556010484695436 & cv>=0.40120365619659426 & pa<=0.022912210598587987 & pa>=0.007211415097117438\n",
      "   -4.5681 if cp>=0.011282020062208176 & cv>=-0.3754034459590912 & pav>=0.3639517068862915\n",
      "--------------\n",
      "   +7.0075 if cv<=-0.355834037065506\n",
      "  +10.8571 if pa>=0.016492818668484694\n",
      "   -0.0002 if cp>=0.10262355208396912\n",
      "   -0.2600 if cp<=0.03829369321465492 & cv>=-0.18413475155830383 & pa<=0.022912210598587987\n",
      "   +4.6816 if cp>=0.011282020062208176 & cv>=-0.3754034459590912 & pav>=0.3639517068862915\n",
      "Run episode 683 with rewards 313.0\n",
      "============ 684 ===========\n",
      "51 actions [0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0]\n",
      "   +4.0285 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   -2.3179 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   -0.1676 if cp<=-0.012556010484695436 & cv>=0.40120365619659426 & pa<=0.022912210598587987 & pa>=0.007211415097117438\n",
      "   -3.3725 if cp>=0.011282020062208176 & cv>=-0.3754034459590912 & pav>=0.3639517068862915\n",
      "   +4.4303 if cp<=0.0065903091803193115 & cv<=-0.15541872680187224 & cv>=-0.3479008138179779 & pa<=0.018555673211812975 & pa>=-0.015197885595262048\n",
      "--------------\n",
      "   +4.9374 if cv<=-0.355834037065506\n",
      "  +11.7621 if pa>=0.016492818668484694\n",
      "   +1.3983 if cp<=0.03829369321465492 & cv>=-0.18413475155830383 & pa<=0.022912210598587987\n",
      "   +3.4608 if cp>=0.011282020062208176 & cv>=-0.3754034459590912 & pav>=0.3639517068862915\n",
      "   -2.2845 if cp<=0.0065903091803193115 & pa<=0.018555673211812975 & pav<=0.16068623960018164\n",
      "Run episode 684 with rewards 51.0\n",
      "============ 685 ===========\n",
      "56 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +4.4757 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   -2.7670 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   -0.0000 if cp>=0.011282020062208176 & cv>=-0.3754034459590912 & pav>=0.3639517068862915\n",
      "   +0.9933 if cp<=0.0065903091803193115 & cv<=-0.15541872680187224 & cv>=-0.3479008138179779 & pa<=0.018555673211812975 & pa>=-0.015197885595262048\n",
      "   -4.0483 if cp>=-0.011767697520554054 & cv>=-0.18865907192230222 & pav>=-0.0907118096947669\n",
      "--------------\n",
      "  +10.0175 if cv<=-0.355834037065506\n",
      "   +8.5691 if pa>=0.016492818668484694\n",
      "   -0.0001 if cp>=0.011282020062208176 & cv>=-0.3754034459590912 & pav>=0.3639517068862915\n",
      "   -2.3265 if cp<=0.0065903091803193115 & pa<=0.018555673211812975 & pav<=0.16068623960018164\n",
      "   +2.7021 if cp>=-0.011767697520554054 & pa>=-0.08533065021038053 & pav>=-0.2820633053779602\n",
      "Run episode 685 with rewards 56.0\n",
      "============ 686 ===========\n",
      "42 actions [1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +2.0474 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   -0.7484 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   -0.0000 if cp<=0.0065903091803193115 & cv<=-0.15541872680187224 & cv>=-0.3479008138179779 & pa<=0.018555673211812975 & pa>=-0.015197885595262048\n",
      "   -3.7635 if cp>=-0.011767697520554054 & cv>=-0.18865907192230222 & pav>=-0.0907118096947669\n",
      "   +4.7869 if cp>=0.052984513342380524 & cv>=-0.5137308835983276 & pa<=-0.0892702043056488 & pav>=-0.09476862102746962\n",
      "--------------\n",
      "   +9.5775 if cv<=-0.355834037065506\n",
      "   -0.0001 if pa>=0.016492818668484694\n",
      "   -6.4067 if cp<=0.0065903091803193115 & pa<=0.018555673211812975 & pav<=0.16068623960018164\n",
      "   +5.2507 if cp>=-0.011767697520554054 & pa>=-0.08533065021038053 & pav>=-0.2820633053779602\n",
      "   -4.2250 if cv>=-0.5137308835983276 & pa<=-0.0892702043056488 & pav>=-0.09476862102746962\n",
      "Run episode 686 with rewards 42.0\n",
      "============ 687 ===========\n",
      "14 actions [1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1]\n",
      "   +1.0564 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   -3.1758 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   -1.2045 if cp>=-0.011767697520554054 & cv>=-0.18865907192230222 & pav>=-0.0907118096947669\n",
      "   +5.0772 if cp>=0.052984513342380524 & cv>=-0.5137308835983276 & pa<=-0.0892702043056488 & pav>=-0.09476862102746962\n",
      "   +3.4652 if pa>=-0.08225837051868438 & pav<=-0.557180118560791\n",
      "--------------\n",
      "   +3.4504 if cv<=-0.355834037065506\n",
      "   -0.5244 if cp<=0.0065903091803193115 & pa<=0.018555673211812975 & pav<=0.16068623960018164\n",
      "   +6.0591 if cp>=-0.011767697520554054 & pa>=-0.08533065021038053 & pav>=-0.2820633053779602\n",
      "   +0.7305 if cv>=-0.5137308835983276 & pa<=-0.0892702043056488 & pav>=-0.09476862102746962\n",
      "   +5.3381 if cp>=0.05466810241341592 & cv>=0.165700963139534 & pa>=-0.08225837051868438 & pav>=-0.557180118560791\n",
      "Run episode 687 with rewards 14.0\n",
      "============ 688 ===========\n",
      "15 actions [1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0]\n",
      "   -3.4429 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   -0.0040 if cp>=-0.011767697520554054 & cv>=-0.18865907192230222 & pav>=-0.0907118096947669\n",
      "   +0.0000 if cp>=0.052984513342380524 & cv>=-0.5137308835983276 & pa<=-0.0892702043056488 & pav>=-0.09476862102746962\n",
      "   +2.6104 if pa>=-0.08225837051868438 & pav<=-0.557180118560791\n",
      "  +22.0000 if cp>=0.04674165099859238\n",
      "--------------\n",
      "   -0.0000 if cv<=-0.355834037065506\n",
      "   +0.6107 if cp>=-0.011767697520554054 & pa>=-0.08533065021038053 & pav>=-0.2820633053779602\n",
      "   -0.0000 if cv>=-0.5137308835983276 & pa<=-0.0892702043056488 & pav>=-0.09476862102746962\n",
      "   -0.0000 if cp>=0.05466810241341592 & cv>=0.165700963139534 & pa>=-0.08225837051868438 & pav>=-0.557180118560791\n",
      "  -20.0000 if cp>=0.04674165099859238\n",
      "Run episode 688 with rewards 15.0\n",
      "============ 689 ===========\n",
      "13 actions [1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   -1.1715 if cp>=-0.011767697520554054 & cv>=-0.18865907192230222 & pav>=-0.0907118096947669\n",
      "   +0.0000 if pa>=-0.08225837051868438 & pav<=-0.557180118560791\n",
      "   +0.0000 if cp>=0.04674165099859238\n",
      "   +4.3720 if cp>=0.03795802742242813\n",
      "--------------\n",
      "   -1.8321 if cv<=-0.355834037065506\n",
      "   +1.6821 if cp>=-0.011767697520554054 & pa>=-0.08533065021038053 & pav>=-0.2820633053779602\n",
      "   -0.0000 if cp>=0.05466810241341592 & cv>=0.165700963139534 & pa>=-0.08225837051868438 & pav>=-0.557180118560791\n",
      "   -0.0000 if cp>=0.04674165099859238\n",
      "   -4.2446 if cp>=0.03795802742242813\n",
      "Run episode 689 with rewards 13.0\n",
      "============ 690 ===========\n",
      "55 actions [0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1]\n",
      "   -0.2213 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   +0.0000 if cp>=-0.011767697520554054 & cv>=-0.18865907192230222 & pav>=-0.0907118096947669\n",
      "   +0.0000 if cp>=0.04674165099859238\n",
      "   +0.0000 if cp>=0.03795802742242813\n",
      "   +2.4718 if cv>=0.1892169862985611\n",
      "--------------\n",
      "  +22.4707 if cv<=-0.355834037065506\n",
      "   +0.2529 if cp>=-0.011767697520554054 & pa>=-0.08533065021038053 & pav>=-0.2820633053779602\n",
      "   +0.0000 if cp>=0.04674165099859238\n",
      "   +0.6382 if cp>=0.03795802742242813\n",
      "   +1.0000 if cp<=-0.0647235631942749\n",
      "Run episode 690 with rewards 55.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 691 ===========\n",
      "45 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1]\n",
      "   +0.6731 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   +0.0000 if cp>=-0.011767697520554054 & cv>=-0.18865907192230222 & pav>=-0.0907118096947669\n",
      "   +0.0000 if cp>=0.03795802742242813\n",
      "   +2.2001 if cv>=0.1892169862985611\n",
      "   -4.9530 if cp>=-0.049146933108568186 & pa>=-0.03179724290966987 & pav>=-0.10419337600469587\n",
      "--------------\n",
      "   +5.8806 if cv<=-0.355834037065506\n",
      "   -0.0000 if cp>=-0.011767697520554054 & pa>=-0.08533065021038053 & pav>=-0.2820633053779602\n",
      "   -0.0000 if cp>=0.03795802742242813\n",
      "   +0.9861 if cp<=-0.0647235631942749\n",
      "   -1.4361 if cv<=-0.17454801499843597 & pav>=0.18681923151016236\n",
      "Run episode 691 with rewards 45.0\n",
      "============ 692 ===========\n",
      "140 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0]\n",
      "   +1.3322 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   +0.8364 if cp>=0.03795802742242813\n",
      "   +2.3139 if cv>=0.1892169862985611\n",
      "   -5.6896 if cp>=-0.049146933108568186 & pa>=-0.03179724290966987 & pav>=-0.10419337600469587\n",
      "   -4.7766 if cp<=0.055050821602344514 & cp<=0.05979763790965081 & cv<=0.05247054472565652 & cv>=0.03656104952096939\n",
      "--------------\n",
      "   +4.5009 if cv<=-0.355834037065506\n",
      "   -0.8274 if cp>=0.03795802742242813\n",
      "   +0.0000 if cp<=-0.0647235631942749\n",
      "   -1.1032 if cv<=-0.17454801499843597 & pav>=0.18681923151016236\n",
      "   +4.6826 if cp<=0.055050821602344514 & cp<=0.05979763790965081 & cv<=0.05247054472565652 & cv>=0.03656104952096939 & pa<=-0.022326898202300063 & pav>=-0.5104069352149964\n",
      "Run episode 692 with rewards 140.0\n",
      "============ 693 ===========\n",
      "30 actions [1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +1.7921 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   +3.1806 if cv>=0.1892169862985611\n",
      "   -5.9334 if cp>=-0.049146933108568186 & pa>=-0.03179724290966987 & pav>=-0.10419337600469587\n",
      "   -0.0001 if cp<=0.055050821602344514 & cp<=0.05979763790965081 & cv<=0.05247054472565652 & cv>=0.03656104952096939\n",
      "   +3.2204 if cp<=0.15199558436870575 & cp>=0.09747559428215027 & pa<=-0.035654114186763765 & pa>=-0.058777347952127454\n",
      "--------------\n",
      "   +4.4923 if cv<=-0.355834037065506\n",
      "   -0.8401 if cp>=0.03795802742242813\n",
      "   -1.6662 if cv<=-0.17454801499843597 & pav>=0.18681923151016236\n",
      "   -0.0000 if cp<=0.055050821602344514 & cp<=0.05979763790965081 & cv<=0.05247054472565652 & cv>=0.03656104952096939 & pa<=-0.022326898202300063 & pav>=-0.5104069352149964\n",
      "   +7.1824 if cp>=0.15199558436870575 & cv>=0.007548167929053308 & pa<=-0.026042421907186506 & pa>=-0.035654114186763765 & pav>=-0.26806231737136843\n",
      "Run episode 693 with rewards 30.0\n",
      "============ 694 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +1.3614 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   +2.1244 if cv>=0.1892169862985611\n",
      "   -1.0318 if cp>=-0.049146933108568186 & pa>=-0.03179724290966987 & pav>=-0.10419337600469587\n",
      "   -0.0000 if cp<=0.15199558436870575 & cp>=0.09747559428215027 & pa<=-0.035654114186763765 & pa>=-0.058777347952127454\n",
      "   -4.0912 if cp>=-0.015111393295228481\n",
      "--------------\n",
      "   +4.8717 if cv<=-0.355834037065506\n",
      "   -0.0000 if cp>=0.03795802742242813\n",
      "   -1.1558 if cv<=-0.17454801499843597 & pav>=0.18681923151016236\n",
      "   -0.0000 if cp>=0.15199558436870575 & cv>=0.007548167929053308 & pa<=-0.026042421907186506 & pa>=-0.035654114186763765 & pav>=-0.26806231737136843\n",
      "   +4.4355 if cp>=-0.015111393295228481\n",
      "Run episode 694 with rewards 10.0\n",
      "============ 695 ===========\n",
      "15 actions [1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0]\n",
      "  -10.4034 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "  +13.7582 if cv>=0.1892169862985611\n",
      "   -3.6252 if cp>=-0.049146933108568186 & pa>=-0.03179724290966987 & pav>=-0.10419337600469587\n",
      "   +7.7223 if cp>=-0.015111393295228481\n",
      "   +1.0000 if cp<=0.041873242706060416\n",
      "--------------\n",
      "   +0.0000 if cv<=-0.355834037065506\n",
      "   +0.0000 if cv<=-0.17454801499843597 & pav>=0.18681923151016236\n",
      "   +0.0000 if cp>=0.15199558436870575 & cv>=0.007548167929053308 & pa<=-0.026042421907186506 & pa>=-0.035654114186763765 & pav>=-0.26806231737136843\n",
      "   -5.4031 if cp>=-0.015111393295228481\n",
      "  -19.9912 if cp>=0.041873242706060416\n",
      "Run episode 695 with rewards 15.0\n",
      "============ 696 ===========\n",
      "37 actions [1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1]\n",
      "   -1.4889 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   +3.8302 if cv>=0.1892169862985611\n",
      "   -2.2890 if cp>=-0.049146933108568186 & pa>=-0.03179724290966987 & pav>=-0.10419337600469587\n",
      "   +1.3739 if cp>=-0.015111393295228481\n",
      "  -20.6272 if cv<=-0.6099578261375427\n",
      "--------------\n",
      "   +9.4921 if cv<=-0.355834037065506\n",
      "   +6.8392 if cv<=-0.17454801499843597 & pav>=0.18681923151016236\n",
      "  -12.5281 if cp>=-0.015111393295228481\n",
      "   -1.1591 if cp>=0.041873242706060416\n",
      "   +1.0000 if cp<=-0.0694348469376564\n",
      "Run episode 696 with rewards 37.0\n",
      "============ 697 ===========\n",
      "41 actions [0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1]\n",
      "   -0.1120 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   +4.6857 if cv>=0.1892169862985611\n",
      "   -3.0231 if cp>=-0.049146933108568186 & pa>=-0.03179724290966987 & pav>=-0.10419337600469587\n",
      "   -0.0000 if cv<=-0.6099578261375427\n",
      "   -4.0268 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "--------------\n",
      "   +3.1952 if cv<=-0.355834037065506\n",
      "   +0.5009 if cv<=-0.17454801499843597 & pav>=0.18681923151016236\n",
      "   -4.0443 if cp>=-0.015111393295228481\n",
      "   -0.0000 if cp>=0.041873242706060416\n",
      "   -4.9066 if cp<=-0.017561182007193567 & cp>=-0.021064428985118865 & cv<=0.02617583200335503 & pa>=-0.06073121577501297\n",
      "Run episode 697 with rewards 41.0\n",
      "============ 698 ===========\n",
      "85 actions [1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0]\n",
      "   -0.3726 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   +4.7363 if cv>=0.1892169862985611\n",
      "   -0.0000 if cp>=-0.049146933108568186 & pa>=-0.03179724290966987 & pav>=-0.10419337600469587\n",
      "   -3.5232 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "   -3.0415 if pa>=-0.037713561207056046\n",
      "--------------\n",
      "   +1.5980 if cv<=-0.355834037065506\n",
      "   +2.6603 if cv<=-0.17454801499843597 & pav>=0.18681923151016236\n",
      "   -5.0419 if cp>=-0.015111393295228481\n",
      "   -3.3049 if cp<=-0.017561182007193567 & cp>=-0.021064428985118865 & cv<=0.02617583200335503 & pa>=-0.06073121577501297\n",
      "   +3.2376 if pa>=-0.037713561207056046\n",
      "Run episode 698 with rewards 85.0\n",
      "============ 699 ===========\n",
      "28 actions [1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0]\n",
      "   -1.7105 if cp<=0.02906462922692299 & cv>=-0.19317975640296936 & pav>=-0.5581390857696533\n",
      "   +7.6042 if cv>=0.1892169862985611\n",
      "   -2.4589 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "   +2.0877 if pa>=-0.037713561207056046\n",
      "   -5.3311 if pa>=-0.03850002065300941\n",
      "--------------\n",
      "   +6.9078 if cv<=-0.17454801499843597 & pav>=0.18681923151016236\n",
      "   -7.0368 if cp>=-0.015111393295228481\n",
      "   +0.0001 if cp<=-0.017561182007193567 & cp>=-0.021064428985118865 & cv<=0.02617583200335503 & pa>=-0.06073121577501297\n",
      "   +1.0857 if pa>=-0.037713561207056046\n",
      "   +4.0328 if pa>=-0.03850002065300941\n",
      "Run episode 699 with rewards 28.0\n",
      "============ 700 ===========\n",
      "80 actions [1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 1]\n",
      "   +2.6286 if cv>=0.1892169862985611\n",
      "   -2.6040 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "   -0.0221 if pa>=-0.037713561207056046\n",
      "   -3.3741 if pa>=-0.03850002065300941\n",
      "   -3.0358 if pav>=0.48719537258148193\n",
      "--------------\n",
      "   +3.4987 if cv<=-0.17454801499843597 & pav>=0.18681923151016236\n",
      "   -6.2721 if cp>=-0.015111393295228481\n",
      "   +0.4640 if pa>=-0.037713561207056046\n",
      "   +1.2432 if pa>=-0.03850002065300941\n",
      "   +5.1194 if pav>=0.48719537258148193\n",
      "Run episode 700 with rewards 80.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 701 ===========\n",
      "43 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0]\n",
      "   +2.9139 if cv>=0.1892169862985611\n",
      "   -3.5867 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "   -3.7050 if pa>=-0.03850002065300941\n",
      "   -1.9156 if pav>=0.48719537258148193\n",
      "   +3.0625 if cp>=-0.014220194704830642 & cv<=0.00796423787251116 & cv>=-0.35157954692840576 & pa>=-0.0018889692611992245\n",
      "--------------\n",
      "   +3.7189 if cv<=-0.17454801499843597 & pav>=0.18681923151016236\n",
      "   -7.5978 if cp>=-0.015111393295228481\n",
      "   +3.4619 if pa>=-0.03850002065300941\n",
      "   +4.2766 if pav>=0.48719537258148193\n",
      "   -2.7002 if cp>=-0.014220194704830642 & cv<=0.00796423787251116 & cv>=-0.35157954692840576 & pa>=-0.0018889692611992245\n",
      "Run episode 701 with rewards 43.0\n",
      "============ 702 ===========\n",
      "42 actions [0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0]\n",
      "   +2.3051 if cv>=0.1892169862985611\n",
      "   +0.0000 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "   -3.3455 if pa>=-0.03850002065300941\n",
      "   +0.0000 if cp>=-0.014220194704830642 & cv<=0.00796423787251116 & cv>=-0.35157954692840576 & pa>=-0.0018889692611992245\n",
      "   -3.6753 if cp>=-0.035480418056249616 & cv<=-0.5028872013092041\n",
      "--------------\n",
      "   +2.5283 if cv<=-0.17454801499843597 & pav>=0.18681923151016236\n",
      "   -5.6222 if cp>=-0.015111393295228481\n",
      "   +3.6163 if pa>=-0.03850002065300941\n",
      "   +4.9481 if pav>=0.48719537258148193\n",
      "   +2.8129 if cp<=-0.04529189988970756 & pa>=-0.0931693524122238\n",
      "Run episode 702 with rewards 42.0\n",
      "============ 703 ===========\n",
      "29 actions [1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0]\n",
      "   +5.4606 if cv>=0.1892169862985611\n",
      "   +3.0234 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "   -4.8184 if pa>=-0.03850002065300941\n",
      "   -2.1192 if cp>=-0.035480418056249616 & cv<=-0.5028872013092041\n",
      "   -3.4219 if pa>=-0.023259121924638748\n",
      "--------------\n",
      "   -6.1462 if cp>=-0.015111393295228481\n",
      "   +3.7638 if pa>=-0.03850002065300941\n",
      "   +5.8776 if pav>=0.48719537258148193\n",
      "   -0.0001 if cp<=-0.04529189988970756 & pa>=-0.0931693524122238\n",
      "   +3.0470 if cp>=-0.03904662877321243 & cv<=-0.19197620153427122\n",
      "Run episode 703 with rewards 29.0\n",
      "============ 704 ===========\n",
      "44 actions [0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0]\n",
      "   +3.1184 if cv>=0.1892169862985611\n",
      "   +2.7043 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "   -2.7223 if pa>=-0.03850002065300941\n",
      "   +0.0000 if pa>=-0.023259121924638748\n",
      "   +3.5971 if cp>=-0.04776382893323898 & pa>=-0.05607988983392709 & pav<=0.024232217669487063\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.015111393295228481\n",
      "   +3.2695 if pa>=-0.03850002065300941\n",
      "   +2.9015 if pav>=0.48719537258148193\n",
      "   +0.7325 if cp>=-0.03904662877321243 & cv<=-0.19197620153427122\n",
      "   +3.5983 if cp>=-0.04776382893323898 & pa>=-0.05607988983392709 & pav>=0.024232217669487063\n",
      "Run episode 704 with rewards 44.0\n",
      "============ 705 ===========\n",
      "109 actions [0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1]\n",
      "   +3.2710 if cv>=0.1892169862985611\n",
      "   +4.9736 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "   -2.3634 if pa>=-0.03850002065300941\n",
      "   +2.9149 if cp>=-0.04776382893323898 & pa>=-0.05607988983392709 & pav<=0.024232217669487063\n",
      "   -3.7868 if pa>=0.03478226065635681\n",
      "--------------\n",
      "   +3.2320 if pa>=-0.03850002065300941\n",
      "   -0.0000 if pav>=0.48719537258148193\n",
      "   +0.1671 if cp>=-0.03904662877321243 & cv<=-0.19197620153427122\n",
      "   +1.9859 if cp>=-0.04776382893323898 & pa>=-0.05607988983392709 & pav>=0.024232217669487063\n",
      "   +3.9504 if pa>=0.03478226065635681\n",
      "Run episode 705 with rewards 109.0\n",
      "============ 706 ===========\n",
      "68 actions [1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1]\n",
      "   +0.4584 if cv>=0.1892169862985611\n",
      "   +3.5957 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "   +2.9736 if cp>=-0.04776382893323898 & pa>=-0.05607988983392709 & pav<=0.024232217669487063\n",
      "   -1.7172 if pa>=0.03478226065635681\n",
      "   +5.0091 if cp<=0.075119623541832 & cv>=0.21265302300453187 & pa<=0.009697789140045657\n",
      "--------------\n",
      "   +3.1881 if pa>=-0.03850002065300941\n",
      "   +1.4941 if cp>=-0.03904662877321243 & cv<=-0.19197620153427122\n",
      "   +2.9276 if cp>=-0.04776382893323898 & pa>=-0.05607988983392709 & pav>=0.024232217669487063\n",
      "   +2.0172 if pa>=0.03478226065635681\n",
      "   -4.3695 if pa<=0.009697789140045657 & pa>=-0.015755659341812115 & pav<=-0.4268376469612121\n",
      "Run episode 706 with rewards 68.0\n",
      "============ 707 ===========\n",
      "64 actions [0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1]\n",
      "   -0.7514 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "   +3.4485 if cp>=-0.04776382893323898 & pa>=-0.05607988983392709 & pav<=0.024232217669487063\n",
      "   -0.0000 if pa>=0.03478226065635681\n",
      "   +4.7855 if cp<=0.075119623541832 & cv>=0.21265302300453187 & pa<=0.009697789140045657\n",
      "   +3.3818 if pa>=0.026700621470808983\n",
      "--------------\n",
      "   +2.8721 if pa>=-0.03850002065300941\n",
      "   +5.7408 if cp>=-0.04776382893323898 & pa>=-0.05607988983392709 & pav>=0.024232217669487063\n",
      "   -0.0000 if pa>=0.03478226065635681\n",
      "   -0.5401 if pa<=0.009697789140045657 & pa>=-0.015755659341812115 & pav<=-0.4268376469612121\n",
      "   -3.1539 if pa>=0.026700621470808983\n",
      "Run episode 707 with rewards 64.0\n",
      "============ 708 ===========\n",
      "69 actions [1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1]\n",
      "   -3.3036 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "   +5.1880 if cp>=-0.04776382893323898 & pa>=-0.05607988983392709 & pav<=0.024232217669487063\n",
      "   +2.9712 if cp<=0.075119623541832 & cv>=0.21265302300453187 & pa<=0.009697789140045657\n",
      "   -0.0000 if pa>=0.026700621470808983\n",
      "   +5.2864 if cp>=0.04412740245461464 & cv>=-0.19487300813198088 & pa>=-0.022463067248463624\n",
      "--------------\n",
      "   +2.9007 if pa>=-0.03850002065300941\n",
      "   +3.9631 if cp>=-0.04776382893323898 & pa>=-0.05607988983392709 & pav>=0.024232217669487063\n",
      "   -0.0000 if pa<=0.009697789140045657 & pa>=-0.015755659341812115 & pav<=-0.4268376469612121\n",
      "   -0.0000 if pa>=0.026700621470808983\n",
      "   -2.1421 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "Run episode 708 with rewards 69.0\n",
      "============ 709 ===========\n",
      "81 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 1]\n",
      "   +2.1567 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "   +2.2863 if cp>=-0.04776382893323898 & pa>=-0.05607988983392709 & pav<=0.024232217669487063\n",
      "   +3.6277 if cp<=0.075119623541832 & cv>=0.21265302300453187 & pa<=0.009697789140045657\n",
      "   +0.0000 if cp>=0.04412740245461464 & cv>=-0.19487300813198088 & pa>=-0.022463067248463624\n",
      "   -4.8638 if pa>=-0.030518822371959686\n",
      "--------------\n",
      "   +3.8258 if pa>=-0.03850002065300941\n",
      "   +4.2510 if cp>=-0.04776382893323898 & pa>=-0.05607988983392709 & pav>=0.024232217669487063\n",
      "   +0.0000 if pa>=0.026700621470808983\n",
      "   -3.9932 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   -5.0166 if cp<=0.026582035049796105 & cp>=-0.41823059320449824 & cv>=-0.9277861595153809 & pa<=-0.07009865790605545 & pav<=0.2624934852123261\n",
      "Run episode 709 with rewards 81.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 710 ===========\n",
      "56 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1]\n",
      "   -0.0259 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "   -0.0059 if cp>=-0.04776382893323898 & pa>=-0.05607988983392709 & pav<=0.024232217669487063\n",
      "   +4.1563 if cp<=0.075119623541832 & cv>=0.21265302300453187 & pa<=0.009697789140045657\n",
      "   -5.2721 if pa>=-0.030518822371959686\n",
      "   -3.6539 if pav>=1.0696226358413696\n",
      "--------------\n",
      "   +4.4392 if pa>=-0.03850002065300941\n",
      "   +3.6552 if cp>=-0.04776382893323898 & pa>=-0.05607988983392709 & pav>=0.024232217669487063\n",
      "   -4.6428 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   -2.4335 if cp<=0.026582035049796105 & cp>=-0.41823059320449824 & cv>=-0.9277861595153809 & pa<=-0.07009865790605545 & pav<=0.2624934852123261\n",
      "   +3.6546 if pav>=1.0696226358413696\n",
      "Run episode 710 with rewards 56.0\n",
      "============ 711 ===========\n",
      "59 actions [1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0]\n",
      "   -0.3485 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "   +1.3685 if cp<=0.075119623541832 & cv>=0.21265302300453187 & pa<=0.009697789140045657\n",
      "   -4.3451 if pa>=-0.030518822371959686\n",
      "   -0.0029 if pav>=1.0696226358413696\n",
      "   +3.1369 if pa>=-0.07599802315235134\n",
      "--------------\n",
      "   +2.7073 if pa>=-0.03850002065300941\n",
      "   -0.0000 if cp>=-0.04776382893323898 & pa>=-0.05607988983392709 & pav>=0.024232217669487063\n",
      "   -4.5265 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   +0.0003 if pav>=1.0696226358413696\n",
      "   -4.5935 if cp<=0.04629714787006378 & cv<=-0.1810250282287597 & cv>=-0.5992398858070374 & pav>=-0.30699750781059265\n",
      "Run episode 711 with rewards 59.0\n",
      "============ 712 ===========\n",
      "39 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -0.6184 if cv<=0.02617583200335503 & cv>=-0.17208473682403563 & pa>=-0.047200413048267366\n",
      "   +2.8189 if cp<=0.075119623541832 & cv>=0.21265302300453187 & pa<=0.009697789140045657\n",
      "   -8.4380 if pa>=-0.030518822371959686\n",
      "   +0.7026 if pa>=-0.07599802315235134\n",
      "   +5.0132 if cp<=0.06186518445611003 & pa>=-0.048528204858303066\n",
      "--------------\n",
      "   +2.0716 if pa>=-0.03850002065300941\n",
      "   -5.3462 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   -0.7203 if pav>=1.0696226358413696\n",
      "   -2.4726 if cp<=0.04629714787006378 & cv<=-0.1810250282287597 & cv>=-0.5992398858070374 & pav>=-0.30699750781059265\n",
      "   +6.0718 if cp>=0.06186518445611003 & cv<=-0.39094918966293335 & pa>=-0.10297572612762451\n",
      "Run episode 712 with rewards 39.0\n",
      "============ 713 ===========\n",
      "44 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0]\n",
      "   +2.2870 if cp<=0.075119623541832 & cv>=0.21265302300453187 & pa<=0.009697789140045657\n",
      "   -3.7987 if pa>=-0.030518822371959686\n",
      "   +0.2952 if pa>=-0.07599802315235134\n",
      "   +0.1904 if cp<=0.06186518445611003 & pa>=-0.048528204858303066\n",
      "   -1.7890 if cp>=0.04458161592483522 & cv<=-0.18475767374038676 & pa>=-0.07823140621185302\n",
      "--------------\n",
      "   +3.7485 if pa>=-0.03850002065300941\n",
      "   -6.2535 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   -4.1542 if cp<=0.04629714787006378 & cv<=-0.1810250282287597 & cv>=-0.5992398858070374 & pav>=-0.30699750781059265\n",
      "   +2.9651 if cp>=0.06186518445611003 & cv<=-0.39094918966293335 & pa>=-0.10297572612762451\n",
      "   +2.5925 if cp>=0.04458161592483522 & cv<=-0.18475767374038676 & pa>=-0.07823140621185302 & pav>=-0.8812572479248046\n",
      "Run episode 713 with rewards 44.0\n",
      "============ 714 ===========\n",
      "89 actions [1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1]\n",
      "   +3.3274 if cp<=0.075119623541832 & cv>=0.21265302300453187 & pa<=0.009697789140045657\n",
      "   -3.9392 if pa>=-0.030518822371959686\n",
      "   +0.8860 if pa>=-0.07599802315235134\n",
      "   -2.5818 if cp>=0.04458161592483522 & cv<=-0.18475767374038676 & pa>=-0.07823140621185302\n",
      "   +3.1629 if cp>=0.04017169401049615 & cv<=-0.3665565848350525 & pa<=-0.11248192042112351\n",
      "--------------\n",
      "   +1.7379 if pa>=-0.03850002065300941\n",
      "   -5.7957 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   -2.9265 if cp<=0.04629714787006378 & cv<=-0.1810250282287597 & cv>=-0.5992398858070374 & pav>=-0.30699750781059265\n",
      "   +5.5013 if cp>=0.06186518445611003 & cv<=-0.39094918966293335 & pa>=-0.10297572612762451\n",
      "   -2.8508 if cp>=0.07865175604820251 & cv<=-0.3665565848350525\n",
      "Run episode 714 with rewards 89.0\n",
      "origin 616.3175596180145 new 629.1829403139513 not updated\n",
      "============ 715 ===========\n",
      "48 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   +2.6372 if cp<=0.075119623541832 & cv>=0.21265302300453187 & pa<=0.009697789140045657\n",
      "   -7.8061 if pa>=-0.030518822371959686\n",
      "   -3.3043 if cp>=0.04458161592483522 & cv<=-0.18475767374038676 & pa>=-0.07823140621185302\n",
      "   +4.4530 if cp>=0.04017169401049615 & cv<=-0.3665565848350525 & pa<=-0.11248192042112351\n",
      "   +4.3180 if pa>=-0.031191036850214\n",
      "--------------\n",
      "   +1.7379 if pa>=-0.03850002065300941\n",
      "   -5.7957 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   -2.9265 if cp<=0.04629714787006378 & cv<=-0.1810250282287597 & cv>=-0.5992398858070374 & pav>=-0.30699750781059265\n",
      "   +5.5013 if cp>=0.06186518445611003 & cv<=-0.39094918966293335 & pa>=-0.10297572612762451\n",
      "   -2.8508 if cp>=0.07865175604820251 & cv<=-0.3665565848350525\n",
      "Run episode 715 with rewards 48.0\n",
      "============ 716 ===========\n",
      "29 actions [0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1]\n",
      "   -5.6694 if pa>=-0.030518822371959686\n",
      "   -5.4648 if cp>=0.04458161592483522 & cv<=-0.18475767374038676 & pa>=-0.07823140621185302\n",
      "   +1.2916 if cp>=0.04017169401049615 & cv<=-0.3665565848350525 & pa<=-0.11248192042112351\n",
      "   +3.0742 if pa>=-0.031191036850214\n",
      "   -2.6945 if pav>=1.1673734188079834\n",
      "--------------\n",
      "   -6.3009 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   -2.7320 if cp<=0.04629714787006378 & cv<=-0.1810250282287597 & cv>=-0.5992398858070374 & pav>=-0.30699750781059265\n",
      "   +4.9719 if cp>=0.06186518445611003 & cv<=-0.39094918966293335 & pa>=-0.10297572612762451\n",
      "   -2.3129 if cp>=0.07865175604820251 & cv<=-0.3665565848350525\n",
      "   +1.7181 if cp>=0.04075162932276726 & pav<=0.02081843167543418\n",
      "Run episode 716 with rewards 29.0\n",
      "============ 717 ===========\n",
      "26 actions [1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0]\n",
      "   -1.9185 if pa>=-0.030518822371959686\n",
      "   -3.8493 if cp>=0.04458161592483522 & cv<=-0.18475767374038676 & pa>=-0.07823140621185302\n",
      "   -1.3119 if pa>=-0.031191036850214\n",
      "  +15.8328 if pav>=1.1673734188079834\n",
      "   +0.9031 if cv<=0.20975317358970644 & cv>=-0.3790894687175751\n",
      "--------------\n",
      "   -6.3531 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   +3.3285 if cp<=0.04629714787006378 & cv<=-0.1810250282287597 & cv>=-0.5992398858070374 & pav>=-0.30699750781059265\n",
      "   +0.0000 if cp>=0.06186518445611003 & cv<=-0.39094918966293335 & pa>=-0.10297572612762451\n",
      "   +0.0103 if cp>=0.07865175604820251 & cv<=-0.3665565848350525\n",
      "   +3.6935 if cp<=0.07811114192008972 & cp>=0.05779665932059289 & cv>=0.20975317358970644\n",
      "Run episode 717 with rewards 26.0\n",
      "============ 718 ===========\n",
      "41 actions [1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0]\n",
      "   -2.7567 if pa>=-0.030518822371959686\n",
      "   +0.0000 if cp>=0.04458161592483522 & cv<=-0.18475767374038676 & pa>=-0.07823140621185302\n",
      "   -2.7567 if pa>=-0.031191036850214\n",
      "   +0.0000 if pav>=1.1673734188079834\n",
      "   +1.0870 if cp<=0.041605349630117416 & pa>=-0.12886464595794678\n",
      "--------------\n",
      "   -3.0765 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   +3.7139 if cp<=0.04629714787006378 & cv<=-0.1810250282287597 & cv>=-0.5992398858070374 & pav>=-0.30699750781059265\n",
      "   +0.0000 if cp>=0.07865175604820251 & cv<=-0.3665565848350525\n",
      "   +0.0000 if cp<=0.07811114192008972 & cp>=0.05779665932059289 & cv>=0.20975317358970644\n",
      "   -2.6833 if cv>=0.7460460662841797\n",
      "Run episode 718 with rewards 41.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 719 ===========\n",
      "33 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0]\n",
      "   -4.6995 if pa>=-0.030518822371959686\n",
      "   -4.6995 if pa>=-0.031191036850214\n",
      "   +0.0000 if pav>=1.1673734188079834\n",
      "   +6.7651 if cp<=0.041605349630117416 & pa>=-0.12886464595794678\n",
      "   +0.7213 if pa>=-0.08575988560914993\n",
      "--------------\n",
      "   -5.1188 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   +0.4418 if cp<=0.04629714787006378 & cv<=-0.1810250282287597 & cv>=-0.5992398858070374 & pav>=-0.30699750781059265\n",
      "   -1.6278 if cp<=0.07811114192008972 & cp>=0.05779665932059289 & cv>=0.20975317358970644\n",
      "   +2.9306 if cv>=0.7460460662841797\n",
      "   +4.3649 if cp>=0.10349424928426743 & pa<=-0.10887056589126587 & pav>=-0.02769304625689965\n",
      "Run episode 719 with rewards 33.0\n",
      "============ 720 ===========\n",
      "41 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0]\n",
      "   -4.7386 if pa>=-0.030518822371959686\n",
      "   -4.7386 if pa>=-0.031191036850214\n",
      "   -0.0142 if cp<=0.041605349630117416 & pa>=-0.12886464595794678\n",
      "   +0.8443 if pa>=-0.08575988560914993\n",
      "   -3.4093 if cp>=0.1470099538564682\n",
      "--------------\n",
      "   -4.7178 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   +0.6238 if cp<=0.07811114192008972 & cp>=0.05779665932059289 & cv>=0.20975317358970644\n",
      "   +0.0641 if cv>=0.7460460662841797\n",
      "   +3.1161 if cp>=0.10349424928426743 & pa<=-0.10887056589126587 & pav>=-0.02769304625689965\n",
      "   +4.0670 if cp>=0.1470099538564682\n",
      "Run episode 720 with rewards 41.0\n",
      "============ 721 ===========\n",
      "36 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1]\n",
      "   -4.3012 if pa>=-0.030518822371959686\n",
      "   -4.3012 if pa>=-0.031191036850214\n",
      "   +3.4718 if pa>=-0.08575988560914993\n",
      "   -0.0000 if cp>=0.1470099538564682\n",
      "   -3.0472 if cp>=0.07487835735082626 & cv<=-0.5289833545684814\n",
      "--------------\n",
      "   -4.5667 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   -0.5498 if cp<=0.07811114192008972 & cp>=0.05779665932059289 & cv>=0.20975317358970644\n",
      "   -0.0000 if cp>=0.10349424928426743 & pa<=-0.10887056589126587 & pav>=-0.02769304625689965\n",
      "   -0.0000 if cp>=0.1470099538564682\n",
      "   +3.0472 if cp>=0.07487835735082626 & cv<=-0.5289833545684814\n",
      "Run episode 721 with rewards 36.0\n",
      "============ 722 ===========\n",
      "38 actions [1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0]\n",
      "   -6.6429 if pa>=-0.030518822371959686\n",
      "   +1.4479 if pa>=-0.031191036850214\n",
      "   +0.5688 if pa>=-0.08575988560914993\n",
      "   +0.0000 if cp>=0.07487835735082626 & cv<=-0.5289833545684814\n",
      "   +3.9969 if cp>=0.054877445101737976 & pav>=-0.07983152568340264\n",
      "--------------\n",
      "   -3.3203 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   -0.9457 if cp<=0.07811114192008972 & cp>=0.05779665932059289 & cv>=0.20975317358970644\n",
      "   +0.0000 if cp>=0.1470099538564682\n",
      "   +0.0000 if cp>=0.07487835735082626 & cv<=-0.5289833545684814\n",
      "   -4.0028 if cp>=0.054877445101737976 & pav>=-0.07983152568340264\n",
      "Run episode 722 with rewards 38.0\n",
      "============ 723 ===========\n",
      "17 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0]\n",
      "   -3.1649 if pa>=-0.030518822371959686\n",
      "   -3.1649 if pa>=-0.031191036850214\n",
      "   -1.0350 if pa>=-0.08575988560914993\n",
      "   +1.3086 if cp>=0.054877445101737976 & pav>=-0.07983152568340264\n",
      "   +2.2278 if pa>=-0.05446858629584313\n",
      "--------------\n",
      "   -4.0792 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   -0.9070 if cp<=0.07811114192008972 & cp>=0.05779665932059289 & cv>=0.20975317358970644\n",
      "   -0.3795 if cp>=0.07487835735082626 & cv<=-0.5289833545684814\n",
      "   -1.2380 if cp>=0.054877445101737976 & pav>=-0.07983152568340264\n",
      "   +2.6069 if pav>=1.3766132593154907\n",
      "Run episode 723 with rewards 17.0\n",
      "============ 724 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.3984 if pa>=-0.030518822371959686\n",
      "   -3.3984 if pa>=-0.031191036850214\n",
      "   -0.0000 if cp>=0.054877445101737976 & pav>=-0.07983152568340264\n",
      "   +1.7864 if pa>=-0.05446858629584313\n",
      "   +1.3009 if cv<=0.5757819294929505\n",
      "--------------\n",
      "  +14.3158 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   +6.6765 if cp<=0.07811114192008972 & cp>=0.05779665932059289 & cv>=0.20975317358970644\n",
      "   +0.8191 if cp>=0.054877445101737976 & pav>=-0.07983152568340264\n",
      "   +1.7247 if pav>=1.3766132593154907\n",
      "   -1.4207 if cv<=0.06799533199518926 & pa<=-0.03155852705240248\n",
      "Run episode 724 with rewards 10.0\n",
      "============ 725 ===========\n",
      "12 actions [1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   -0.8701 if pa>=-0.030518822371959686\n",
      "   -0.8701 if pa>=-0.031191036850214\n",
      "   -0.8701 if pa>=-0.05446858629584313\n",
      "   -0.6870 if cv<=0.5757819294929505\n",
      "   -0.8701 if \n",
      "--------------\n",
      "  -15.8503 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   -6.8533 if cp<=0.07811114192008972 & cp>=0.05779665932059289 & cv>=0.20975317358970644\n",
      "   -1.7510 if pav>=1.3766132593154907\n",
      "   -1.4424 if cv<=0.06799533199518926 & pa<=-0.03155852705240248\n",
      "   +0.3753 if cp>=0.11249744296073914\n",
      "Run episode 725 with rewards 12.0\n",
      "origin 0.8214143081085442 new 0.8246802275067997 not updated\n",
      "============ 726 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.8701 if pa>=-0.030518822371959686\n",
      "   -0.8701 if pa>=-0.031191036850214\n",
      "   -0.8701 if pa>=-0.05446858629584313\n",
      "   -0.6870 if cv<=0.5757819294929505\n",
      "   -0.8701 if \n",
      "--------------\n",
      "  +15.8503 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   +6.8533 if cp<=0.07811114192008972 & cp>=0.05779665932059289 & cv>=0.20975317358970644\n",
      "   +1.7510 if pav>=1.3766132593154907\n",
      "   +1.4424 if cv<=0.06799533199518926 & pa<=-0.03155852705240248\n",
      "   +1.0000 if cp>=0.1427488625049591\n",
      "Run episode 726 with rewards 10.0\n",
      "============ 727 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   -0.8234 if pa>=-0.030518822371959686\n",
      "   -0.8234 if pa>=-0.031191036850214\n",
      "   -0.8234 if pa>=-0.05446858629584313\n",
      "   -0.8234 if \n",
      "   -0.8234 if \n",
      "--------------\n",
      "  -17.0742 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   -7.2410 if cp<=0.07811114192008972 & cp>=0.05779665932059289 & cv>=0.20975317358970644\n",
      "   -1.8447 if pav>=1.3766132593154907\n",
      "   -1.5195 if cv<=0.06799533199518926 & pa<=-0.03155852705240248\n",
      "   +0.7606 if cp>=0.11492908298969269\n",
      "Run episode 727 with rewards 9.0\n",
      "============ 728 ===========\n",
      "25 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1]\n",
      "   -0.4133 if pa>=-0.030518822371959686\n",
      "   -0.4133 if pa>=-0.031191036850214\n",
      "   +4.2471 if \n",
      "   -7.6054 if cp<=0.007558041810989382\n",
      "   +4.6565 if cp>=-0.004436877835541963\n",
      "--------------\n",
      "  +17.0742 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   +7.2410 if cp<=0.07811114192008972 & cp>=0.05779665932059289 & cv>=0.20975317358970644\n",
      "   +1.8447 if pav>=1.3766132593154907\n",
      "   +1.5195 if cv<=0.06799533199518926 & pa<=-0.03155852705240248\n",
      "   +1.0000 if cp>=0.09605304896831512\n",
      "Run episode 728 with rewards 25.0\n",
      "============ 729 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   -1.0225 if pa>=-0.031191036850214\n",
      "   -1.0224 if \n",
      "   -2.4580 if cp<=0.007558041810989382\n",
      "   +4.7019 if cp>=-0.004436877835541963\n",
      "   +2.3810 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "--------------\n",
      "  -16.0460 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   +1.4093 if cp<=0.07811114192008972 & cp>=0.05779665932059289 & cv>=0.20975317358970644\n",
      "   +0.9864 if pav>=1.3766132593154907\n",
      "   +0.2965 if cv<=0.06799533199518926 & pa<=-0.03155852705240248\n",
      "   +1.0000 if cp>=0.05242711752653129 & cv>=1.4928545951843262\n",
      "Run episode 729 with rewards 10.0\n",
      "============ 730 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -4.8985 if pa>=-0.031191036850214\n",
      "   +2.5268 if cp<=0.007558041810989382\n",
      "  -27.8866 if cp>=-0.004436877835541963\n",
      "  -11.1921 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "   +0.1904 if cp>=0.06870026886463165\n",
      "--------------\n",
      "  +16.7224 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   +2.1422 if cp<=0.07811114192008972 & cp>=0.05779665932059289 & cv>=0.20975317358970644\n",
      "   +0.9347 if pav>=1.3766132593154907\n",
      "   +0.9476 if cp>=0.05242711752653129 & cv>=1.4928545951843262\n",
      "   +1.0000 if cp<=0.00013828594237566636 & cv>=0.7564861893653869\n",
      "Run episode 730 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 731 ===========\n",
      "40 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -1.5786 if pa>=-0.031191036850214\n",
      "   -2.7228 if cp<=0.007558041810989382\n",
      "  +36.3158 if cp>=-0.004436877835541963\n",
      "  +11.6649 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "   +1.0000 if cp>=-0.016388232260942458\n",
      "--------------\n",
      "   -0.0000 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   -0.0000 if cp<=0.07811114192008972 & cp>=0.05779665932059289 & cv>=0.20975317358970644\n",
      "   -0.0000 if cp>=0.05242711752653129 & cv>=1.4928545951843262\n",
      "   +0.0000 if cp<=0.00013828594237566636 & cv>=0.7564861893653869\n",
      "   +1.0544 if cp<=-0.03311111629009247\n",
      "Run episode 731 with rewards 40.0\n",
      "============ 732 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   -0.6963 if pa>=-0.031191036850214\n",
      "   -2.5263 if cp<=0.007558041810989382\n",
      "   +4.0529 if cp>=-0.004436877835541963\n",
      "   +6.4454 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "   +3.6055 if cp<=-0.10507812052965164 & cv>=0.25810013711452523 & pa>=0.16520115435123445\n",
      "--------------\n",
      "   +0.0000 if cp>=0.04412740245461464 & cv>=-0.19487300813198088\n",
      "   +0.0000 if cp>=0.05242711752653129 & cv>=1.4928545951843262\n",
      "   +0.9469 if cp<=0.00013828594237566636 & cv>=0.7564861893653869\n",
      "   +0.6671 if cp<=-0.03311111629009247\n",
      "   -4.2801 if cp<=-0.10507812052965164 & cv>=0.25810013711452523\n",
      "Run episode 732 with rewards 9.0\n",
      "============ 733 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +22.4675 if cp<=0.007558041810989382\n",
      "   +0.8864 if cp>=-0.004436877835541963\n",
      "   +1.4076 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "   +0.7877 if cp<=-0.10507812052965164 & cv>=0.25810013711452523 & pa>=0.16520115435123445\n",
      "   +1.0000 if pa>=0.2049277275800705\n",
      "--------------\n",
      "   -0.0000 if cp>=0.05242711752653129 & cv>=1.4928545951843262\n",
      "   -2.3235 if cp<=0.00013828594237566636 & cv>=0.7564861893653869\n",
      "  -20.6686 if cp<=-0.03311111629009247\n",
      "  -10.5029 if cp<=-0.10507812052965164 & cv>=0.25810013711452523\n",
      "   +1.0000 if pa>=0.2049277275800705\n",
      "Run episode 733 with rewards 10.0\n",
      "============ 734 ===========\n",
      "13 actions [0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0]\n",
      "   +0.0000 if cp<=0.007558041810989382\n",
      "   -0.0000 if cp>=-0.004436877835541963\n",
      "   +0.0000 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "   -0.0000 if pa>=0.2049277275800705\n",
      "   +0.0000 if cp<=-0.08377774059772491\n",
      "--------------\n",
      "   -0.0000 if cp<=0.00013828594237566636 & cv>=0.7564861893653869\n",
      "   +0.0000 if cp<=-0.03311111629009247\n",
      "   -0.0000 if cp<=-0.10507812052965164 & cv>=0.25810013711452523\n",
      "   -0.0000 if pa>=0.2049277275800705\n",
      "   +0.0000 if cp<=-0.08377774059772491\n",
      "Run episode 734 with rewards 13.0\n",
      "============ 735 ===========\n",
      "16 actions [0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.8540 if cp<=0.007558041810989382\n",
      "   -0.0000 if cp>=-0.004436877835541963\n",
      "   -0.0000 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "  -22.7036 if cp<=-0.08377774059772491\n",
      "   +1.0000 if pa>=0.2072102427482605\n",
      "--------------\n",
      "   -0.0000 if cp<=0.00013828594237566636 & cv>=0.7564861893653869\n",
      "   -0.3318 if cp<=-0.03311111629009247\n",
      "   -0.0000 if cp<=-0.10507812052965164 & cv>=0.25810013711452523\n",
      "  +14.7897 if pa>=0.2049277275800705\n",
      "   -1.4138 if cp>=-0.04077611863613129\n",
      "Run episode 735 with rewards 16.0\n",
      "============ 736 ===========\n",
      "15 actions [0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.1932 if cp<=0.007558041810989382\n",
      "   +1.5421 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "   +0.6815 if cp<=-0.08377774059772491\n",
      "   +0.0000 if pa>=0.2072102427482605\n",
      "   -5.1288 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "--------------\n",
      "   -1.4362 if cp<=-0.03311111629009247\n",
      "   +0.0000 if cp<=-0.10507812052965164 & cv>=0.25810013711452523\n",
      "   +0.0000 if pa>=0.2049277275800705\n",
      "   +3.4643 if cp>=-0.04077611863613129\n",
      "   -5.1374 if cp>=-0.03894275054335594 & pav<=0.3237149119377136\n",
      "Run episode 736 with rewards 15.0\n",
      "============ 737 ===========\n",
      "69 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -2.5694 if cp<=0.007558041810989382\n",
      "   +7.0559 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "  -18.6819 if cp<=-0.08377774059772491\n",
      "   -9.3437 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   +1.0000 if pa>=0.17767150700092316\n",
      "--------------\n",
      "   -1.6534 if cp<=-0.03311111629009247\n",
      "   +0.0000 if pa>=0.2049277275800705\n",
      "   +0.5293 if cp>=-0.04077611863613129\n",
      "   -1.6250 if cp>=-0.03894275054335594 & pav<=0.3237149119377136\n",
      "   +2.6723 if cv<=-0.16110713183879832 & pa<=-0.0028371288906782863\n",
      "Run episode 737 with rewards 69.0\n",
      "============ 738 ===========\n",
      "31 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -2.1398 if cp<=0.007558041810989382\n",
      "   +5.8996 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "   -0.0000 if cp<=-0.08377774059772491\n",
      "   -9.2609 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   -4.1025 if cp<=-0.03089664280414581 & cv>=0.14785062074661257 & pa<=0.09443505704402927\n",
      "--------------\n",
      "   -2.8464 if cp<=-0.03311111629009247\n",
      "   -4.9237 if cp>=-0.04077611863613129\n",
      "   +0.2284 if cp>=-0.03894275054335594 & pav<=0.3237149119377136\n",
      "   +3.0723 if cv<=-0.16110713183879832 & pa<=-0.0028371288906782863\n",
      "   +4.6408 if \n",
      "Run episode 738 with rewards 31.0\n",
      "============ 739 ===========\n",
      "59 actions [0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0]\n",
      "   +1.5149 if cp<=0.007558041810989382\n",
      "   +2.0993 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "   -4.9058 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   -4.9815 if cp<=-0.03089664280414581 & cv>=0.14785062074661257 & pa<=0.09443505704402927\n",
      "   -2.4256 if pa>=-0.0002260424807900563\n",
      "--------------\n",
      "   -4.4641 if cp<=-0.03311111629009247\n",
      "   -4.7029 if cp>=-0.04077611863613129\n",
      "   +0.5701 if cv<=-0.16110713183879832 & pa<=-0.0028371288906782863\n",
      "   +4.5110 if \n",
      "   -1.0060 if cp>=-0.031050803139805794\n",
      "Run episode 739 with rewards 59.0\n",
      "============ 740 ===========\n",
      "42 actions [0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1]\n",
      "   +1.4485 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "   -6.5572 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   -0.0001 if cp<=-0.03089664280414581 & cv>=0.14785062074661257 & pa<=0.09443505704402927\n",
      "   -1.3559 if pa>=-0.0002260424807900563\n",
      "   +2.5423 if cv<=0.22765169143676803 & pa<=0.10268924236297608 & pav<=0.5660633563995363\n",
      "--------------\n",
      "   -0.3377 if cp<=-0.03311111629009247\n",
      "   -2.5150 if cp>=-0.04077611863613129\n",
      "   +1.5476 if \n",
      "   +1.8851 if cp>=-0.031050803139805794\n",
      "   -2.0219 if pav<=0.5660633563995363\n",
      "Run episode 740 with rewards 42.0\n",
      "============ 741 ===========\n",
      "35 actions [0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1]\n",
      "   -1.1990 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "   -7.9735 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   -0.4575 if pa>=-0.0002260424807900563\n",
      "   +4.5477 if cv<=0.22765169143676803 & pa<=0.10268924236297608 & pav<=0.5660633563995363\n",
      "   +2.5485 if pav<=0.3263791859149933 & pav>=0.26626923084259035\n",
      "--------------\n",
      "   +1.2685 if cp>=-0.04077611863613129\n",
      "   +0.7956 if \n",
      "   +2.2732 if cp>=-0.031050803139805794\n",
      "   -5.7787 if pav<=0.5660633563995363\n",
      "   +2.5200 if cp>=0.009112686850130558\n",
      "Run episode 741 with rewards 35.0\n",
      "============ 742 ===========\n",
      "106 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1]\n",
      "   -1.7131 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "   -7.6062 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   +6.2254 if cv<=0.22765169143676803 & pa<=0.10268924236297608 & pav<=0.5660633563995363\n",
      "   -0.0047 if pav<=0.3263791859149933 & pav>=0.26626923084259035\n",
      "   -5.8463 if cp<=0.03317312300205231 & cv<=0.20159789919853213 & cv>=0.012772643938660623 & pa<=0.0634071871638298\n",
      "--------------\n",
      "   +0.3856 if cp>=-0.04077611863613129\n",
      "   +0.3857 if cp>=-0.031050803139805794\n",
      "   +0.3847 if pav<=0.5660633563995363\n",
      "   +0.3858 if cp>=0.009112686850130558\n",
      "  -16.6569 if cv>=0.012772643938660623 & pa<=0.04000654146075249\n",
      "Run episode 742 with rewards 106.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 743 ===========\n",
      "247 actions [0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -3.0523 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "  -10.3052 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   +9.2739 if cv<=0.22765169143676803 & pa<=0.10268924236297608 & pav<=0.5660633563995363\n",
      "   +0.0000 if cp<=0.03317312300205231 & cv<=0.20159789919853213 & cv>=0.012772643938660623 & pa<=0.0634071871638298\n",
      "   -4.6522 if cp<=0.014588776044547558 & cv<=0.15069590508937838 & cv>=-0.006235650274902582 & pav>=0.10310453921556473\n",
      "--------------\n",
      "   +1.8201 if cp>=-0.04077611863613129\n",
      "   +1.8202 if cp>=-0.031050803139805794\n",
      "   -1.6332 if cp>=0.009112686850130558\n",
      "   -5.8399 if cv>=0.012772643938660623 & pa<=0.04000654146075249\n",
      "   -1.5033 if pa<=0.06037392467260361\n",
      "Run episode 743 with rewards 247.0\n",
      "============ 744 ===========\n",
      "27 actions [0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -2.7675 if cp<=0.05242711752653129 & cp>=-0.034441054984927166 & cv<=1.4928545951843262\n",
      "   -7.8095 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "  +10.1414 if cv<=0.22765169143676803 & pa<=0.10268924236297608 & pav<=0.5660633563995363\n",
      "   -5.7854 if cp<=0.014588776044547558 & cv<=0.15069590508937838 & cv>=-0.006235650274902582 & pav>=0.10310453921556473\n",
      "   -3.8458 if cp<=0.5493624687194826 & cp<=0.9980917453765875 & cp>=0.19966367781162261 & pav<=0.3622794270515442\n",
      "--------------\n",
      "   +1.8220 if cp>=-0.04077611863613129\n",
      "   +1.8221 if cp>=-0.031050803139805794\n",
      "   -1.5794 if cp>=0.009112686850130558\n",
      "   -3.5493 if cv>=0.012772643938660623 & pa<=0.04000654146075249\n",
      "   -2.0591 if pa<=-0.002861756691709157\n",
      "Run episode 744 with rewards 27.0\n",
      "============ 745 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.4929 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   +3.8339 if cv<=0.22765169143676803 & pa<=0.10268924236297608 & pav<=0.5660633563995363\n",
      "   -0.0000 if cp<=0.014588776044547558 & cv<=0.15069590508937838 & cv>=-0.006235650274902582 & pav>=0.10310453921556473\n",
      "   -0.0000 if cp<=0.5493624687194826 & cp<=0.9980917453765875 & cp>=0.19966367781162261 & pav<=0.3622794270515442\n",
      "   -2.8174 if cp>=-0.009661125019192696\n",
      "--------------\n",
      "   +1.1077 if cp>=-0.04077611863613129\n",
      "   +1.7005 if cp>=-0.031050803139805794\n",
      "   -0.6059 if cv>=0.012772643938660623 & pa<=0.04000654146075249\n",
      "   -3.0811 if pa<=-0.002861756691709157\n",
      "   +2.8769 if cp>=-0.009661125019192696\n",
      "Run episode 745 with rewards 10.0\n",
      "============ 746 ===========\n",
      "59 actions [1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0]\n",
      "   -5.6771 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "  -11.2007 if cv<=0.22765169143676803 & pa<=0.10268924236297608 & pav<=0.5660633563995363\n",
      "   +0.0000 if cp<=0.014588776044547558 & cv<=0.15069590508937838 & cv>=-0.006235650274902582 & pav>=0.10310453921556473\n",
      "  +16.2144 if cp>=-0.009661125019192696\n",
      "   +1.5905 if cp>=0.04797224923968316\n",
      "--------------\n",
      "   +1.1416 if cp>=-0.04077611863613129\n",
      "   +1.1416 if cp>=-0.031050803139805794\n",
      "   -0.2450 if pa<=-0.002861756691709157\n",
      "   +1.1416 if cp>=-0.009661125019192696\n",
      "   -0.2450 if cp>=0.02136669456958771\n",
      "Run episode 746 with rewards 59.0\n",
      "============ 747 ===========\n",
      "24 actions [1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   -7.8957 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   -1.2048 if cv<=0.22765169143676803 & pa<=0.10268924236297608 & pav<=0.5660633563995363\n",
      "   +6.6464 if cp>=-0.009661125019192696\n",
      "   +1.2021 if cp>=0.04797224923968316\n",
      "   -4.9163 if pa>=0.006735433824360371\n",
      "--------------\n",
      "   +1.4901 if cp>=-0.04077611863613129\n",
      "   +1.4901 if cp>=-0.031050803139805794\n",
      "   -0.2430 if cp>=-0.009661125019192696\n",
      "   -0.2873 if cp>=0.02136669456958771\n",
      "   +5.7247 if cp<=0.005630539916455748 & pa>=-0.010592951439321034\n",
      "Run episode 747 with rewards 24.0\n",
      "============ 748 ===========\n",
      "69 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -7.7975 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   +2.6568 if cv<=0.22765169143676803 & pa<=0.10268924236297608 & pav<=0.5660633563995363\n",
      "  +10.3107 if cp>=-0.009661125019192696\n",
      "   -0.0000 if pa>=0.006735433824360371\n",
      "   -4.7466 if pa>=-0.14691468179225922\n",
      "--------------\n",
      "   +1.4291 if cp>=-0.04077611863613129\n",
      "   +1.4291 if cp>=-0.031050803139805794\n",
      "   -0.0000 if cp>=0.02136669456958771\n",
      "   -0.0000 if cp<=0.005630539916455748 & pa>=-0.010592951439321034\n",
      "   -2.6146 if cv<=0.23176607489585876 & pa<=-0.09208391308784482\n",
      "Run episode 748 with rewards 69.0\n",
      "============ 749 ===========\n",
      "12 actions [1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   -7.6699 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   +3.2504 if cv<=0.22765169143676803 & pa<=0.10268924236297608 & pav<=0.5660633563995363\n",
      "   +8.9354 if cp>=-0.009661125019192696\n",
      "   -5.0795 if pa>=-0.14691468179225922\n",
      "   -7.1584 if pa>=-0.026311570778489113\n",
      "--------------\n",
      "   +2.1688 if cp>=-0.04077611863613129\n",
      "   +2.1532 if cp>=-0.031050803139805794\n",
      "   +0.0000 if cp<=0.005630539916455748 & pa>=-0.010592951439321034\n",
      "   -3.4434 if cv<=0.23176607489585876 & pa<=-0.09208391308784482\n",
      "   +6.8549 if pa>=-0.026311570778489113\n",
      "Run episode 749 with rewards 12.0\n",
      "============ 750 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -10.7509 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "  -31.2953 if cp>=-0.009661125019192696\n",
      "   -9.5018 if pa>=-0.14691468179225922\n",
      "  -20.8379 if pa>=-0.026311570778489113\n",
      "   +1.0000 if cp>=0.044376367330551184\n",
      "--------------\n",
      "  +14.8131 if cp>=-0.04077611863613129\n",
      "  +14.8199 if cp>=-0.031050803139805794\n",
      "   -1.4876 if cv<=0.23176607489585876 & pa<=-0.09208391308784482\n",
      "   -2.9614 if pa>=-0.026311570778489113\n",
      "   +1.0000 if cv>=0.9076663732528689\n",
      "Run episode 750 with rewards 10.0\n",
      "============ 751 ===========\n",
      "28 actions [0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +5.8673 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "  +51.8876 if cp>=-0.009661125019192696\n",
      "   +8.4744 if pa>=-0.14691468179225922\n",
      "   -9.2437 if pa>=-0.026311570778489113\n",
      "   +1.0000 if cp>=-0.0442769967019558\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.04077611863613129\n",
      "   -0.0000 if cp>=-0.031050803139805794\n",
      "   -0.0000 if cv<=0.23176607489585876 & pa<=-0.09208391308784482\n",
      "   +0.0000 if pa>=-0.026311570778489113\n",
      "   +0.0000 if cp>=0.09947250783443451\n",
      "Run episode 751 with rewards 28.0\n",
      "============ 752 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   +5.8281 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   +4.5216 if cp>=-0.009661125019192696\n",
      "   -1.0777 if pa>=-0.14691468179225922\n",
      "   -1.0777 if pa>=-0.026311570778489113\n",
      "   +4.4371 if cp<=-0.08506006896495819 & cv>=-0.23230903148651122 & pa<=0.13605860173702242 & pav<=0.5406783699989323\n",
      "--------------\n",
      "   -1.7399 if cp>=-0.04077611863613129\n",
      "   -1.6522 if cp>=-0.031050803139805794\n",
      "   +0.0000 if cv<=0.23176607489585876 & pa<=-0.09208391308784482\n",
      "   +1.3544 if pa>=-0.026311570778489113\n",
      "   -2.8127 if cv>=1.1157054901123047\n",
      "Run episode 752 with rewards 10.0\n",
      "============ 753 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -2.2910 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   -1.7769 if cp>=-0.009661125019192696\n",
      "  +23.9390 if pa>=-0.14691468179225922\n",
      "   -1.7438 if cp<=-0.08506006896495819 & cv>=-0.23230903148651122 & pa<=0.13605860173702242 & pav<=0.5406783699989323\n",
      "   +1.0000 if cp>=-0.06964339315891266 & cv>=-1.2106812477111817\n",
      "--------------\n",
      "   +4.7745 if cp>=-0.04077611863613129\n",
      "   -3.4462 if cp>=-0.031050803139805794\n",
      "   +4.6987 if pa>=-0.026311570778489113\n",
      "   -0.0032 if cv>=1.1157054901123047\n",
      "   +2.2939 if cp<=0.0018499439582228706 & cp>=-0.027639055252075193\n",
      "Run episode 753 with rewards 9.0\n",
      "============ 754 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +1.9550 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   -0.6794 if cp>=-0.009661125019192696\n",
      "  -11.1611 if pa>=-0.14691468179225922\n",
      "   -0.6667 if cp<=-0.08506006896495819 & cv>=-0.23230903148651122 & pa<=0.13605860173702242 & pav<=0.5406783699989323\n",
      "   -1.0858 if cp<=-0.05658329278230667\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.04077611863613129\n",
      "   -0.0000 if cp>=-0.031050803139805794\n",
      "   -0.0000 if pa>=-0.026311570778489113\n",
      "   -0.0000 if cp<=0.0018499439582228706 & cp>=-0.027639055252075193\n",
      "   +0.0000 if cv>=0.01986089162528515\n",
      "Run episode 754 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 755 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.0106 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "  +19.4595 if cp>=-0.009661125019192696\n",
      "   +2.0308 if pa>=-0.14691468179225922\n",
      "   +0.0059 if cp<=-0.05658329278230667\n",
      "   +1.0000 if cp>=0.010544661059975625\n",
      "--------------\n",
      "  -18.9365 if cp>=-0.04077611863613129\n",
      "  -18.9365 if cp>=-0.031050803139805794\n",
      "  +13.3980 if pa>=-0.026311570778489113\n",
      "  +13.0439 if cp<=0.0018499439582228706 & cp>=-0.027639055252075193\n",
      "   +1.0000 if cp<=0.07927177250385285 & cp>=0.010544661059975625\n",
      "Run episode 755 with rewards 8.0\n",
      "============ 756 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0002 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   -0.0001 if cp>=-0.009661125019192696\n",
      "   -0.0615 if pa>=-0.14691468179225922\n",
      "   +0.0000 if cp>=0.010544661059975625\n",
      "   +0.0000 if pa>=0.1716444194316864\n",
      "--------------\n",
      "   +9.7379 if cp>=-0.04077611863613129\n",
      "   +1.2286 if cp>=-0.031050803139805794\n",
      "   +7.3885 if pa>=-0.026311570778489113\n",
      "  +13.6865 if cp<=0.0018499439582228706 & cp>=-0.027639055252075193\n",
      "   +1.0000 if cp<=-0.005686639575287695 & cp>=-0.031243145465850827\n",
      "Run episode 756 with rewards 10.0\n",
      "============ 757 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +0.0000 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   +0.0014 if cp>=-0.009661125019192696\n",
      "   +0.0009 if pa>=-0.14691468179225922\n",
      "   +0.0000 if pa>=0.1716444194316864\n",
      "   +0.0013 if cp>=0.024889921769499786\n",
      "--------------\n",
      "  -17.7781 if cp>=-0.04077611863613129\n",
      "  -15.8916 if cp>=-0.031050803139805794\n",
      "  +16.2311 if pa>=-0.026311570778489113\n",
      "  +14.8348 if cp<=0.0018499439582228706 & cp>=-0.027639055252075193\n",
      "   +1.0000 if cp>=0.06504021733999253\n",
      "Run episode 757 with rewards 10.0\n",
      "============ 758 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -8.3052 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   -1.7299 if cp>=-0.009661125019192696\n",
      "   -8.3067 if pa>=-0.14691468179225922\n",
      "   +0.1389 if cp>=0.024889921769499786\n",
      "   -0.2577 if cp<=0.0022228164598345774 & cp>=-0.03731728494167328\n",
      "--------------\n",
      "   +1.0003 if cp>=-0.04077611863613129\n",
      "   -7.0602 if cp>=-0.031050803139805794\n",
      "  +15.2082 if pa>=-0.026311570778489113\n",
      "  +10.9164 if cp<=0.0018499439582228706 & cp>=-0.027639055252075193\n",
      "   +1.0000 if cp<=0.029271246120333674\n",
      "Run episode 758 with rewards 9.0\n",
      "============ 759 ===========\n",
      "24 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0]\n",
      "   +7.1408 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   +7.5548 if cp>=-0.009661125019192696\n",
      "  +12.5051 if pa>=-0.14691468179225922\n",
      "   +1.7241 if cp<=0.0022228164598345774 & cp>=-0.03731728494167328\n",
      "   +1.0000 if cp<=-0.02696772888302803\n",
      "--------------\n",
      "   +6.5236 if cp>=-0.04077611863613129\n",
      "  +11.2151 if cp>=-0.031050803139805794\n",
      "  +11.7733 if pa>=-0.026311570778489113\n",
      "   +8.4508 if cp<=0.0018499439582228706 & cp>=-0.027639055252075193\n",
      "   +1.0000 if cp>=0.0716276690363884\n",
      "Run episode 759 with rewards 24.0\n",
      "============ 760 ===========\n",
      "21 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   +6.2185 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "  +13.7454 if cp>=-0.009661125019192696\n",
      "   +7.2479 if pa>=-0.14691468179225922\n",
      "   +6.1926 if cp<=0.0022228164598345774 & cp>=-0.03731728494167328\n",
      "  -10.5379 if cp<=-0.10151265263557434 & cv<=-0.7574181914329529\n",
      "--------------\n",
      "   +2.8858 if cp>=-0.04077611863613129\n",
      "   +4.8829 if cp>=-0.031050803139805794\n",
      "  +16.6454 if pa>=-0.026311570778489113\n",
      "   +4.6288 if cp<=0.0018499439582228706 & cp>=-0.027639055252075193\n",
      "  +11.5367 if cp<=-0.10151265263557434 & cv<=-0.7574181914329529\n",
      "Run episode 760 with rewards 21.0\n",
      "============ 761 ===========\n",
      "10 actions [1, 1, 1, 1, 0, 1, 0, 1, 1, 1]\n",
      "   -0.9148 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   +5.5349 if cp>=-0.009661125019192696\n",
      "   +5.5346 if pa>=-0.14691468179225922\n",
      "   +0.0006 if cp<=-0.10151265263557434 & cv<=-0.7574181914329529\n",
      "   -2.4427 if cp>=0.0007285057799890637 & cv<=-1.303498387336731\n",
      "--------------\n",
      "  +14.0729 if cp>=-0.031050803139805794\n",
      "   +9.4572 if pa>=-0.026311570778489113\n",
      "   -0.0013 if cp<=0.0018499439582228706 & cp>=-0.027639055252075193\n",
      "   -0.0005 if cp<=-0.10151265263557434 & cv<=-0.7574181914329529\n",
      "  -27.5079 if cv<=-1.303498387336731\n",
      "Run episode 761 with rewards 10.0\n",
      "============ 762 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +1.4691 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   -1.1300 if cp>=-0.009661125019192696\n",
      "   -1.1267 if pa>=-0.14691468179225922\n",
      "   +0.9428 if cp>=0.0007285057799890637 & cv<=-1.303498387336731\n",
      "   +0.9702 if cp<=0.07089610397815704\n",
      "--------------\n",
      "  +12.8468 if cp>=-0.031050803139805794\n",
      "   +0.0000 if pa>=-0.026311570778489113\n",
      "   +0.0000 if cp<=0.0018499439582228706 & cp>=-0.027639055252075193\n",
      "   +0.0000 if cv<=-1.303498387336731\n",
      "   +7.4437 if cp<=0.09426277279853822 & cp>=0.07089610397815704 & cv>=0.6190513968467714\n",
      "Run episode 762 with rewards 10.0\n",
      "============ 763 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=-0.03894275054335594 & cv<=-0.03009612113237381\n",
      "   +0.0001 if cp>=-0.009661125019192696\n",
      "   +0.0000 if pa>=-0.14691468179225922\n",
      "   -0.0001 if cp<=0.07089610397815704\n",
      "   +0.0002 if cp>=0.09636596888303757\n",
      "--------------\n",
      "  -17.1966 if cp>=-0.031050803139805794\n",
      "  +13.9079 if pa>=-0.026311570778489113\n",
      "   -0.0000 if cv<=-1.303498387336731\n",
      "   -8.4340 if cp<=0.09426277279853822 & cp>=0.07089610397815704 & cv>=0.6190513968467714\n",
      "   -0.4562 if cp>=0.138588947057724\n",
      "Run episode 763 with rewards 12.0\n",
      "============ 764 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.3072 if cp>=-0.009661125019192696\n",
      "   +0.2722 if pa>=-0.14691468179225922\n",
      "   +0.2722 if cp<=0.07089610397815704\n",
      "   -0.0000 if cp>=0.09636596888303757\n",
      "   +0.2562 if cp<=0.03936351761221886 & cp>=0.014722466096282028\n",
      "--------------\n",
      "  -14.8321 if cp>=-0.031050803139805794\n",
      "  -16.3594 if pa>=-0.026311570778489113\n",
      "   +2.0900 if cp<=0.09426277279853822 & cp>=0.07089610397815704 & cv>=0.6190513968467714\n",
      "   +0.1131 if cp>=0.138588947057724\n",
      "   -0.4360 if cp<=-0.028630018234252923\n",
      "Run episode 764 with rewards 10.0\n",
      "============ 765 ===========\n",
      "43 actions [0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=-0.009661125019192696\n",
      "   -0.0000 if pa>=-0.14691468179225922\n",
      "   -0.0000 if cp<=0.07089610397815704\n",
      "   -0.0000 if cp<=0.03936351761221886 & cp>=0.014722466096282028\n",
      "   +0.0000 if cp>=-0.1010687991976738\n",
      "--------------\n",
      "  -15.3914 if cp>=-0.031050803139805794\n",
      "  +15.7347 if pa>=-0.026311570778489113\n",
      "   +1.1124 if cp<=0.09426277279853822 & cp>=0.07089610397815704 & cv>=0.6190513968467714\n",
      "  +30.5452 if cp<=-0.028630018234252923\n",
      "   +1.0000 if cp<=-0.012404267117381094\n",
      "Run episode 765 with rewards 43.0\n",
      "============ 766 ===========\n",
      "39 actions [0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   -0.3368 if cp>=-0.009661125019192696\n",
      "   +0.2694 if pa>=-0.14691468179225922\n",
      "   +0.2694 if cp<=0.07089610397815704\n",
      "   +0.2694 if cp>=-0.1010687991976738\n",
      "   +3.6395 if cp<=-0.015537058562040329 & pa<=0.008280977047979836\n",
      "--------------\n",
      "   -3.7617 if cp>=-0.031050803139805794\n",
      "   +7.1688 if pa>=-0.026311570778489113\n",
      "   -0.5577 if cp<=0.09426277279853822 & cp>=0.07089610397815704 & cv>=0.6190513968467714\n",
      "   +1.4523 if cp<=-0.028630018234252923\n",
      "   -4.1693 if cp<=0.07201786041259767 & cp>=-0.03741768449544906 & cv<=0.3473871231079104 & cv>=-0.34509175419807436\n",
      "Run episode 766 with rewards 39.0\n",
      "============ 767 ===========\n",
      "19 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0757 if cp>=-0.009661125019192696\n",
      "   +1.3102 if pa>=-0.14691468179225922\n",
      "   +1.2937 if cp>=-0.1010687991976738\n",
      "   +1.1035 if cp<=-0.015537058562040329 & pa<=0.008280977047979836\n",
      "   +1.7230 if cp>=-0.03802762404084205 & cv>=-0.13835332095622996 & pa>=-0.035922744870185846\n",
      "--------------\n",
      "  +14.9941 if cp>=-0.031050803139805794\n",
      "   +3.2039 if pa>=-0.026311570778489113\n",
      "   +5.2794 if cp<=-0.028630018234252923\n",
      "   +0.1487 if cp<=0.07201786041259767 & cp>=-0.03741768449544906 & cv<=0.3473871231079104 & cv>=-0.34509175419807436\n",
      "  -18.3934 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "Run episode 767 with rewards 19.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 768 ===========\n",
      "38 actions [1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +0.9286 if pa>=-0.14691468179225922\n",
      "   +0.9287 if cp>=-0.1010687991976738\n",
      "   +1.3678 if cp<=-0.015537058562040329 & pa<=0.008280977047979836\n",
      "   +0.3915 if cp>=-0.03802762404084205 & cv>=-0.13835332095622996 & pa>=-0.035922744870185846\n",
      "   +1.0393 if cv>=-0.4207946419715881\n",
      "--------------\n",
      "  -18.2698 if cp>=-0.031050803139805794\n",
      "   -2.1392 if pa>=-0.026311570778489113\n",
      "  +13.4497 if cp<=-0.028630018234252923\n",
      "  -10.9383 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "   +1.0000 if cp>=0.08325021713972092\n",
      "Run episode 768 with rewards 38.0\n",
      "============ 769 ===========\n",
      "46 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   +0.8935 if pa>=-0.14691468179225922\n",
      "   +0.8923 if cp>=-0.1010687991976738\n",
      "   +0.9825 if cp<=-0.015537058562040329 & pa<=0.008280977047979836\n",
      "   +0.9009 if cv>=-0.4207946419715881\n",
      "   +1.0693 if cp<=-0.020154571533203124 & cv>=0.42597771286964414 & pa<=0.007759261876344699\n",
      "--------------\n",
      "   -3.1527 if cp>=-0.031050803139805794\n",
      "   +3.0003 if pa>=-0.026311570778489113\n",
      "   +4.2019 if cp<=-0.028630018234252923\n",
      "   -5.6132 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "   +1.1530 if cv<=0.42597771286964414 & pa<=0.007759261876344699\n",
      "Run episode 769 with rewards 46.0\n",
      "============ 770 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +0.2523 if pa>=-0.14691468179225922\n",
      "   +3.9353 if cp<=-0.015537058562040329 & pa<=0.008280977047979836\n",
      "   +1.7769 if cv>=-0.4207946419715881\n",
      "   -6.5241 if cp<=-0.020154571533203124 & cv>=0.42597771286964414 & pa<=0.007759261876344699\n",
      "   -8.3502 if cv>=1.7829713821411133\n",
      "--------------\n",
      "   -0.1955 if cp>=-0.031050803139805794\n",
      "   -0.3756 if pa>=-0.026311570778489113\n",
      "   +8.8241 if cp<=-0.028630018234252923\n",
      "   -9.0174 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "  +17.6572 if cp>=0.020645424723625183 & cv>=1.0051301717758179\n",
      "Run episode 770 with rewards 10.0\n",
      "============ 771 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cp<=-0.015537058562040329 & pa<=0.008280977047979836\n",
      "   +0.0068 if cv>=-0.4207946419715881\n",
      "   -0.0000 if cp<=-0.020154571533203124 & cv>=0.42597771286964414 & pa<=0.007759261876344699\n",
      "   -0.0000 if cv>=1.7829713821411133\n",
      "   +0.0062 if cp<=-0.04822569862008094\n",
      "--------------\n",
      "  -20.9992 if pa>=-0.026311570778489113\n",
      "   -6.3043 if cp<=-0.028630018234252923\n",
      "  -12.3709 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "   +2.3495 if cp>=0.020645424723625183 & cv>=1.0051301717758179\n",
      "   +1.0000 if cv>=-0.5903610467910767\n",
      "Run episode 771 with rewards 9.0\n",
      "============ 772 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 0, 1, 0, 1, 1]\n",
      "   +0.0000 if cv>=-0.4207946419715881\n",
      "   -0.0000 if cp<=-0.020154571533203124 & cv>=0.42597771286964414 & pa<=0.007759261876344699\n",
      "   -0.0000 if cv>=1.7829713821411133\n",
      "   -0.0000 if cp<=-0.04822569862008094\n",
      "   +0.0000 if cp<=-0.08926325589418412\n",
      "--------------\n",
      "  +21.0686 if pa>=-0.026311570778489113\n",
      "   +9.8403 if cp<=-0.028630018234252923\n",
      "   +8.8403 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "   +2.1852 if cp>=0.020645424723625183 & cv>=1.0051301717758179\n",
      "   +1.0000 if cp<=-0.08926325589418412\n",
      "Run episode 772 with rewards 10.0\n",
      "============ 773 ===========\n",
      "26 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1]\n",
      "   +7.6085 if cv>=-0.4207946419715881\n",
      "   -0.0000 if cp<=-0.020154571533203124 & cv>=0.42597771286964414 & pa<=0.007759261876344699\n",
      "   -0.0000 if cv>=1.7829713821411133\n",
      "   -0.0000 if cp<=-0.04822569862008094\n",
      "  +17.5613 if cp>=0.10357026755809784\n",
      "--------------\n",
      "   -0.0000 if pa>=-0.026311570778489113\n",
      "   -0.0000 if cp<=-0.028630018234252923\n",
      "   +2.2179 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "   -0.0000 if cp>=0.020645424723625183 & cv>=1.0051301717758179\n",
      "  -20.0000 if cp>=0.13323834538459778\n",
      "Run episode 773 with rewards 26.0\n",
      "============ 774 ===========\n",
      "13 actions [0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +5.9679 if cv>=-0.4207946419715881\n",
      "   +0.0000 if cv>=1.7829713821411133\n",
      "   -0.8989 if cp<=-0.04822569862008094\n",
      "   +0.0000 if cp>=0.10357026755809784\n",
      "   -2.6642 if cv<=-0.43566459417343106 & pav<=0.4759480357170105\n",
      "--------------\n",
      "   +0.2173 if pa>=-0.026311570778489113\n",
      "   +0.3165 if cp<=-0.028630018234252923\n",
      "   +1.1888 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "   -0.0000 if cp>=0.13323834538459778\n",
      "   +3.2574 if cv<=-0.43566459417343106 & pa<=0.009781138971447945\n",
      "Run episode 774 with rewards 13.0\n",
      "============ 775 ===========\n",
      "10 actions [0, 0, 0, 1, 0, 0, 0, 0, 0, 0]\n",
      "   +1.6951 if cv>=-0.4207946419715881\n",
      "   +9.2944 if cp<=-0.04822569862008094\n",
      "   +0.0000 if cp>=0.10357026755809784\n",
      "   +0.0000 if cv<=-0.43566459417343106 & pav<=0.4759480357170105\n",
      "   +3.4790 if cv>=-0.5771737456321716\n",
      "--------------\n",
      "   -4.8968 if pa>=-0.026311570778489113\n",
      "   -1.0291 if cp<=-0.028630018234252923\n",
      "   +4.3383 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "   +0.0000 if cv<=-0.43566459417343106 & pa<=0.009781138971447945\n",
      "   +2.0443 if pav>=1.1848350763320923\n",
      "Run episode 775 with rewards 10.0\n",
      "============ 776 ===========\n",
      "27 actions [0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1]\n",
      "  +15.1525 if cv>=-0.4207946419715881\n",
      "  -25.9544 if cp<=-0.04822569862008094\n",
      "   -0.0000 if cv<=-0.43566459417343106 & pav<=0.4759480357170105\n",
      "  +11.6916 if cv>=-0.5771737456321716\n",
      "   +1.0000 if cp>=-0.03544632568955421\n",
      "--------------\n",
      "   +6.8051 if pa>=-0.026311570778489113\n",
      "  +12.7453 if cp<=-0.028630018234252923\n",
      "   -6.7056 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "  +12.6246 if pav>=1.1848350763320923\n",
      "   +1.0000 if cp>=-0.06299213767051696\n",
      "Run episode 776 with rewards 27.0\n",
      "============ 777 ===========\n",
      "14 actions [0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +9.0333 if cv>=-0.4207946419715881\n",
      "   -3.1368 if cp<=-0.04822569862008094\n",
      "   +9.0333 if cv>=-0.5771737456321716\n",
      "   -3.9233 if cp>=-0.03544632568955421\n",
      "   +2.3889 if cp>=-0.05360198095440864\n",
      "--------------\n",
      "   +3.3341 if pa>=-0.026311570778489113\n",
      "   +2.1829 if cp<=-0.028630018234252923\n",
      "   +1.1368 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "   +0.0465 if pav>=1.1848350763320923\n",
      "   +1.0902 if cv<=-0.5513045132160186 & pa<=0.03804200440645218\n",
      "Run episode 777 with rewards 14.0\n",
      "============ 778 ===========\n",
      "40 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.2964 if cv>=-0.4207946419715881\n",
      "   -9.2875 if cp<=-0.04822569862008094\n",
      "   -1.5918 if cv>=-0.5771737456321716\n",
      "   +4.5885 if cp>=-0.03544632568955421\n",
      "   +3.9600 if cv>=-0.5420906901359558\n",
      "--------------\n",
      "   +7.9300 if pa>=-0.026311570778489113\n",
      "  +11.2440 if cp<=-0.028630018234252923\n",
      "   -3.2493 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "   -0.6604 if cv<=-0.5513045132160186 & pa<=0.03804200440645218\n",
      "   +2.5003 if pa>=0.19004392623901367\n",
      "Run episode 778 with rewards 40.0\n",
      "============ 779 ===========\n",
      "40 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1]\n",
      "   -0.0062 if cp<=-0.04822569862008094\n",
      "   +7.4419 if cv>=-0.5771737456321716\n",
      "  -10.1877 if cp>=-0.03544632568955421\n",
      "   +5.6125 if cv>=-0.5420906901359558\n",
      "  +15.9188 if cv>=-0.802869927883148 & pa<=0.0458693839609623 & pa>=-0.012248658540192947\n",
      "--------------\n",
      "   +8.0321 if pa>=-0.026311570778489113\n",
      "   +8.8724 if cp<=-0.028630018234252923\n",
      "  -10.2497 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "   +0.0000 if pa>=0.19004392623901367\n",
      "   +8.8777 if cp<=0.024577738344669347 & cv<=-0.802869927883148 & pa>=0.0458693839609623\n",
      "Run episode 779 with rewards 40.0\n",
      "============ 780 ===========\n",
      "52 actions [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1]\n",
      "   +4.3566 if cv>=-0.5771737456321716\n",
      "   -4.9261 if cp>=-0.03544632568955421\n",
      "   +4.3566 if cv>=-0.5420906901359558\n",
      "   +7.0998 if cv>=-0.802869927883148 & pa<=0.0458693839609623 & pa>=-0.012248658540192947\n",
      "   -1.1148 if cp<=-0.03258969932794571\n",
      "--------------\n",
      "   +8.2842 if pa>=-0.026311570778489113\n",
      "   +8.7952 if cp<=-0.028630018234252923\n",
      "  -11.1468 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "   +0.0000 if cp<=0.024577738344669347 & cv<=-0.802869927883148 & pa>=0.0458693839609623\n",
      "   +0.0875 if pa>=-0.05123867318034171\n",
      "Run episode 780 with rewards 52.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 781 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   -3.6076 if cv>=-0.5771737456321716\n",
      "  +11.9695 if cp>=-0.03544632568955421\n",
      "   -3.6077 if cv>=-0.5420906901359558\n",
      "   +3.0547 if cv>=-0.802869927883148 & pa<=0.0458693839609623 & pa>=-0.012248658540192947\n",
      "   -1.4571 if cp>=-0.02844759151339529\n",
      "--------------\n",
      "  +10.5584 if pa>=-0.026311570778489113\n",
      "  +14.1791 if cp<=-0.028630018234252923\n",
      "  -17.3971 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "   +1.6217 if pa>=-0.05123867318034171\n",
      "   +8.1424 if cv>=1.5721946954727173\n",
      "Run episode 781 with rewards 10.0\n",
      "============ 782 ===========\n",
      "25 actions [1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   +0.9972 if cv>=-0.5771737456321716\n",
      "   -4.7934 if cp>=-0.03544632568955421\n",
      "   +0.9972 if cv>=-0.5420906901359558\n",
      "   +1.1125 if cv>=-0.802869927883148 & pa<=0.0458693839609623 & pa>=-0.012248658540192947\n",
      "   +1.0000 if cp<=0.004717699380125854 & cp>=-0.021816829405725\n",
      "--------------\n",
      "   +4.9824 if pa>=-0.026311570778489113\n",
      "  -28.2227 if cp<=-0.028630018234252923\n",
      "   -4.3889 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "  -12.1441 if cv>=1.5721946954727173\n",
      "   +0.6877 if cv>=-1.1285931587219238\n",
      "Run episode 782 with rewards 25.0\n",
      "============ 783 ===========\n",
      "37 actions [1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.3065 if cp>=-0.03544632568955421\n",
      "   -0.3683 if cv>=-0.5420906901359558\n",
      "   -1.0420 if cv>=-0.802869927883148 & pa<=0.0458693839609623 & pa>=-0.012248658540192947\n",
      "   -1.0658 if cp<=0.004717699380125854 & cp>=-0.021816829405725\n",
      "   +2.8864 if cv>=-0.3572936177253723\n",
      "--------------\n",
      "   +6.7713 if pa>=-0.026311570778489113\n",
      "   +2.1132 if cp<=-0.028630018234252923\n",
      "   -5.1689 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "  +25.4987 if cv>=1.5721946954727173\n",
      "   +4.7651 if cp>=0.05019206553697587 & cv<=-0.3572936177253723\n",
      "Run episode 783 with rewards 37.0\n",
      "============ 784 ===========\n",
      "21 actions [0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -5.3340 if cp>=-0.03544632568955421\n",
      "   -4.9534 if cv>=-0.802869927883148 & pa<=0.0458693839609623 & pa>=-0.012248658540192947\n",
      "   -7.1806 if cp<=0.004717699380125854 & cp>=-0.021816829405725\n",
      "  +11.2700 if cv>=-0.3572936177253723\n",
      "  -12.7269 if cp>=0.005873615201562645 & cv<=-0.1623561292886734 & pa<=-0.0491552084684372\n",
      "--------------\n",
      "   +6.1892 if pa>=-0.026311570778489113\n",
      "   -1.8517 if cp>=-0.03802762404084205 & cv<=0.7934888124465942\n",
      "  -20.3396 if cv>=1.5721946954727173\n",
      "   -3.3314 if cp>=0.05019206553697587 & cv<=-0.3572936177253723\n",
      "   -2.4069 if cp<=0.005873615201562645 & cp>=-0.04656471833586693 & pa<=-0.01534419935196638\n",
      "Run episode 784 with rewards 21.0\n",
      "============ 785 ===========\n",
      "52 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +1.6330 if cp>=-0.03544632568955421\n",
      "   -2.5485 if cp<=0.004717699380125854 & cp>=-0.021816829405725\n",
      "   +1.5877 if cv>=-0.3572936177253723\n",
      "   +8.9054 if cp>=0.005873615201562645 & cv<=-0.1623561292886734 & pa<=-0.0491552084684372\n",
      "   +1.9921 if cp>=0.05962105467915535\n",
      "--------------\n",
      "   +5.8572 if pa>=-0.026311570778489113\n",
      "   -0.0000 if cv>=1.5721946954727173\n",
      "   -0.0000 if cp>=0.05019206553697587 & cv<=-0.3572936177253723\n",
      "   -0.0000 if cp<=0.005873615201562645 & cp>=-0.04656471833586693 & pa<=-0.01534419935196638\n",
      "   -6.7203 if cp<=0.007934830151498318 & cp>=0.007934830151498318\n",
      "Run episode 785 with rewards 52.0\n",
      "============ 786 ===========\n",
      "49 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0]\n",
      "   -1.7498 if cp>=-0.03544632568955421\n",
      "   -0.7947 if cp<=0.004717699380125854 & cp>=-0.021816829405725\n",
      "   +1.2240 if cp>=0.005873615201562645 & cv<=-0.1623561292886734 & pa<=-0.0491552084684372\n",
      "   +1.7389 if cp>=0.05962105467915535\n",
      "   +5.4309 if cp>=-0.024932920560240737\n",
      "--------------\n",
      "   +9.6995 if pa>=-0.026311570778489113\n",
      "   -0.0000 if cv>=1.5721946954727173\n",
      "   -0.0007 if cp>=0.05019206553697587 & cv<=-0.3572936177253723\n",
      "   -0.0000 if cp<=0.007934830151498318 & cp>=0.007934830151498318\n",
      "   -3.2296 if pa>=-0.047730707377195356\n",
      "Run episode 786 with rewards 49.0\n",
      "============ 787 ===========\n",
      "29 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -2.1519 if cp>=-0.03544632568955421\n",
      "   +0.1261 if cp>=0.005873615201562645 & cv<=-0.1623561292886734 & pa<=-0.0491552084684372\n",
      "   +0.0620 if cp>=0.05962105467915535\n",
      "   -1.9157 if cp>=-0.024932920560240737\n",
      "  +14.2857 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "--------------\n",
      "   +8.6172 if pa>=-0.026311570778489113\n",
      "   -0.3555 if cp>=0.05019206553697587 & cv<=-0.3572936177253723\n",
      "   +0.0000 if cp<=0.007934830151498318 & cp>=0.007934830151498318\n",
      "   -1.5316 if pa>=-0.047730707377195356\n",
      "   +0.0776 if pa>=-0.03513774946331977\n",
      "Run episode 787 with rewards 29.0\n",
      "============ 788 ===========\n",
      "41 actions [1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1]\n",
      "   -0.0857 if cp>=-0.03544632568955421\n",
      "   +0.6497 if cp>=0.005873615201562645 & cv<=-0.1623561292886734 & pa<=-0.0491552084684372\n",
      "   -0.0504 if cp>=-0.024932920560240737\n",
      "   +1.9891 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   +2.6849 if cp>=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "--------------\n",
      "   +6.2574 if pa>=-0.026311570778489113\n",
      "   -0.0029 if cp>=0.05019206553697587 & cv<=-0.3572936177253723\n",
      "   -2.7878 if pa>=-0.047730707377195356\n",
      "   -2.7877 if pa>=-0.03513774946331977\n",
      "   +1.5452 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "Run episode 788 with rewards 41.0\n",
      "============ 789 ===========\n",
      "45 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   -1.7179 if cp>=-0.03544632568955421\n",
      "   +0.0000 if cp>=0.005873615201562645 & cv<=-0.1623561292886734 & pa<=-0.0491552084684372\n",
      "   +6.7243 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   +0.0000 if cp>=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   -1.9756 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "--------------\n",
      "   +3.0128 if pa>=-0.026311570778489113\n",
      "   -0.8069 if pa>=-0.047730707377195356\n",
      "   -0.4099 if pa>=-0.03513774946331977\n",
      "   -2.2574 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   +4.0706 if cp>=-0.011145844124257565 & cv>=-0.4120159447193146 & pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "Run episode 789 with rewards 45.0\n",
      "============ 790 ===========\n",
      "40 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   -2.1631 if cp>=-0.03544632568955421\n",
      "   +7.2824 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   +0.1100 if cp>=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   -1.4002 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   +1.1335 if cp>=-0.04571914300322533\n",
      "--------------\n",
      "   +6.6456 if pa>=-0.026311570778489113\n",
      "   -2.5755 if pa>=-0.047730707377195356\n",
      "   -3.3900 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   -0.1566 if cp>=-0.011145844124257565 & cv>=-0.4120159447193146 & pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   -3.9203 if cp>=-0.04571914300322533 & cv>=0.23535468280315508 & pa>=0.00709881912916903\n",
      "Run episode 790 with rewards 40.0\n",
      "============ 791 ===========\n",
      "56 actions [1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.5734 if cp>=-0.03544632568955421\n",
      "   +4.4124 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   -1.2048 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   +0.4879 if cp>=-0.04571914300322533\n",
      "   -1.9712 if cp<=0.08466603606939319 & cv>=-0.8088746309280396\n",
      "--------------\n",
      "   +0.3843 if pa>=-0.026311570778489113\n",
      "   +3.1497 if pa>=-0.047730707377195356\n",
      "  +20.5040 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   -2.9851 if cp>=-0.04571914300322533 & cv>=0.23535468280315508 & pa>=0.00709881912916903\n",
      "   +1.2509 if cp<=0.03951573371887208\n",
      "Run episode 791 with rewards 56.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 792 ===========\n",
      "39 actions [1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +3.3791 if cp>=-0.03544632568955421\n",
      "   +5.7175 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   -2.6432 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   -1.1668 if cp<=0.08466603606939319 & cv>=-0.8088746309280396\n",
      "   -3.1987 if cp>=0.05775800347328188 & pa>=-0.03302092105150222\n",
      "--------------\n",
      "   +1.7385 if pa>=-0.047730707377195356\n",
      "   +5.6778 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   -3.3602 if cp>=-0.04571914300322533 & cv>=0.23535468280315508 & pa>=0.00709881912916903\n",
      "   +1.7298 if cp<=0.03951573371887208\n",
      "   -5.6801 if cp<=0.05775800347328188 & cp>=-0.003936700988560915 & pav<=-0.5432045459747314 & pav>=-0.9675068855285645\n",
      "Run episode 792 with rewards 39.0\n",
      "============ 793 ===========\n",
      "41 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 0]\n",
      "   -2.6407 if cp>=-0.03544632568955421\n",
      "  +10.5515 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   -3.3521 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   -0.0000 if cp>=0.05775800347328188 & pa>=-0.03302092105150222\n",
      "  +11.4667 if cv>=1.1754945516586304\n",
      "--------------\n",
      "   +4.2264 if pa>=-0.047730707377195356\n",
      "   +6.4627 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   -0.0001 if cp>=-0.04571914300322533 & cv>=0.23535468280315508 & pa>=0.00709881912916903\n",
      "   -5.1511 if cp<=0.05775800347328188 & cp>=-0.003936700988560915 & pav<=-0.5432045459747314 & pav>=-0.9675068855285645\n",
      "   +4.4229 if cp<=0.020345282554626476 & cp>=-0.003952613612636924 & cv<=-0.6019219994544983\n",
      "Run episode 793 with rewards 41.0\n",
      "============ 794 ===========\n",
      "36 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1]\n",
      "   +2.3432 if cp>=-0.03544632568955421\n",
      "   +8.4371 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   -5.8417 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   -3.5090 if cv>=1.1754945516586304\n",
      "  -12.9465 if cv>=1.2003542184829712\n",
      "--------------\n",
      "   +7.2298 if pa>=-0.047730707377195356\n",
      "   -8.1481 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   +0.0000 if cp<=0.05775800347328188 & cp>=-0.003936700988560915 & pav<=-0.5432045459747314 & pav>=-0.9675068855285645\n",
      "   +0.0000 if cp<=0.020345282554626476 & cp>=-0.003952613612636924 & cv<=-0.6019219994544983\n",
      "  +13.2293 if pav>=1.9521206617355347\n",
      "Run episode 794 with rewards 36.0\n",
      "============ 795 ===========\n",
      "27 actions [0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +10.7439 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   +4.1164 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   +6.4094 if cv>=1.1754945516586304\n",
      "  +15.4343 if cv>=1.2003542184829712\n",
      "   +1.0000 if cp>=0.08252348005771637\n",
      "--------------\n",
      "   +4.0400 if pa>=-0.047730707377195356\n",
      "   -2.5922 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   -0.0027 if cp<=0.05775800347328188 & cp>=-0.003936700988560915 & pav<=-0.5432045459747314 & pav>=-0.9675068855285645\n",
      "   -0.0000 if pav>=1.9521206617355347\n",
      "  +10.9639 if cp<=0.04579650238156319 & cp>=-0.0016961710061877836 & cv>=0.9857339859008789 & pa<=-0.038856636732816696\n",
      "Run episode 795 with rewards 27.0\n",
      "============ 796 ===========\n",
      "17 actions [0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   -1.1847 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   +3.6924 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   +1.5720 if cv>=1.1754945516586304\n",
      "   -0.0000 if cv>=1.2003542184829712\n",
      "   -4.6974 if cv<=-0.3283865541219711 & pa<=-0.028812553733587265\n",
      "--------------\n",
      "   +6.8347 if pa>=-0.047730707377195356\n",
      "   -1.2464 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   +0.0002 if cp<=0.05775800347328188 & cp>=-0.003936700988560915 & pav<=-0.5432045459747314 & pav>=-0.9675068855285645\n",
      "   +4.2046 if cp<=0.04579650238156319 & cp>=-0.0016961710061877836 & cv>=0.9857339859008789 & pa<=-0.038856636732816696\n",
      "   -2.5205 if cp<=-0.023622351512312886 & pa>=-0.028812553733587265\n",
      "Run episode 796 with rewards 17.0\n",
      "============ 797 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +9.8207 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   +4.6679 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "  +10.1337 if cv>=1.1754945516586304\n",
      "   +3.7961 if cv<=-0.3283865541219711 & pa<=-0.028812553733587265\n",
      "   +1.0000 if cv>=1.7422420978546143\n",
      "--------------\n",
      "   -4.8403 if pa>=-0.047730707377195356\n",
      "   -9.1500 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "  -11.5975 if cp<=0.04579650238156319 & cp>=-0.0016961710061877836 & cv>=0.9857339859008789 & pa<=-0.038856636732816696\n",
      "   +5.7340 if cp<=-0.023622351512312886 & pa>=-0.028812553733587265\n",
      "   +3.1875 if pa>=0.010711681097745895\n",
      "Run episode 797 with rewards 9.0\n",
      "============ 798 ===========\n",
      "12 actions [1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   +0.0018 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "  -10.8373 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   +0.0019 if cv>=1.1754945516586304\n",
      "   +0.0007 if cv<=-0.3283865541219711 & pa<=-0.028812553733587265\n",
      "  +10.4150 if cp>=0.012942176871001729\n",
      "--------------\n",
      "   +6.5198 if pa>=-0.047730707377195356\n",
      "   +5.3101 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   +6.7304 if cp<=0.04579650238156319 & cp>=-0.0016961710061877836 & cv>=0.9857339859008789 & pa<=-0.038856636732816696\n",
      "  +15.6794 if cp<=-0.023622351512312886 & pa>=-0.028812553733587265\n",
      "   -1.9672 if cp>=0.012942176871001729\n",
      "Run episode 798 with rewards 12.0\n",
      "============ 799 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -5.7400 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   -7.0596 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   -5.7053 if cv>=1.1754945516586304\n",
      "  -12.5245 if cp>=0.012942176871001729\n",
      "   +1.0000 if cp>=-0.014102870970964427 & cv<=0.9282734870910647\n",
      "--------------\n",
      "   +0.5338 if pa>=-0.047730707377195356\n",
      "   -2.1716 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   -2.3002 if cp<=0.04579650238156319 & cp>=-0.0016961710061877836 & cv>=0.9857339859008789 & pa<=-0.038856636732816696\n",
      "   +2.2343 if cp<=-0.023622351512312886 & pa>=-0.028812553733587265\n",
      "   +1.0374 if cp<=-0.014102870970964427\n",
      "Run episode 799 with rewards 9.0\n",
      "============ 800 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +5.7400 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   +7.0596 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   +5.7053 if cv>=1.1754945516586304\n",
      "  +12.5245 if cp>=0.012942176871001729\n",
      "   +1.0000 if cp<=0.04491744786500932 & cp>=0.012841114774346352\n",
      "--------------\n",
      "   +0.0803 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   +0.0000 if cp<=0.04579650238156319 & cp>=-0.0016961710061877836 & cv>=0.9857339859008789 & pa<=-0.038856636732816696\n",
      "   +0.0000 if cp<=-0.023622351512312886 & pa>=-0.028812553733587265\n",
      "   +0.0000 if cp<=-0.014102870970964427\n",
      "   +0.0802 if pa>=-0.038898635655641556\n",
      "Run episode 800 with rewards 9.0\n",
      "============ 801 ===========\n",
      "34 actions [1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0]\n",
      "   -0.1669 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "  -15.3908 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   -0.1659 if cv>=1.1754945516586304\n",
      "  +15.1824 if cp>=0.012942176871001729\n",
      "   -0.1645 if cp<=-0.02825912870466709\n",
      "--------------\n",
      "   -0.0000 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   -0.0000 if cp<=0.04579650238156319 & cp>=-0.0016961710061877836 & cv>=0.9857339859008789 & pa<=-0.038856636732816696\n",
      "   +0.0416 if cp<=-0.023622351512312886 & pa>=-0.028812553733587265\n",
      "   +0.0610 if pa>=-0.038898635655641556\n",
      "   +0.0611 if cp<=0.004842420341446999\n",
      "Run episode 801 with rewards 34.0\n",
      "============ 802 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   -2.3383 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   -3.4191 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   -0.0000 if cv>=1.1754945516586304\n",
      "   +6.1796 if cp>=0.012942176871001729\n",
      "   +4.0575 if cp>=-0.02646387815475464 & cv>=0.15217526257038116 & pa>=-0.026889921352267254\n",
      "--------------\n",
      "   +2.8368 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   +5.2418 if cp<=-0.023622351512312886 & pa>=-0.028812553733587265\n",
      "   -1.6293 if pa>=-0.038898635655641556\n",
      "   -1.0967 if cp<=0.004842420341446999\n",
      "   -5.1646 if pa>=-0.026889921352267254 & pav<=-0.5405943036079407\n",
      "Run episode 802 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 803 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -11.5322 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   -4.6081 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "  -10.0738 if cp>=0.012942176871001729\n",
      "   -2.0917 if cp>=-0.02646387815475464 & cv>=0.15217526257038116 & pa>=-0.026889921352267254\n",
      "   +1.0000 if cp>=0.06514372676610947\n",
      "--------------\n",
      "  +15.1527 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   +0.0000 if cp<=-0.023622351512312886 & pa>=-0.028812553733587265\n",
      "   +0.0000 if pa>=-0.038898635655641556\n",
      "   +0.0000 if pa>=-0.026889921352267254 & pav<=-0.5405943036079407\n",
      "   +6.0000 if cv>=1.225123405456543\n",
      "Run episode 803 with rewards 10.0\n",
      "============ 804 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +11.7589 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   +4.5381 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "  +10.2596 if cp>=0.012942176871001729\n",
      "   +1.9991 if cp>=-0.02646387815475464 & cv>=0.15217526257038116 & pa>=-0.026889921352267254\n",
      "   +1.0000 if cp>=0.09659264534711838\n",
      "--------------\n",
      "   +0.0000 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   +0.0000 if cp<=-0.023622351512312886 & pa>=-0.028812553733587265\n",
      "   +0.0001 if pa>=-0.026889921352267254 & pav<=-0.5405943036079407\n",
      "   -0.0000 if cv>=1.225123405456543\n",
      "   +0.8135 if cp<=0.012834234535694123\n",
      "Run episode 804 with rewards 9.0\n",
      "============ 805 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -4.5532 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "  -15.0712 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   -3.9726 if cp>=0.012942176871001729\n",
      "   -0.7741 if cp>=-0.02646387815475464 & cv>=0.15217526257038116 & pa>=-0.026889921352267254\n",
      "   -6.5667 if cp<=-0.05522804409265518\n",
      "--------------\n",
      "   -0.0000 if cp<=0.027525609731674196 & pa<=-0.01805284358561036\n",
      "   -0.0002 if pa>=-0.026889921352267254 & pav<=-0.5405943036079407\n",
      "   -0.0000 if cv>=1.225123405456543\n",
      "  +15.4533 if cp<=0.012834234535694123\n",
      "  +15.6561 if cp<=-0.05522804409265518\n",
      "Run episode 805 with rewards 11.0\n",
      "============ 806 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +18.5186 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "  +10.8540 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "  +19.0323 if cp>=0.012942176871001729\n",
      "   +5.3890 if cp<=-0.05522804409265518\n",
      "   +1.0000 if cp>=0.16763320565223694\n",
      "--------------\n",
      "   +0.3496 if pa>=-0.026889921352267254 & pav<=-0.5405943036079407\n",
      "   -0.0166 if cv>=1.225123405456543\n",
      "   +2.0617 if cp<=0.012834234535694123\n",
      "   +0.0000 if cp<=-0.05522804409265518\n",
      "   +0.0000 if pav>=0.04957278072834015\n",
      "Run episode 806 with rewards 11.0\n",
      "============ 807 ===========\n",
      "44 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "  +13.3835 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   -9.3945 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   -5.4415 if cp>=0.012942176871001729\n",
      "  -29.9080 if cp<=-0.05522804409265518\n",
      "   +1.0000 if cp<=-0.15691490471363068\n",
      "--------------\n",
      "   -0.0000 if pa>=-0.026889921352267254 & pav<=-0.5405943036079407\n",
      "   -0.0000 if cv>=1.225123405456543\n",
      "   -0.0002 if cp<=0.012834234535694123\n",
      "   -0.0002 if pav>=0.04957278072834015\n",
      "   +0.0000 if cp<=-0.0674626901745796\n",
      "Run episode 807 with rewards 44.0\n",
      "============ 808 ===========\n",
      "294 actions [1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1]\n",
      "  +16.7433 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "  -11.7751 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   -6.0839 if cp>=0.012942176871001729\n",
      "  +12.9605 if cp<=-0.05522804409265518\n",
      "  -12.5788 if pa>=-0.023632127419114118\n",
      "--------------\n",
      "   +0.0000 if pa>=-0.026889921352267254 & pav<=-0.5405943036079407\n",
      "   -0.6766 if cp<=0.012834234535694123\n",
      "   -0.6397 if pav>=0.04957278072834015\n",
      "   +0.0000 if cp<=-0.0674626901745796\n",
      "   +3.3349 if cp>=0.04015385508537293 & cv<=-0.5491171956062317\n",
      "Run episode 808 with rewards 294.0\n",
      "origin 4509.642028923088 new 127232.02428886238 not updated\n",
      "============ 809 ===========\n",
      "160 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +16.7433 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "  -11.7751 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   -6.0839 if cp>=0.012942176871001729\n",
      "  +12.9605 if cp<=-0.05522804409265518\n",
      "  -12.5788 if pa>=-0.023632127419114118\n",
      "--------------\n",
      "   +0.5626 if pa>=-0.026889921352267254 & pav<=-0.5405943036079407\n",
      "   -0.9114 if cp<=0.012834234535694123\n",
      "   -0.3127 if pav>=0.04957278072834015\n",
      "   -0.0000 if cp>=0.04015385508537293 & cv<=-0.5491171956062317\n",
      "   +5.2959 if pa>=0.07285664230585098\n",
      "Run episode 809 with rewards 160.0\n",
      "============ 810 ===========\n",
      "128 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   +4.5856 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   -7.7076 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "  +10.2798 if cp<=-0.05522804409265518\n",
      "  -10.6310 if pa>=-0.023632127419114118\n",
      "   +3.8816 if cv>=1.320513129234314\n",
      "--------------\n",
      "   +0.7014 if pa>=-0.026889921352267254 & pav<=-0.5405943036079407\n",
      "   -0.3412 if cp<=0.012834234535694123\n",
      "   -0.2416 if pav>=0.04957278072834015\n",
      "   +6.4289 if pa>=0.07285664230585098\n",
      "   -3.8624 if cv>=1.320513129234314\n",
      "Run episode 810 with rewards 128.0\n",
      "============ 811 ===========\n",
      "86 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   +4.3314 if cp>=-0.07537788003683082 & pa<=-0.03513774946331977\n",
      "   -7.4457 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "  +10.2224 if cp<=-0.05522804409265518\n",
      "  -11.8447 if pa>=-0.023632127419114118\n",
      "   +5.2167 if cp>=-0.5646108388900756 & cv>=0.5881808161735534 & pa>=0.024630822241306357\n",
      "--------------\n",
      "   +0.9594 if pa>=-0.026889921352267254 & pav<=-0.5405943036079407\n",
      "   +0.4221 if cp<=0.012834234535694123\n",
      "   +6.4548 if pa>=0.07285664230585098\n",
      "   +0.0000 if cv>=1.320513129234314\n",
      "   -4.9898 if cp>=-0.5646108388900756 & cv>=0.5881808161735534 & pa>=0.024630822241306357\n",
      "Run episode 811 with rewards 86.0\n",
      "============ 812 ===========\n",
      "138 actions [0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0]\n",
      "   -5.2828 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   +3.1983 if cp<=-0.05522804409265518\n",
      "   -9.0791 if pa>=-0.023632127419114118\n",
      "   +0.0000 if cp>=-0.5646108388900756 & cv>=0.5881808161735534 & pa>=0.024630822241306357\n",
      "   +3.0139 if \n",
      "--------------\n",
      "   +1.5990 if pa>=-0.026889921352267254 & pav<=-0.5405943036079407\n",
      "   +2.2945 if cp<=0.012834234535694123\n",
      "   +0.6268 if pa>=0.07285664230585098\n",
      "   +0.0000 if cp>=-0.5646108388900756 & cv>=0.5881808161735534 & pa>=0.024630822241306357\n",
      "   -5.5510 if cp>=-0.10265520215034471 & cv>=-0.019121920689940442 & pa>=-0.03923779353499412\n",
      "Run episode 812 with rewards 138.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 813 ===========\n",
      "133 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1]\n",
      "   -7.4127 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   +0.6842 if cp<=-0.05522804409265518\n",
      "  -10.2138 if pa>=-0.023632127419114118\n",
      "   +3.8861 if \n",
      "   +3.8732 if cp<=-0.32884781956672643\n",
      "--------------\n",
      "   -0.0000 if pa>=-0.026889921352267254 & pav<=-0.5405943036079407\n",
      "   +0.3351 if cp<=0.012834234535694123\n",
      "   -0.0000 if pa>=0.07285664230585098\n",
      "   -4.6616 if cp>=-0.10265520215034471 & cv>=-0.019121920689940442 & pa>=-0.03923779353499412\n",
      "   +2.3556 if cp<=-0.0002582243629149126\n",
      "Run episode 813 with rewards 133.0\n",
      "============ 814 ===========\n",
      "34 actions [1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0]\n",
      "   -8.5681 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "  -10.3323 if pa>=-0.023632127419114118\n",
      "   +4.1868 if \n",
      "   +2.6580 if cp<=-0.32884781956672643\n",
      "   -2.6383 if cp>=-0.34096229076385487 & pa<=-0.07572603374719619 & pav>=0.3079322457313538\n",
      "--------------\n",
      "   -1.8190 if pa>=-0.026889921352267254 & pav<=-0.5405943036079407\n",
      "   -0.1635 if cp<=0.012834234535694123\n",
      "   -1.7321 if cp>=-0.10265520215034471 & cv>=-0.019121920689940442 & pa>=-0.03923779353499412\n",
      "   +3.3140 if cp<=-0.0002582243629149126\n",
      "   +2.3190 if cp>=-0.34096229076385487 & pa<=-0.07572603374719619 & pav>=0.3079322457313538\n",
      "Run episode 814 with rewards 34.0\n",
      "============ 815 ===========\n",
      "52 actions [1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1]\n",
      "   -6.6861 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   -7.1655 if pa>=-0.023632127419114118\n",
      "   +4.3342 if \n",
      "   -0.0004 if cp<=-0.32884781956672643\n",
      "   -4.4982 if cp>=-0.003906810656189917 & cv<=-0.32005358338356016\n",
      "--------------\n",
      "   +0.0645 if pa>=-0.026889921352267254 & pav<=-0.5405943036079407\n",
      "   -2.2720 if cp>=-0.10265520215034471 & cv>=-0.019121920689940442 & pa>=-0.03923779353499412\n",
      "   +3.1185 if cp<=-0.0002582243629149126\n",
      "   +3.9970 if cp>=-0.34096229076385487 & pa<=-0.07572603374719619 & pav>=0.3079322457313538\n",
      "   -2.8071 if cp>=-0.02125366516411304 & pa>=-0.06651261895895004\n",
      "Run episode 815 with rewards 52.0\n",
      "============ 816 ===========\n",
      "24 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -5.1286 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   -7.7450 if pa>=-0.023632127419114118\n",
      "   +3.2246 if \n",
      "   -4.4124 if cp>=-0.003906810656189917 & cv<=-0.32005358338356016\n",
      "   -5.0081 if cp>=0.03220488503575325 & cv<=-0.22621752619743346\n",
      "--------------\n",
      "   -0.0800 if cp>=-0.10265520215034471 & cv>=-0.019121920689940442 & pa>=-0.03923779353499412\n",
      "   +4.0088 if cp<=-0.0002582243629149126\n",
      "   +0.0000 if cp>=-0.34096229076385487 & pa<=-0.07572603374719619 & pav>=0.3079322457313538\n",
      "   -3.2389 if cp>=-0.02125366516411304 & pa>=-0.06651261895895004\n",
      "   +4.9947 if cp>=0.03220488503575325 & cv<=-0.22621752619743346\n",
      "Run episode 816 with rewards 24.0\n",
      "============ 817 ===========\n",
      "37 actions [1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   -0.1052 if pa>=-0.08030913770198822 & pav>=-0.1669993102550506\n",
      "   -8.1826 if pa>=-0.023632127419114118\n",
      "   +4.0696 if cp>=-0.003906810656189917 & cv<=-0.32005358338356016\n",
      "   +4.0696 if cp>=0.03220488503575325 & cv<=-0.22621752619743346\n",
      "   +2.6920 if cv>=-0.11448113620281203\n",
      "--------------\n",
      "   +0.8757 if cp>=-0.10265520215034471 & cv>=-0.019121920689940442 & pa>=-0.03923779353499412\n",
      "   +0.4810 if cp<=-0.0002582243629149126\n",
      "   -0.1420 if cp>=-0.02125366516411304 & pa>=-0.06651261895895004\n",
      "   -0.0087 if cp>=0.03220488503575325 & cv<=-0.22621752619743346\n",
      "   +4.3652 if cp>=0.12920795381069183\n",
      "Run episode 817 with rewards 37.0\n",
      "============ 818 ===========\n",
      "41 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0]\n",
      "   -6.7129 if pa>=-0.023632127419114118\n",
      "   +2.7376 if cp>=-0.003906810656189917 & cv<=-0.32005358338356016\n",
      "   +3.1144 if cp>=0.03220488503575325 & cv<=-0.22621752619743346\n",
      "   -2.0738 if cv>=-0.11448113620281203\n",
      "   +5.5475 if cv>=-0.043623993545770644\n",
      "--------------\n",
      "   +0.1096 if cp>=-0.10265520215034471 & cv>=-0.019121920689940442 & pa>=-0.03923779353499412\n",
      "  +16.1306 if cp<=-0.0002582243629149126\n",
      "   -0.9516 if cp>=-0.02125366516411304 & pa>=-0.06651261895895004\n",
      "   -1.0008 if cp>=0.12920795381069183\n",
      "   +5.3077 if cp>=0.066692154109478 & cv<=-0.043623993545770644 & pa>=-0.09447202682495118\n",
      "Run episode 818 with rewards 41.0\n",
      "============ 819 ===========\n",
      "29 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1]\n",
      "  -11.8199 if pa>=-0.023632127419114118\n",
      "   +3.8841 if cp>=-0.003906810656189917 & cv<=-0.32005358338356016\n",
      "   +3.9213 if cp>=0.03220488503575325 & cv<=-0.22621752619743346\n",
      "   +7.2728 if cv>=-0.043623993545770644\n",
      "   +7.6147 if cp<=0.0517123080790043 & pa<=-0.10847876220941544\n",
      "--------------\n",
      "   +1.1239 if cp<=-0.0002582243629149126\n",
      "   +0.6715 if cp>=-0.02125366516411304 & pa>=-0.06651261895895004\n",
      "   +0.0000 if cp>=0.12920795381069183\n",
      "   -0.1284 if cp>=0.066692154109478 & cv<=-0.043623993545770644 & pa>=-0.09447202682495118\n",
      "  -10.2102 if pa<=-0.10847876220941544 & pa>=-0.10847876220941544\n",
      "Run episode 819 with rewards 29.0\n",
      "origin 49.53566451347549 new 1289.7160049169875 not updated\n",
      "============ 820 ===========\n",
      "78 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "  -11.8199 if pa>=-0.023632127419114118\n",
      "   +3.8841 if cp>=-0.003906810656189917 & cv<=-0.32005358338356016\n",
      "   +3.9213 if cp>=0.03220488503575325 & cv<=-0.22621752619743346\n",
      "   +7.2728 if cv>=-0.043623993545770644\n",
      "   +7.6147 if cp<=0.0517123080790043 & pa<=-0.10847876220941544\n",
      "--------------\n",
      "   -0.0005 if cp<=-0.0002582243629149126\n",
      "   +1.1966 if cp>=-0.02125366516411304 & pa>=-0.06651261895895004\n",
      "   +0.0000 if cp>=0.066692154109478 & cv<=-0.043623993545770644 & pa>=-0.09447202682495118\n",
      "   +0.0000 if pa<=-0.10847876220941544 & pa>=-0.10847876220941544\n",
      "   -2.4881 if cp>=0.1531858175992966 & cv<=-0.0336802095174789\n",
      "Run episode 820 with rewards 78.0\n",
      "============ 821 ===========\n",
      "28 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0]\n",
      "   -9.2218 if pa>=-0.023632127419114118\n",
      "   +0.0001 if cp>=0.03220488503575325 & cv<=-0.22621752619743346\n",
      "   +4.7471 if cv>=-0.043623993545770644\n",
      "   +4.7086 if cp<=0.0517123080790043 & pa<=-0.10847876220941544\n",
      "   -1.9020 if cp>=-0.048043880611658096 & pav>=0.17005795240402222\n",
      "--------------\n",
      "   -0.7141 if cp<=-0.0002582243629149126\n",
      "   -0.0000 if cp>=-0.02125366516411304 & pa>=-0.06651261895895004\n",
      "   -0.0000 if pa<=-0.10847876220941544 & pa>=-0.10847876220941544\n",
      "   -0.0000 if cp>=0.1531858175992966 & cv<=-0.0336802095174789\n",
      "   +2.6097 if cp>=-0.048043880611658096 & pav>=0.17005795240402222\n",
      "Run episode 821 with rewards 28.0\n",
      "============ 822 ===========\n",
      "38 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1]\n",
      "   -7.1176 if pa>=-0.023632127419114118\n",
      "   +3.2642 if cv>=-0.043623993545770644\n",
      "   -0.0000 if cp<=0.0517123080790043 & pa<=-0.10847876220941544\n",
      "   -1.0137 if cp>=-0.048043880611658096 & pav>=0.17005795240402222\n",
      "   +2.4126 if cp>=0.1641111969947815\n",
      "--------------\n",
      "   +0.0000 if cp<=-0.0002582243629149126\n",
      "   +0.8487 if cp>=-0.02125366516411304 & pa>=-0.06651261895895004\n",
      "   -0.3844 if cp>=0.1531858175992966 & cv<=-0.0336802095174789\n",
      "   +2.8746 if cp>=-0.048043880611658096 & pav>=0.17005795240402222\n",
      "   -1.9721 if pav>=-0.0043178369756787785\n",
      "Run episode 822 with rewards 38.0\n",
      "============ 823 ===========\n",
      "75 actions [1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0]\n",
      "   -6.8850 if pa>=-0.023632127419114118\n",
      "   +3.4821 if cv>=-0.043623993545770644\n",
      "   +0.0319 if cp>=-0.048043880611658096 & pav>=0.17005795240402222\n",
      "   +3.8316 if cp>=0.1641111969947815\n",
      "   -2.4323 if pav>=0.7055728435516357\n",
      "--------------\n",
      "   +0.6678 if cp>=-0.02125366516411304 & pa>=-0.06651261895895004\n",
      "   -1.5770 if cp>=0.1531858175992966 & cv<=-0.0336802095174789\n",
      "   +0.6227 if cp>=-0.048043880611658096 & pav>=0.17005795240402222\n",
      "   -0.7794 if pav>=-0.0043178369756787785\n",
      "   +3.3104 if pav>=0.7055728435516357\n",
      "Run episode 823 with rewards 75.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 824 ===========\n",
      "40 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0]\n",
      "   -6.3910 if pa>=-0.023632127419114118\n",
      "   +2.7241 if cv>=-0.043623993545770644\n",
      "   -0.0000 if cp>=0.1641111969947815\n",
      "   -1.5840 if pav>=0.7055728435516357\n",
      "   -4.7254 if cp>=-0.08255252540111539 & pav>=0.3803399980068208\n",
      "--------------\n",
      "   +1.9183 if cp>=-0.02125366516411304 & pa>=-0.06651261895895004\n",
      "   -0.0000 if cp>=0.1531858175992966 & cv<=-0.0336802095174789\n",
      "   -1.0116 if pav>=-0.0043178369756787785\n",
      "   +2.3098 if pav>=0.7055728435516357\n",
      "   +5.2011 if cp>=-0.08255252540111539 & pa<=-0.06537016332149505 & pav>=0.3803399980068208\n",
      "Run episode 824 with rewards 40.0\n",
      "============ 825 ===========\n",
      "15 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0]\n",
      "   -5.1780 if pa>=-0.023632127419114118\n",
      "   +2.4918 if cv>=-0.043623993545770644\n",
      "   -0.0000 if pav>=0.7055728435516357\n",
      "   -0.2079 if cp>=-0.08255252540111539 & pav>=0.3803399980068208\n",
      "   -4.3828 if pa<=-0.11740158945322035 & pav>=0.166239157319069\n",
      "--------------\n",
      "   +4.7457 if cp>=-0.02125366516411304 & pa>=-0.06651261895895004\n",
      "   -0.2375 if pav>=-0.0043178369756787785\n",
      "   +0.0000 if pav>=0.7055728435516357\n",
      "   +0.6057 if cp>=-0.08255252540111539 & pa<=-0.06537016332149505 & pav>=0.3803399980068208\n",
      "   -4.7292 if cv>=0.9338870644569397\n",
      "Run episode 825 with rewards 15.0\n",
      "============ 826 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 0, 1, 0, 1, 1]\n",
      "   -0.0060 if pa>=-0.023632127419114118\n",
      "  -11.4839 if cv>=-0.043623993545770644\n",
      "   -0.0000 if cp>=-0.08255252540111539 & pav>=0.3803399980068208\n",
      "   -0.0000 if pa<=-0.11740158945322035 & pav>=0.166239157319069\n",
      "  +10.9473 if pa>=-0.18868781328201295 & pav<=-0.4748471140861509\n",
      "--------------\n",
      "   +4.8449 if cp>=-0.02125366516411304 & pa>=-0.06651261895895004\n",
      "   +0.0000 if pav>=-0.0043178369756787785\n",
      "   +0.0000 if cp>=-0.08255252540111539 & pa<=-0.06537016332149505 & pav>=0.3803399980068208\n",
      "   -0.4120 if cv>=0.9338870644569397\n",
      "  -10.8635 if cv<=-0.021022325754165648 & pa<=-0.18868781328201295\n",
      "Run episode 826 with rewards 10.0\n",
      "============ 827 ===========\n",
      "23 actions [0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1]\n",
      "   +0.0051 if pa>=-0.023632127419114118\n",
      "  +11.1251 if cv>=-0.043623993545770644\n",
      "   +0.0000 if pa<=-0.11740158945322035 & pav>=0.166239157319069\n",
      "  +11.6241 if pa>=-0.18868781328201295 & pav<=-0.4748471140861509\n",
      "   +5.9503 if cp>=0.0635843276977539\n",
      "--------------\n",
      "   -0.2670 if cp>=-0.02125366516411304 & pa>=-0.06651261895895004\n",
      "   -0.0000 if cp>=-0.08255252540111539 & pa<=-0.06537016332149505 & pav>=0.3803399980068208\n",
      "  +17.1593 if cv>=0.9338870644569397\n",
      "   -0.7294 if cv<=-0.021022325754165648 & pa<=-0.18868781328201295\n",
      "   +1.0000 if cp>=0.0635843276977539\n",
      "Run episode 827 with rewards 23.0\n",
      "============ 828 ===========\n",
      "25 actions [0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1]\n",
      "   -1.0848 if pa>=-0.023632127419114118\n",
      "   +4.6291 if cv>=-0.043623993545770644\n",
      "   +0.0000 if pa>=-0.18868781328201295 & pav<=-0.4748471140861509\n",
      "   +0.0000 if cp>=0.0635843276977539\n",
      "   +3.4359 if cp>=-0.05553732439875603 & pa>=-0.009383329562842846\n",
      "--------------\n",
      "   -0.0000 if cp>=-0.02125366516411304 & pa>=-0.06651261895895004\n",
      "   -0.0000 if cv>=0.9338870644569397\n",
      "   -0.0000 if cv<=-0.021022325754165648 & pa<=-0.18868781328201295\n",
      "   -0.0000 if cp>=0.0635843276977539\n",
      "   +3.3256 if cp>=-0.0700481429696083 & cv<=-0.06355783417820902 & pa<=-0.009383329562842846\n",
      "Run episode 828 with rewards 25.0\n",
      "============ 829 ===========\n",
      "23 actions [0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1]\n",
      "   -3.2482 if pa>=-0.023632127419114118\n",
      "   +2.7094 if cv>=-0.043623993545770644\n",
      "   +0.0000 if pa>=-0.18868781328201295 & pav<=-0.4748471140861509\n",
      "   +3.2334 if cp>=-0.05553732439875603 & pa>=-0.009383329562842846\n",
      "   +4.6011 if cv>=-0.21892825961112977\n",
      "--------------\n",
      "   +0.0000 if cv>=0.9338870644569397\n",
      "   +0.0000 if cv<=-0.021022325754165648 & pa<=-0.18868781328201295\n",
      "   +0.0000 if cp>=0.0635843276977539\n",
      "   +2.1357 if cp>=-0.0700481429696083 & cv<=-0.06355783417820902 & pa<=-0.009383329562842846\n",
      "   +4.4867 if cp>=-0.09741552919149399 & cv<=-0.21892825961112977 & cv<=-0.4165248990058899\n",
      "Run episode 829 with rewards 23.0\n",
      "============ 830 ===========\n",
      "34 actions [1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -3.2885 if pa>=-0.023632127419114118\n",
      "   +2.2403 if cv>=-0.043623993545770644\n",
      "   +1.2417 if cp>=-0.05553732439875603 & pa>=-0.009383329562842846\n",
      "   +4.6823 if cv>=-0.21892825961112977\n",
      "   -2.2986 if cp>=-0.03959100693464279\n",
      "--------------\n",
      "   +0.0000 if cv>=0.9338870644569397\n",
      "   +0.0000 if cp>=0.0635843276977539\n",
      "   +3.8460 if cp>=-0.0700481429696083 & cv<=-0.06355783417820902 & pa<=-0.009383329562842846\n",
      "   +0.0000 if cp>=-0.09741552919149399 & cv<=-0.21892825961112977 & cv<=-0.4165248990058899\n",
      "   +2.6698 if cp>=-0.04905690178275107 & cv<=-0.17772068679332734\n",
      "Run episode 830 with rewards 34.0\n",
      "============ 831 ===========\n",
      "115 actions [1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0]\n",
      "   -7.2227 if pa>=-0.023632127419114118\n",
      "   +1.5374 if cv>=-0.043623993545770644\n",
      "   -0.1710 if cv>=-0.21892825961112977\n",
      "   -0.4092 if cp>=-0.03959100693464279\n",
      "   +3.2435 if pav<=-0.05673154294490812\n",
      "--------------\n",
      "   +0.0000 if cv>=0.9338870644569397\n",
      "   +5.1436 if cp>=-0.0700481429696083 & cv<=-0.06355783417820902 & pa<=-0.009383329562842846\n",
      "   +0.0000 if cp>=-0.09741552919149399 & cv<=-0.21892825961112977 & cv<=-0.4165248990058899\n",
      "   +0.0056 if cp>=-0.04905690178275107 & cv<=-0.17772068679332734\n",
      "   +3.5975 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "Run episode 831 with rewards 115.0\n",
      "============ 832 ===========\n",
      "15 actions [0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0]\n",
      "   +2.2615 if pa>=-0.023632127419114118\n",
      "   +1.8656 if cv>=-0.043623993545770644\n",
      "   +0.0000 if cp>=-0.03959100693464279\n",
      "   +2.9793 if pav<=-0.05673154294490812\n",
      "   +4.4415 if cp>=-0.0417468436062336\n",
      "--------------\n",
      "   +4.8115 if cp>=-0.0700481429696083 & cv<=-0.06355783417820902 & pa<=-0.009383329562842846\n",
      "   +4.4230 if cp>=-0.09741552919149399 & cv<=-0.21892825961112977 & cv<=-0.4165248990058899\n",
      "   +0.0667 if cp>=-0.04905690178275107 & cv<=-0.17772068679332734\n",
      "   +3.8475 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -4.5695 if cp>=-0.0417468436062336\n",
      "Run episode 832 with rewards 15.0\n",
      "============ 833 ===========\n",
      "34 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   -8.3730 if pa>=-0.023632127419114118\n",
      "   +0.0137 if cv>=-0.043623993545770644\n",
      "   +0.0214 if pav<=-0.05673154294490812\n",
      "  +10.5341 if cp>=-0.0417468436062336\n",
      "   -4.9219 if cp<=-0.0929919347167015 & cv>=-0.5999084830284118\n",
      "--------------\n",
      "   +1.8471 if cp>=-0.0700481429696083 & cv<=-0.06355783417820902 & pa<=-0.009383329562842846\n",
      "   +1.4252 if cp>=-0.09741552919149399 & cv<=-0.21892825961112977 & cv<=-0.4165248990058899\n",
      "  +12.5141 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -6.8511 if cp>=-0.0417468436062336\n",
      "   +6.0000 if cp<=-0.0929919347167015 & cv>=-0.5999084830284118\n",
      "Run episode 833 with rewards 34.0\n",
      "============ 834 ===========\n",
      "14 actions [0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0]\n",
      "   -5.7267 if pa>=-0.023632127419114118\n",
      "   -1.1755 if pav<=-0.05673154294490812\n",
      "  +10.1506 if cp>=-0.0417468436062336\n",
      "   -0.0000 if cp<=-0.0929919347167015 & cv>=-0.5999084830284118\n",
      "   +1.7738 if cp<=-0.035622831434011445\n",
      "--------------\n",
      "   +0.0857 if cp>=-0.0700481429696083 & cv<=-0.06355783417820902 & pa<=-0.009383329562842846\n",
      "   -3.8782 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +8.8715 if cp>=-0.0417468436062336\n",
      "   +0.0073 if cp<=-0.0929919347167015 & cv>=-0.5999084830284118\n",
      "  -14.3865 if pa<=-0.03891203999519348\n",
      "Run episode 834 with rewards 14.0\n",
      "============ 835 ===========\n",
      "33 actions [0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -1.5318 if pa>=-0.023632127419114118\n",
      "   +0.4214 if pav<=-0.05673154294490812\n",
      "   +6.2492 if cp>=-0.0417468436062336\n",
      "  +11.4104 if cp<=-0.035622831434011445\n",
      "   +1.2143 if cp<=-0.1023374393582344\n",
      "--------------\n",
      "   -2.0000 if cp>=-0.0700481429696083 & cv<=-0.06355783417820902 & pa<=-0.009383329562842846\n",
      "  +17.3188 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -9.9445 if cp>=-0.0417468436062336\n",
      "   +6.5804 if pa<=-0.03891203999519348\n",
      "   +3.7119 if pa>=0.206472247838974\n",
      "Run episode 835 with rewards 33.0\n",
      "============ 836 ===========\n",
      "22 actions [1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1]\n",
      "   +1.0675 if pa>=-0.023632127419114118\n",
      "   +1.1193 if cp>=-0.0417468436062336\n",
      "   +5.8512 if cp<=-0.035622831434011445\n",
      "   +0.0000 if cp<=-0.1023374393582344\n",
      "   +1.5141 if cp<=0.004807969741523279\n",
      "--------------\n",
      "   +9.5424 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.8510 if cp>=-0.0417468436062336\n",
      "   -0.0000 if pa<=-0.03891203999519348\n",
      "   -0.0000 if pa>=0.206472247838974\n",
      "   +4.2973 if \n",
      "Run episode 836 with rewards 22.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 837 ===========\n",
      "26 actions [0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1]\n",
      "   +1.4636 if pa>=-0.023632127419114118\n",
      "   +1.4636 if cp>=-0.0417468436062336\n",
      "   -0.0000 if cp<=-0.035622831434011445\n",
      "   +0.0019 if cp<=0.004807969741523279\n",
      "   -2.9099 if cp<=0.03190875686705113 & pa>=0.04645461142063141\n",
      "--------------\n",
      "   -1.1431 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +2.2066 if cp>=-0.0417468436062336\n",
      "   -0.0000 if pa<=-0.03891203999519348\n",
      "   +2.2066 if \n",
      "   -3.0779 if cp>=0.01846439763903618\n",
      "Run episode 837 with rewards 26.0\n",
      "============ 838 ===========\n",
      "38 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -6.5393 if pa>=-0.023632127419114118\n",
      "  +14.9748 if cp>=-0.0417468436062336\n",
      "   -6.7066 if cp<=0.004807969741523279\n",
      "   -2.9876 if cp<=0.03190875686705113 & pa>=0.04645461142063141\n",
      "   +3.8083 if cp<=-0.014455646276473999 & cp>=-0.014455646276473999\n",
      "--------------\n",
      "   +8.1254 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -4.3314 if cp>=-0.0417468436062336\n",
      "   -1.6589 if \n",
      "   -9.6993 if cp>=0.01846439763903618\n",
      "   +1.0000 if cp>=0.19433210790157318\n",
      "Run episode 838 with rewards 38.0\n",
      "============ 839 ===========\n",
      "16 actions [1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1]\n",
      "   +2.0457 if pa>=-0.023632127419114118\n",
      "   +2.9119 if cp>=-0.0417468436062336\n",
      "   -2.1633 if cp<=0.004807969741523279\n",
      "   +0.0000 if cp<=-0.014455646276473999 & cp>=-0.014455646276473999\n",
      "   -3.5463 if cp<=0.006192276068031797 & pav>=1.408513617515564\n",
      "--------------\n",
      "   +1.2911 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +1.3284 if cp>=-0.0417468436062336\n",
      "   +1.3284 if \n",
      "   +0.0373 if cp>=0.01846439763903618\n",
      "   -4.8433 if cv<=-0.8734624743461609 & pav<=1.408513617515564\n",
      "Run episode 839 with rewards 16.0\n",
      "============ 840 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "  +14.3405 if pa>=-0.023632127419114118\n",
      "  -10.7889 if cp>=-0.0417468436062336\n",
      "   -3.1890 if cp<=0.004807969741523279\n",
      "   +0.5165 if cp<=0.006192276068031797 & pav>=1.408513617515564\n",
      "   -5.2820 if cp>=0.09644676744937897 & cv>=0.37139537930488586\n",
      "--------------\n",
      "   -4.6263 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +4.8365 if cp>=-0.0417468436062336\n",
      "   +4.8365 if \n",
      "   -0.0001 if cv<=-0.8734624743461609 & pav<=1.408513617515564\n",
      "   +9.4211 if cp>=0.03215428814291954\n",
      "Run episode 840 with rewards 9.0\n",
      "============ 841 ===========\n",
      "11 actions [1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.1261 if pa>=-0.023632127419114118\n",
      "   -0.0938 if cp>=-0.0417468436062336\n",
      "   -0.1264 if cp<=0.004807969741523279\n",
      "   +0.0000 if cp>=0.09644676744937897 & cv>=0.37139537930488586\n",
      "   +0.0077 if cp<=0.025113640725612653 & cp>=-0.011055708117783069\n",
      "--------------\n",
      "   +1.1560 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +1.1559 if cp>=-0.0417468436062336\n",
      "   +1.1559 if \n",
      "   -0.0001 if cp>=0.03215428814291954\n",
      "   +0.1886 if cp>=-0.011055708117783069\n",
      "Run episode 841 with rewards 11.0\n",
      "============ 842 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0160 if pa>=-0.023632127419114118\n",
      "  +29.1799 if cp>=-0.0417468436062336\n",
      "   -5.8321 if cp<=0.004807969741523279\n",
      "  -20.4840 if cp<=0.025113640725612653 & cp>=-0.011055708117783069\n",
      "   -0.5181 if cp<=0.06783881783485413\n",
      "--------------\n",
      "   -7.0085 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  -10.1825 if cp>=-0.0417468436062336\n",
      "  -10.1825 if \n",
      "  -10.6384 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.06783881783485413\n",
      "Run episode 842 with rewards 10.0\n",
      "============ 843 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp>=-0.0417468436062336\n",
      "   -0.0000 if cp<=0.004807969741523279\n",
      "   -0.0000 if cp<=0.025113640725612653 & cp>=-0.011055708117783069\n",
      "   -0.0000 if cp<=0.06783881783485413\n",
      "   +0.0000 if pa>=0.20180636644363403\n",
      "--------------\n",
      "  +23.8603 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +7.1469 if cp>=-0.0417468436062336\n",
      "  +18.0987 if \n",
      "   +1.4116 if cp>=-0.011055708117783069\n",
      "   +1.0000 if pa>=0.20180636644363403\n",
      "Run episode 843 with rewards 9.0\n",
      "============ 844 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.0417468436062336\n",
      "   -0.0000 if cp<=0.004807969741523279\n",
      "   +0.0000 if cp<=0.06783881783485413\n",
      "   -0.0000 if pa>=0.20180636644363403\n",
      "   +0.0000 if cp>=0.023306390643119814\n",
      "--------------\n",
      "  -12.2829 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -5.6006 if cp>=-0.0417468436062336\n",
      "  -11.6186 if \n",
      "   -2.4491 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.04604074209928514\n",
      "Run episode 844 with rewards 9.0\n",
      "origin 1.3401103608628009e-05 new 1.3401103611615882e-05 not updated\n",
      "============ 845 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=-0.0417468436062336\n",
      "   -0.0000 if cp<=0.004807969741523279\n",
      "   +0.0000 if cp<=0.06783881783485413\n",
      "   -0.0000 if pa>=0.20180636644363403\n",
      "   +0.0000 if cp>=0.023306390643119814\n",
      "--------------\n",
      "  +12.2829 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +5.6006 if cp>=-0.0417468436062336\n",
      "  +11.6186 if \n",
      "   +2.4491 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.08325323909521103\n",
      "Run episode 845 with rewards 9.0\n",
      "origin 1.652260407755254e-05 new 1.6522604077778723e-05 not updated\n",
      "============ 846 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.0417468436062336\n",
      "   -0.0000 if cp<=0.004807969741523279\n",
      "   +0.0000 if cp<=0.06783881783485413\n",
      "   -0.0000 if pa>=0.20180636644363403\n",
      "   +0.0000 if cp>=0.023306390643119814\n",
      "--------------\n",
      "  -23.0762 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  -10.5227 if cp>=-0.0417468436062336\n",
      "  -21.8287 if \n",
      "   -4.6019 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.05636055916547776 & cp>=0.025244850479066383\n",
      "Run episode 846 with rewards 9.0\n",
      "============ 847 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=-0.0417468436062336\n",
      "   -0.0000 if cp<=0.004807969741523279\n",
      "   +0.0000 if cp<=0.06783881783485413\n",
      "   +0.0000 if cp>=0.023306390643119814\n",
      "   +0.0000 if cp<=0.030480073764920235\n",
      "--------------\n",
      "  +23.0762 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  +10.5227 if cp>=-0.0417468436062336\n",
      "  +21.8287 if \n",
      "   +4.6019 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.030480073764920235\n",
      "Run episode 847 with rewards 10.0\n",
      "============ 848 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.0417468436062336\n",
      "   -0.0000 if cp<=0.004807969741523279\n",
      "   +0.0000 if cp<=0.06783881783485413\n",
      "   +0.0000 if cp>=0.023306390643119814\n",
      "   +0.0000 if cp>=0.1434757113456726\n",
      "--------------\n",
      "   -6.7261 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -5.2554 if cp>=-0.0417468436062336\n",
      "   -9.1124 if \n",
      "   -3.2356 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.05148868635296822\n",
      "Run episode 848 with rewards 10.0\n",
      "============ 849 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=-0.0417468436062336\n",
      "   -0.0000 if cp<=0.004807969741523279\n",
      "   -0.0000 if cp<=0.06783881783485413\n",
      "   +0.0000 if cp>=0.023306390643119814\n",
      "   +0.0000 if cp>=-0.09954945892095565\n",
      "--------------\n",
      "   +7.2804 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +4.6075 if cp>=-0.0417468436062336\n",
      "   +9.6328 if \n",
      "   +3.1897 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.09954945892095565\n",
      "Run episode 849 with rewards 10.0\n",
      "============ 850 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.0417468436062336\n",
      "   -0.0000 if cp<=0.004807969741523279\n",
      "   -0.0000 if cp<=0.06783881783485413\n",
      "   +0.0000 if cp>=-0.09954945892095565\n",
      "   +0.0000 if cp<=0.10944398641586305\n",
      "--------------\n",
      "  -18.1832 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  -11.5218 if cp>=-0.0417468436062336\n",
      "  -24.0728 if \n",
      "   -7.9806 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.04131789430975914\n",
      "Run episode 850 with rewards 9.0\n",
      "============ 851 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=-0.0417468436062336\n",
      "   +0.0000 if cp<=0.06783881783485413\n",
      "   +0.0000 if cp>=-0.09954945892095565\n",
      "   +0.0000 if cp<=0.10944398641586305\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +18.1832 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  +11.5218 if cp>=-0.0417468436062336\n",
      "  +24.0728 if \n",
      "   +7.9806 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.06078440025448799\n",
      "Run episode 851 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 852 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.0417468436062336\n",
      "   +0.0000 if cp<=0.06783881783485413\n",
      "   +0.0000 if cp>=-0.09954945892095565\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.11069078743457794\n",
      "--------------\n",
      "   -6.3259 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -4.4817 if cp>=-0.0417468436062336\n",
      "   -8.9812 if \n",
      "   -3.4664 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.009092813171446322\n",
      "Run episode 852 with rewards 10.0\n",
      "============ 853 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp>=-0.0417468436062336\n",
      "   -0.0000 if cp<=0.06783881783485413\n",
      "   +0.0000 if cp>=-0.09954945892095565\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp>=-0.13346708714962005\n",
      "--------------\n",
      "   +6.7002 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +4.4411 if cp>=-0.0417468436062336\n",
      "   +9.3314 if \n",
      "   +3.4350 if cp>=-0.011055708117783069\n",
      "   +0.8064 if cp>=-0.09364504218101502\n",
      "Run episode 853 with rewards 10.0\n",
      "============ 854 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cp<=0.06783881783485413\n",
      "   +0.0000 if cp>=-0.09954945892095565\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.13346708714962005\n",
      "   +0.0000 if cp<=0.12199749648571015\n",
      "--------------\n",
      "  -16.3204 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  -10.8366 if cp>=-0.0417468436062336\n",
      "  -22.7485 if \n",
      "   -8.3859 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.05600930526852608\n",
      "Run episode 854 with rewards 11.0\n",
      "============ 855 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp<=0.06783881783485413\n",
      "   +0.0000 if cp>=-0.09954945892095565\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.13346708714962005\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +17.0448 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +9.2520 if cp>=-0.0417468436062336\n",
      "  +23.3107 if \n",
      "   +6.8349 if cp>=-0.011055708117783069\n",
      "   +0.9867 if cp>=-0.10385724902153015\n",
      "Run episode 855 with rewards 10.0\n",
      "============ 856 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=0.06783881783485413\n",
      "   +0.0000 if cp>=-0.09954945892095565\n",
      "   +0.0000 if \n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.12158681452274323\n",
      "--------------\n",
      "   -6.9042 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -4.1986 if cp>=-0.0417468436062336\n",
      "  -10.0789 if \n",
      "   -3.4254 if cp>=-0.011055708117783069\n",
      "   +0.8777 if cp<=0.06710688769817352 & cp>=-0.0042602617992088185\n",
      "Run episode 856 with rewards 10.0\n",
      "============ 857 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp<=0.06783881783485413\n",
      "   -0.0000 if cp>=-0.09954945892095565\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=-0.010387426987290381\n",
      "   +0.0000 if pa>=0.18878094851970673\n",
      "--------------\n",
      "   +6.9042 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +4.1986 if cp>=-0.0417468436062336\n",
      "  +10.0789 if \n",
      "   +3.4254 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.08998237103223801\n",
      "Run episode 857 with rewards 9.0\n",
      "============ 858 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cp<=0.06783881783485413\n",
      "   +0.0000 if cp>=-0.09954945892095565\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp<=-0.010387426987290381\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  -17.2846 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  -10.5229 if cp>=-0.0417468436062336\n",
      "  -25.2440 if \n",
      "   -8.5871 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.03303153738379479\n",
      "Run episode 858 with rewards 9.0\n",
      "============ 859 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp<=0.06783881783485413\n",
      "   +0.0000 if cp>=-0.09954945892095565\n",
      "   +0.0000 if \n",
      "   +0.0000 if \n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +17.2846 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  +10.5229 if cp>=-0.0417468436062336\n",
      "  +25.2440 if \n",
      "   +8.5871 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.028067443147301675\n",
      "Run episode 859 with rewards 11.0\n",
      "============ 860 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.09954945892095565\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp<=0.014139150269329569\n",
      "   -0.0000 if cp<=0.014139150269329569\n",
      "   +0.0000 if cp<=0.014139150269329569\n",
      "--------------\n",
      "   -6.5780 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -4.1023 if cp>=-0.0417468436062336\n",
      "   -9.7547 if \n",
      "   -3.4341 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.01981981471180916\n",
      "Run episode 860 with rewards 10.0\n",
      "============ 861 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp>=-0.09954945892095565\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp>=-0.016518618725240228\n",
      "   -0.0000 if cp>=-0.056311208009719844\n",
      "   +0.0000 if cp>=0.025557242333889008\n",
      "--------------\n",
      "   +6.5780 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +4.1023 if cp>=-0.0417468436062336\n",
      "   +9.7547 if \n",
      "   +3.4341 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.025557242333889008\n",
      "Run episode 861 with rewards 11.0\n",
      "============ 862 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cp>=-0.09954945892095565\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.016518618725240228\n",
      "   -0.0000 if cp>=-0.056311208009719844\n",
      "   +0.0000 if cp<=0.04671940580010414\n",
      "--------------\n",
      "  -16.1329 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  -10.0767 if cp>=-0.0417468436062336\n",
      "  -23.9396 if \n",
      "   -8.4379 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.06484659761190414\n",
      "Run episode 862 with rewards 9.0\n",
      "============ 863 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=-0.09954945892095565\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.016518618725240228\n",
      "   +0.0000 if cp>=-0.056311208009719844\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +16.1329 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  +10.0767 if cp>=-0.0417468436062336\n",
      "  +23.9396 if \n",
      "   +8.4379 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.03044514209032059\n",
      "Run episode 863 with rewards 10.0\n",
      "============ 864 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.09954945892095565\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.056311208009719844\n",
      "   -0.0000 if cp<=-0.014356415905058383\n",
      "   +0.0000 if cp<=-0.014356415905058383\n",
      "--------------\n",
      "   -5.2529 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -4.0270 if cp>=-0.0417468436062336\n",
      "   -8.8516 if \n",
      "   -3.9067 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.014356415905058383\n",
      "Run episode 864 with rewards 8.0\n",
      "============ 865 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp>=-0.09954945892095565\n",
      "   -0.0001 if \n",
      "   +0.0000 if cp>=-0.056311208009719844\n",
      "   +0.0000 if cv>=0.028189880773425102\n",
      "   +0.0000 if cp>=-0.08984528630971908\n",
      "--------------\n",
      "   +6.0780 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.7990 if cp>=-0.0417468436062336\n",
      "   +9.6020 if \n",
      "   +3.8256 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.08984528630971908\n",
      "Run episode 865 with rewards 9.0\n",
      "============ 866 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.09954945892095565\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.056311208009719844\n",
      "   +0.0000 if cv>=0.028189880773425102\n",
      "   +0.0000 if cp<=-0.027854081988334656\n",
      "--------------\n",
      "  -14.6449 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -9.1783 if cp>=-0.0417468436062336\n",
      "  -23.1630 if \n",
      "   -9.2452 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.018028270825743674\n",
      "Run episode 866 with rewards 8.0\n",
      "============ 867 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=-0.09954945892095565\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.056311208009719844\n",
      "   +0.0000 if cv>=0.028189880773425102\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +14.6449 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +9.1783 if cp>=-0.0417468436062336\n",
      "  +23.1630 if \n",
      "   +9.2452 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.07202304899692535\n",
      "Run episode 867 with rewards 8.0\n",
      "============ 868 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.056311208009719844\n",
      "   +0.0000 if cv>=0.028189880773425102\n",
      "   -0.0000 if cp<=-0.03735487163066864\n",
      "   +0.0000 if pav>=0.0498993843793869\n",
      "--------------\n",
      "   -5.5018 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -4.1998 if cp>=-0.0417468436062336\n",
      "   -9.4165 if \n",
      "   -4.1118 if cp>=-0.011055708117783069\n",
      "   +0.9386 if cp>=0.03566761687397957\n",
      "Run episode 868 with rewards 10.0\n",
      "============ 869 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp>=-0.056311208009719844\n",
      "   +0.0000 if cv>=0.028189880773425102\n",
      "   -0.0000 if cp<=-0.03735487163066864\n",
      "   +0.0000 if pa>=0.16199545562267303\n",
      "--------------\n",
      "   +6.3376 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +4.1292 if cp>=-0.0417468436062336\n",
      "   +9.8160 if \n",
      "   +3.7418 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.038768237084150316\n",
      "Run episode 869 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 870 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.056311208009719844\n",
      "   +0.0000 if cp<=-0.03735487163066864\n",
      "   +0.0000 if pa>=0.16199545562267303\n",
      "   +0.0000 if cp<=0.06495516672730448\n",
      "--------------\n",
      "  -15.5587 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  -10.1515 if cp>=-0.0417468436062336\n",
      "  -24.1126 if \n",
      "   -9.2004 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.04273758009076119\n",
      "Run episode 870 with rewards 9.0\n",
      "============ 871 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.056311208009719844\n",
      "   +0.0000 if cp<=-0.03735487163066864\n",
      "   +0.0000 if cp<=0.06495516672730448\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +15.5587 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  +10.1515 if cp>=-0.0417468436062336\n",
      "  +24.1126 if \n",
      "   +9.2004 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.02785092554986477\n",
      "Run episode 871 with rewards 11.0\n",
      "============ 872 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.056311208009719844\n",
      "   -0.0000 if cp<=0.06495516672730448\n",
      "   -0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "--------------\n",
      "   -5.5471 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.8641 if cp>=-0.0417468436062336\n",
      "   -8.8416 if \n",
      "   -3.5250 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.05989469215273857\n",
      "Run episode 872 with rewards 10.0\n",
      "============ 873 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=-0.056311208009719844\n",
      "   -0.0001 if cp<=0.06495516672730448\n",
      "   -0.0001 if cp<=0.09421565383672716\n",
      "   -0.0001 if cp<=-0.02571234069764614\n",
      "   -0.0001 if cp<=-0.06782390773296357\n",
      "--------------\n",
      "   +6.9705 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.4403 if cp>=-0.0417468436062336\n",
      "   +9.5574 if \n",
      "   +2.7718 if cp>=-0.011055708117783069\n",
      "   +1.0000 if pa>=0.18246857821941376\n",
      "Run episode 873 with rewards 8.0\n",
      "============ 874 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=0.06495516672730448\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if cp<=-0.02571234069764614\n",
      "   +0.0000 if cp<=-0.06782390773296357\n",
      "   +0.0000 if cp<=0.01965144500136377\n",
      "--------------\n",
      "  -16.8416 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -8.3779 if cp>=-0.0417468436062336\n",
      "  -23.1575 if \n",
      "   -6.7627 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.043039538711309444\n",
      "Run episode 874 with rewards 10.0\n",
      "============ 875 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp<=0.06495516672730448\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if cp<=-0.02571234069764614\n",
      "   +0.0000 if cp<=0.01965144500136377\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +16.8416 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +8.3779 if cp>=-0.0417468436062336\n",
      "  +23.1575 if \n",
      "   +6.7627 if cp>=-0.011055708117783069\n",
      "   +1.0000 if pa>=0.19771774113178253\n",
      "Run episode 875 with rewards 9.0\n",
      "============ 876 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=0.06495516672730448\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if cp<=0.01965144500136377\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.06249431148171425\n",
      "--------------\n",
      "   -5.8879 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -4.7789 if cp>=-0.0417468436062336\n",
      "  -10.2193 if \n",
      "   -4.8297 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.007788338791578997\n",
      "Run episode 876 with rewards 10.0\n",
      "============ 877 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp<=0.06495516672730448\n",
      "   -0.0000 if cp<=0.09421565383672716\n",
      "   -0.0000 if cp<=0.01965144500136377\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp>=-0.0465687446296215\n",
      "--------------\n",
      "   +6.1252 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +4.5267 if cp>=-0.0417468436062336\n",
      "  +10.4326 if \n",
      "   +4.8028 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.0465687446296215 & cp>=-0.11644938290119171\n",
      "Run episode 877 with rewards 9.0\n",
      "============ 878 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cp<=0.06495516672730448\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   -0.0000 if cp<=0.01965144500136377\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.0493598960340023\n",
      "--------------\n",
      "  -15.6115 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  -11.5398 if cp>=-0.0417468436062336\n",
      "  -26.5923 if \n",
      "  -12.2436 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.06027125120162964\n",
      "Run episode 878 with rewards 9.0\n",
      "============ 879 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp<=0.06495516672730448\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.0493598960340023\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +15.6115 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  +11.5398 if cp>=-0.0417468436062336\n",
      "  +26.5923 if \n",
      "  +12.2436 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.084559565782547\n",
      "Run episode 879 with rewards 10.0\n",
      "============ 880 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=0.06495516672730448\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.035459516569972045\n",
      "   +0.0000 if cp<=0.035459516569972045 & cp>=0.007609676755964757\n",
      "--------------\n",
      "   -5.2062 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -4.0285 if cp>=-0.0417468436062336\n",
      "   -9.1303 if \n",
      "   -4.2670 if cp>=-0.011055708117783069\n",
      "   +0.9983 if cp<=0.07581618428230286\n",
      "Run episode 880 with rewards 10.0\n",
      "============ 881 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0001 if cp<=0.06495516672730448\n",
      "   -0.0001 if cp<=0.09421565383672716\n",
      "   -0.0001 if \n",
      "   +0.0000 if cp>=0.035459516569972045\n",
      "   +0.0000 if cp>=0.01904744114726782\n",
      "--------------\n",
      "   +6.6690 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.5655 if cp>=-0.0417468436062336\n",
      "   +9.8034 if \n",
      "   +3.5871 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.034106360375881196\n",
      "Run episode 881 with rewards 9.0\n",
      "============ 882 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cp<=0.06495516672730448\n",
      "   -0.0000 if cp<=0.09421565383672716\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp>=0.035459516569972045\n",
      "   +0.0000 if cp<=0.024991386756300926\n",
      "--------------\n",
      "  -16.3286 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -8.7518 if cp>=-0.0417468436062336\n",
      "  -24.0248 if \n",
      "   -8.8047 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.036584348231554036\n",
      "Run episode 882 with rewards 11.0\n",
      "============ 883 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp<=0.06495516672730448\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.035459516569972045\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +16.3286 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +8.7518 if cp>=-0.0417468436062336\n",
      "  +24.0248 if \n",
      "   +8.8047 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.11779003590345383\n",
      "Run episode 883 with rewards 10.0\n",
      "============ 884 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=0.06495516672730448\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.02976034507155419\n",
      "   +0.0000 if cp<=0.02976034507155419 & cp>=0.0031768660061061394\n",
      "--------------\n",
      "   -6.1923 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.7609 if cp>=-0.0417468436062336\n",
      "   -9.7866 if \n",
      "   -3.9620 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.06883824467658997\n",
      "Run episode 884 with rewards 9.0\n",
      "============ 885 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp<=0.06495516672730448\n",
      "   -0.0000 if cp<=0.09421565383672716\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp>=0.02976034507155419\n",
      "   +0.0000 if cp>=0.017314466834068308\n",
      "--------------\n",
      "   +6.1923 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.7609 if cp>=-0.0417468436062336\n",
      "   +9.7866 if \n",
      "   +3.9620 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.02815828062593937\n",
      "Run episode 885 with rewards 9.0\n",
      "============ 886 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=0.06495516672730448\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.02976034507155419\n",
      "   +0.0000 if cp<=0.0035026139579713454\n",
      "--------------\n",
      "  -15.0955 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -9.1906 if cp>=-0.0417468436062336\n",
      "  -23.8819 if \n",
      "   -9.6831 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.01780116148293018\n",
      "Run episode 886 with rewards 10.0\n",
      "============ 887 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp<=0.06495516672730448\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.02976034507155419\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +15.0955 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +9.1906 if cp>=-0.0417468436062336\n",
      "  +23.8819 if \n",
      "   +9.6831 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.040793775022029875 & cp>=-0.10755325257778167\n",
      "Run episode 887 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 888 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=0.06495516672730448\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if \n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.011722409166395664\n",
      "--------------\n",
      "   -5.7231 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.6286 if cp>=-0.0417468436062336\n",
      "   -9.2481 if \n",
      "   -3.8589 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.011722409166395664\n",
      "Run episode 888 with rewards 9.0\n",
      "============ 889 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0001 if cp<=0.06495516672730448\n",
      "   -0.0001 if cp<=0.09421565383672716\n",
      "   -0.0001 if \n",
      "   +0.0000 if cp>=-0.003936840780079356\n",
      "   +0.0000 if cp>=-0.003936840780079356\n",
      "--------------\n",
      "   +6.3384 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.3610 if cp>=-0.0417468436062336\n",
      "   +9.8121 if \n",
      "   +3.3774 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.0599286712706089\n",
      "Run episode 889 with rewards 10.0\n",
      "============ 890 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=0.06495516672730448\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.02810605689883233\n",
      "   +0.0000 if cp<=0.02810605689883233 & cp>=-0.00032611628994345596\n",
      "--------------\n",
      "  -15.3014 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -8.1646 if cp>=-0.0417468436062336\n",
      "  -23.7418 if \n",
      "   -8.2079 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.06902631223201752\n",
      "Run episode 890 with rewards 10.0\n",
      "============ 891 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp<=0.06495516672730448\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.02810605689883233\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +15.3014 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +8.1646 if cp>=-0.0417468436062336\n",
      "  +23.7418 if \n",
      "   +8.2079 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.04259990975260734\n",
      "Run episode 891 with rewards 9.0\n",
      "============ 892 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.02810605689883233\n",
      "   -0.0000 if cp<=0.0008125176886096615\n",
      "   +0.0000 if cp<=0.0008125176886096615\n",
      "--------------\n",
      "   -6.5323 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.4855 if cp>=-0.0417468436062336\n",
      "  -10.1355 if \n",
      "   -3.5040 if cp>=-0.011055708117783069\n",
      "   +1.0000 if pa>=-0.006689112633466721\n",
      "Run episode 892 with rewards 9.0\n",
      "============ 893 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp<=0.09421565383672716\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=0.02810605689883233\n",
      "   -0.0000 if cp>=-0.07977793514728546\n",
      "   +0.0000 if cp>=-0.04754561185836792\n",
      "--------------\n",
      "   +6.5323 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.4855 if cp>=-0.0417468436062336\n",
      "  +10.1355 if \n",
      "   +3.5040 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.07977793514728546\n",
      "Run episode 893 with rewards 10.0\n",
      "============ 894 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07977793514728546\n",
      "   +0.0000 if cp>=-0.04754561185836792\n",
      "   +0.0000 if cp>=0.14297698438167572\n",
      "--------------\n",
      "  -16.1036 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -8.6235 if cp>=-0.0417468436062336\n",
      "  -25.0176 if \n",
      "   -8.6690 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.05018402636051179\n",
      "Run episode 894 with rewards 9.0\n",
      "============ 895 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp<=0.09421565383672716\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07977793514728546\n",
      "   +0.0000 if cp>=-0.04754561185836792\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +16.1036 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +8.6235 if cp>=-0.0417468436062336\n",
      "  +25.0176 if \n",
      "   +8.6690 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.04067362993955612\n",
      "Run episode 895 with rewards 8.0\n",
      "============ 896 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07977793514728546\n",
      "   +0.0000 if cp>=-0.04754561185836792\n",
      "   -0.0000 if cp<=-0.02477074600756168\n",
      "   +0.0000 if cp>=0.015676871314644826\n",
      "--------------\n",
      "   -5.7761 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.7925 if cp>=-0.0417468436062336\n",
      "   -9.8212 if \n",
      "   -3.8546 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.03319260999560356\n",
      "Run episode 896 with rewards 8.0\n",
      "============ 897 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07977793514728546\n",
      "   +0.0000 if cp>=-0.04754561185836792\n",
      "   -0.0000 if cp<=-0.02477074600756168\n",
      "   +0.0000 if cp<=0.023303029313683513\n",
      "--------------\n",
      "   +5.7761 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.7925 if cp>=-0.0417468436062336\n",
      "   +9.8212 if \n",
      "   +3.8546 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.0392776444554329\n",
      "Run episode 897 with rewards 8.0\n",
      "============ 898 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07977793514728546\n",
      "   +0.0000 if cp>=-0.04754561185836792\n",
      "   +0.0000 if cp<=-0.02477074600756168\n",
      "   +0.0000 if cp<=0.0039769678376615075\n",
      "--------------\n",
      "  -13.9444 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -9.1790 if cp>=-0.0417468436062336\n",
      "  -23.7335 if \n",
      "   -9.3290 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.04662562981247903\n",
      "Run episode 898 with rewards 9.0\n",
      "============ 899 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.07977793514728546\n",
      "   +0.0000 if cp>=-0.04754561185836792\n",
      "   -0.0000 if cp<=0.0039769678376615075\n",
      "   +0.0000 if cp<=-0.10210026949644088\n",
      "--------------\n",
      "  +13.9444 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +9.1790 if cp>=-0.0417468436062336\n",
      "  +23.7335 if \n",
      "   +9.3290 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.10210026949644088\n",
      "Run episode 899 with rewards 9.0\n",
      "============ 900 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07977793514728546\n",
      "   -0.0000 if cp<=0.0039769678376615075\n",
      "   +0.0000 if cp<=-0.10210026949644088\n",
      "   +0.0000 if cp<=0.034863238781690606 & cp>=-0.031971486285328865\n",
      "--------------\n",
      "   -5.3822 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.5656 if cp>=-0.0417468436062336\n",
      "   -9.1880 if \n",
      "   -3.6340 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.01985575351864099\n",
      "Run episode 900 with rewards 10.0\n",
      "============ 901 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0001 if \n",
      "   -0.0000 if cp>=-0.07977793514728546\n",
      "   -0.0001 if cp<=0.0039769678376615075\n",
      "   +0.0000 if cp<=-0.10210026949644088\n",
      "   -0.0001 if cp<=-0.03701553866267204\n",
      "--------------\n",
      "   +6.2785 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.4645 if cp>=-0.0417468436062336\n",
      "   +9.5897 if \n",
      "   +3.3416 if cp>=-0.011055708117783069\n",
      "   +0.9905 if cp>=0.043911314010620116\n",
      "Run episode 901 with rewards 9.0\n",
      "============ 902 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.07977793514728546\n",
      "   -0.0000 if cp<=0.0039769678376615075\n",
      "   -0.0000 if cp<=-0.03701553866267204\n",
      "   +0.0000 if cp<=0.0654622070491314\n",
      "--------------\n",
      "  -15.0132 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -8.3236 if cp>=-0.0417468436062336\n",
      "  -22.9702 if \n",
      "   -8.0295 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.04310153648257256\n",
      "Run episode 902 with rewards 9.0\n",
      "============ 903 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07977793514728546\n",
      "   +0.0000 if cp<=0.0039769678376615075\n",
      "   +0.0000 if cp<=0.0654622070491314\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +15.0132 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +8.3236 if cp>=-0.0417468436062336\n",
      "  +22.9702 if \n",
      "   +8.0295 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.04149352014064789 & cp>=-0.10251039713621139\n",
      "Run episode 903 with rewards 9.0\n",
      "============ 904 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.07977793514728546\n",
      "   -0.0000 if cp<=0.0654622070491314\n",
      "   +0.0000 if cp<=0.09619892239570618\n",
      "   +0.0000 if cp<=0.09619892239570618 & cp>=0.02830362394452095\n",
      "--------------\n",
      "   -5.8560 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.5654 if cp>=-0.0417468436062336\n",
      "   -9.2784 if \n",
      "   -3.4507 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.04076817706227303\n",
      "Run episode 904 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 905 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.07977793514728546\n",
      "   -0.0000 if cp<=0.0654622070491314\n",
      "   -0.0000 if cp<=0.09619892239570618\n",
      "   -0.0000 if cp<=-0.015515549667179582\n",
      "--------------\n",
      "   +6.2451 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.5479 if cp>=-0.0417468436062336\n",
      "   +9.4905 if \n",
      "   +3.2940 if cp>=-0.011055708117783069\n",
      "   +0.9867 if cp>=0.01761370338499546\n",
      "Run episode 905 with rewards 9.0\n",
      "============ 906 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.0654622070491314\n",
      "   +0.0000 if cp<=0.09619892239570618\n",
      "   -0.0000 if cp<=-0.015515549667179582\n",
      "   +0.0000 if cp>=0.035114061087369926\n",
      "--------------\n",
      "  -14.8631 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -8.5004 if cp>=-0.0417468436062336\n",
      "  -22.6469 if \n",
      "   -7.8994 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.017438083328306674\n",
      "Run episode 906 with rewards 10.0\n",
      "============ 907 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.0654622070491314\n",
      "   -0.0000 if cp<=0.09619892239570618\n",
      "   -0.0000 if cp<=-0.015515549667179582\n",
      "   +0.0000 if cp>=0.04220550432801247\n",
      "--------------\n",
      "  +14.8631 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +8.5004 if cp>=-0.0417468436062336\n",
      "  +22.6469 if \n",
      "   +7.8994 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.04220550432801247\n",
      "Run episode 907 with rewards 10.0\n",
      "============ 908 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=0.0654622070491314\n",
      "   +0.0000 if cp<=0.09619892239570618\n",
      "   -0.0000 if cp<=-0.015515549667179582\n",
      "   +0.0000 if cp>=0.04220550432801247\n",
      "   +0.0000 if cp>=0.0220481712371111\n",
      "--------------\n",
      "   -6.5425 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.7417 if cp>=-0.0417468436062336\n",
      "   -9.9687 if \n",
      "   -3.4772 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.007315804250538348\n",
      "Run episode 908 with rewards 8.0\n",
      "============ 909 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp<=0.0654622070491314\n",
      "   -0.0000 if cp<=0.09619892239570618\n",
      "   -0.0000 if cp<=-0.015515549667179582\n",
      "   -0.0000 if cp>=0.04220550432801247\n",
      "   +0.0000 if cp>=0.0011502198991365814\n",
      "--------------\n",
      "   +6.5425 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.7417 if cp>=-0.0417468436062336\n",
      "   +9.9687 if \n",
      "   +3.4772 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.009617019072175027\n",
      "Run episode 909 with rewards 10.0\n",
      "============ 910 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cp<=0.0654622070491314\n",
      "   -0.0000 if cp<=0.09619892239570618\n",
      "   -0.0000 if cp<=-0.015515549667179582\n",
      "   +0.0000 if cp>=0.0011502198991365814\n",
      "   +0.0000 if cp>=0.133489727973938\n",
      "--------------\n",
      "  -16.0827 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -9.2141 if cp>=-0.0417468436062336\n",
      "  -24.5214 if \n",
      "   -8.5638 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.06265927851200104\n",
      "Run episode 910 with rewards 10.0\n",
      "============ 911 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp<=0.0654622070491314\n",
      "   +0.0000 if cp<=0.09619892239570618\n",
      "   +0.0000 if cp>=0.0011502198991365814\n",
      "   +0.0000 if cp>=0.133489727973938\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +16.0827 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +9.2141 if cp>=-0.0417468436062336\n",
      "  +24.5214 if \n",
      "   +8.5638 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.038640872389078144\n",
      "Run episode 911 with rewards 9.0\n",
      "============ 912 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cp<=0.0654622070491314\n",
      "   -0.0000 if cp<=0.09619892239570618\n",
      "   +0.0000 if cp>=0.0011502198991365814\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.1103552281856537\n",
      "--------------\n",
      "   -6.1490 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.5229 if cp>=-0.0417468436062336\n",
      "   -9.3755 if \n",
      "   -3.2743 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.055235907435417175\n",
      "Run episode 912 with rewards 10.0\n",
      "============ 913 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp<=0.0654622070491314\n",
      "   -0.0000 if cp<=0.09619892239570618\n",
      "   +0.0000 if cp>=0.0011502198991365814\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.005304522626101971 & cp>=-0.04080380126833916\n",
      "--------------\n",
      "   +6.6635 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.0676 if cp>=-0.0417468436062336\n",
      "   +9.8501 if \n",
      "   +2.7240 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.08261779993772507\n",
      "Run episode 913 with rewards 9.0\n",
      "============ 914 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=0.0654622070491314\n",
      "   +0.0000 if cp<=0.09619892239570618\n",
      "   +0.0000 if cp>=0.0011502198991365814\n",
      "   +0.0000 if \n",
      "   +0.0000 if \n",
      "--------------\n",
      "  -16.0597 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -7.4740 if cp>=-0.0417468436062336\n",
      "  -23.8209 if \n",
      "   -6.6459 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.04308824203908444\n",
      "Run episode 914 with rewards 9.0\n",
      "============ 915 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp<=0.09619892239570618\n",
      "   +0.0000 if cp>=0.0011502198991365814\n",
      "   +0.0000 if \n",
      "   -0.0000 if \n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +16.0597 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +7.4740 if cp>=-0.0417468436062336\n",
      "  +23.8209 if \n",
      "   +6.6459 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.019971834495663643\n",
      "Run episode 915 with rewards 10.0\n",
      "============ 916 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=0.0011502198991365814\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.049646385014057166\n",
      "   +0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   +0.0000 if cp<=0.049646385014057166\n",
      "--------------\n",
      "  -16.2724 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -8.7159 if cp>=-0.0417468436062336\n",
      "  -25.9469 if \n",
      "   -7.8430 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "Run episode 916 with rewards 10.0\n",
      "============ 917 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=0.0011502198991365814\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   +0.0000 if \n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +16.2724 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +8.7159 if cp>=-0.0417468436062336\n",
      "  +25.9469 if \n",
      "   +7.8430 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.02628929950296879\n",
      "Run episode 917 with rewards 10.0\n",
      "============ 918 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   +0.0000 if cp>=0.020215270482003694\n",
      "   +0.0000 if cp>=0.06228298842906953\n",
      "   +0.0000 if cp>=0.11687477678060532\n",
      "--------------\n",
      "   -6.5524 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.5096 if cp>=-0.0417468436062336\n",
      "  -10.4479 if \n",
      "   -3.1581 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.009357788600027561\n",
      "Run episode 918 with rewards 10.0\n",
      "============ 919 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   +0.0000 if cp>=0.020215270482003694\n",
      "   +0.0000 if cp>=0.06228298842906953\n",
      "   +0.0000 if cp<=-0.06868215501308442\n",
      "--------------\n",
      "   +6.5524 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.5096 if cp>=-0.0417468436062336\n",
      "  +10.4479 if \n",
      "   +3.1581 if cp>=-0.011055708117783069\n",
      "   +1.0000 if pa>=0.1828460395336151\n",
      "Run episode 919 with rewards 10.0\n",
      "origin 1.3945485023831947e-05 new 1.3945486780414235e-05 not updated\n",
      "============ 920 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   +0.0000 if cp>=0.020215270482003694\n",
      "   +0.0000 if cp>=0.06228298842906953\n",
      "   +0.0000 if cp<=-0.06868215501308442\n",
      "--------------\n",
      "  -16.2842 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -8.7501 if cp>=-0.0417468436062336\n",
      "  -25.9952 if \n",
      "   -7.8779 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.07108138501644135\n",
      "Run episode 920 with rewards 10.0\n",
      "============ 921 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   +0.0000 if cp>=0.020215270482003694\n",
      "   +0.0000 if cp<=-0.06868215501308442\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +16.2842 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +8.7501 if cp>=-0.0417468436062336\n",
      "  +25.9952 if \n",
      "   +7.8779 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.09693067520856857\n",
      "Run episode 921 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 922 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   +0.0000 if cp<=-0.06868215501308442\n",
      "   +0.0000 if cp>=-0.0024803904816508185\n",
      "   +0.0000 if cp>=0.07077031582593918\n",
      "--------------\n",
      "   -5.5051 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.7035 if cp>=-0.0417468436062336\n",
      "   -9.8035 if \n",
      "   -3.6500 if cp>=-0.011055708117783069\n",
      "   +0.9458 if cp<=0.029440216347575196 & cp>=-0.0024803904816508185\n",
      "Run episode 922 with rewards 9.0\n",
      "============ 923 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   +0.0000 if cp>=-0.0024803904816508185\n",
      "   +0.0000 if cp>=0.07077031582593918\n",
      "   +0.0000 if cp<=-0.04920747950673103\n",
      "--------------\n",
      "   +6.1562 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.2181 if cp>=-0.0417468436062336\n",
      "  +10.3839 if \n",
      "   +3.5901 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.07978708893060685\n",
      "Run episode 923 with rewards 9.0\n",
      "============ 924 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   +0.0000 if cp>=-0.0024803904816508185\n",
      "   -0.0000 if cp<=-0.04920747950673103\n",
      "   +0.0000 if cp>=0.13205553591251373\n",
      "--------------\n",
      "  -15.1528 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -7.9385 if cp>=-0.0417468436062336\n",
      "  -25.5765 if \n",
      "   -8.8540 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.03706912621855736\n",
      "Run episode 924 with rewards 9.0\n",
      "============ 925 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   +0.0000 if cp>=-0.0024803904816508185\n",
      "   +0.0000 if cp>=0.13205553591251373\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +15.1528 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +7.9385 if cp>=-0.0417468436062336\n",
      "  +25.5765 if \n",
      "   +8.8540 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.07968364655971527\n",
      "Run episode 925 with rewards 8.0\n",
      "============ 926 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   +0.0000 if cp>=-0.0024803904816508185\n",
      "   +0.0000 if cp<=-0.021152627840638143 & cp>=-0.037670196592807764\n",
      "   +0.0000 if cp<=-0.021152627840638143 & cp>=-0.037670196592807764\n",
      "--------------\n",
      "   -5.4604 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.7517 if cp>=-0.0417468436062336\n",
      "  -10.0944 if \n",
      "   -3.9520 if cp>=-0.011055708117783069\n",
      "   +0.9478 if cp>=0.03460865840315819\n",
      "Run episode 926 with rewards 10.0\n",
      "============ 927 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   -0.0000 if cp<=-0.021152627840638143 & cp>=-0.037670196592807764\n",
      "   -0.0000 if cp<=-0.041491083800792694\n",
      "   +0.0000 if pa>=0.20019814372062683\n",
      "--------------\n",
      "   +5.7774 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.7110 if cp>=-0.0417468436062336\n",
      "  +10.2292 if \n",
      "   +3.7971 if cp>=-0.011055708117783069\n",
      "   +0.9988 if cp>=0.03752316609025001\n",
      "Run episode 927 with rewards 9.0\n",
      "============ 928 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   -0.0000 if cp<=-0.021152627840638143 & cp>=-0.037670196592807764\n",
      "   -0.0000 if cp<=-0.041491083800792694\n",
      "   +0.0000 if cp>=0.024540945142507552\n",
      "--------------\n",
      "  -14.1467 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -9.1010 if cp>=-0.0417468436062336\n",
      "  -25.0616 if \n",
      "   -9.3118 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.03429219126701355\n",
      "Run episode 928 with rewards 10.0\n",
      "============ 929 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   +0.0000 if cp<=-0.041491083800792694\n",
      "   +0.0000 if cp>=0.024540945142507552\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +14.1467 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +9.1010 if cp>=-0.0417468436062336\n",
      "  +25.0616 if \n",
      "   +9.3118 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.046165012568235395\n",
      "Run episode 929 with rewards 10.0\n",
      "============ 930 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   +0.0000 if cp>=0.024540945142507552\n",
      "   +0.0000 if cp>=0.07787436544895172\n",
      "   +0.0000 if cp>=0.13032735884189606\n",
      "--------------\n",
      "   -5.1108 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.8055 if cp>=-0.0417468436062336\n",
      "   -9.8941 if \n",
      "   -3.8859 if cp>=-0.011055708117783069\n",
      "   +0.8823 if cp<=0.07787436544895172 & cp>=-0.004348193202167749\n",
      "Run episode 930 with rewards 10.0\n",
      "============ 931 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.09039678573608399 & cp>=0.005609903670847416\n",
      "   +0.0000 if cp>=0.024540945142507552\n",
      "   +0.0000 if cp>=0.07787436544895172\n",
      "   +0.0000 if cp<=-0.06525699570775031\n",
      "--------------\n",
      "   +5.8487 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +2.9739 if cp>=-0.0417468436062336\n",
      "  +10.5444 if \n",
      "   +3.8148 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.03744562268257141 & cp>=-0.10557414889335633\n",
      "Run episode 931 with rewards 9.0\n",
      "============ 932 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.024540945142507552\n",
      "   +0.0000 if cp>=0.07787436544895172\n",
      "   -0.0000 if cp<=-0.06525699570775031\n",
      "   +0.0000 if cp>=0.03826398439705373\n",
      "--------------\n",
      "  -14.3910 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -7.3421 if cp>=-0.0417468436062336\n",
      "  -25.9700 if \n",
      "   -9.4111 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.03826398439705373\n",
      "Run episode 932 with rewards 11.0\n",
      "============ 933 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.024540945142507552\n",
      "   +0.0000 if cp>=0.07787436544895172\n",
      "   +0.0000 if cp>=0.03826398439705373\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +14.3910 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +7.3421 if cp>=-0.0417468436062336\n",
      "  +25.9700 if \n",
      "   +9.4111 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.12556499242782593\n",
      "Run episode 933 with rewards 9.0\n",
      "============ 934 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.024540945142507552\n",
      "   +0.0000 if cp>=0.07787436544895172\n",
      "   -0.0000 if cp<=0.052323675155639654\n",
      "   +0.0000 if cp<=0.052323675155639654\n",
      "--------------\n",
      "   -5.2337 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -2.9394 if cp>=-0.0417468436062336\n",
      "   -9.7139 if \n",
      "   -3.6918 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.052323675155639654\n",
      "Run episode 934 with rewards 9.0\n",
      "============ 935 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp>=0.024540945142507552\n",
      "   -0.0000 if cp>=0.07787436544895172\n",
      "   -0.0001 if cp<=0.052323675155639654\n",
      "   -0.0000 if cp<=-0.06055009961128235\n",
      "   -0.0001 if cp<=-0.02908329218626022\n",
      "--------------\n",
      "   +5.8388 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +2.6397 if cp>=-0.0417468436062336\n",
      "  +10.2505 if \n",
      "   +3.1719 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.06055009961128235\n",
      "Run episode 935 with rewards 10.0\n",
      "============ 936 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=0.07787436544895172\n",
      "   -0.0000 if cp<=0.052323675155639654\n",
      "   -0.0000 if cp<=-0.06055009961128235\n",
      "   -0.0000 if cp<=-0.02908329218626022\n",
      "   +0.0000 if cp>=0.13375325798988344\n",
      "--------------\n",
      "  -14.0113 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -6.3761 if cp>=-0.0417468436062336\n",
      "  -24.6398 if \n",
      "   -7.6534 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.0660781905055046\n",
      "Run episode 936 with rewards 8.0\n",
      "============ 937 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=0.07787436544895172\n",
      "   +0.0000 if cp<=0.052323675155639654\n",
      "   +0.0000 if cp<=-0.02908329218626022\n",
      "   +0.0000 if cp>=0.13375325798988344\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +14.0113 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +6.3761 if cp>=-0.0417468436062336\n",
      "  +24.6398 if \n",
      "   +7.6534 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.06855656504631043\n",
      "Run episode 937 with rewards 9.0\n",
      "============ 938 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=0.07787436544895172\n",
      "   +0.0000 if cp<=0.052323675155639654\n",
      "   +0.0000 if cp>=0.13375325798988344\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.013526160269975664\n",
      "--------------\n",
      "   -5.6047 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.0797 if cp>=-0.0417468436062336\n",
      "  -10.6749 if \n",
      "   -3.6109 if cp>=-0.011055708117783069\n",
      "   +0.9390 if cp<=0.06580120474100114 & cp>=0.0028154776431620126\n",
      "Run episode 938 with rewards 10.0\n",
      "origin 1.3602740831729954e-05 new 1.3602741165713404e-05 not updated\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 939 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=0.07787436544895172\n",
      "   +0.0000 if cp<=0.052323675155639654\n",
      "   +0.0000 if cp>=0.13375325798988344\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.013526160269975664\n",
      "--------------\n",
      "   +5.6047 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.0797 if cp>=-0.0417468436062336\n",
      "  +10.6749 if \n",
      "   +3.6109 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.03832313343882561\n",
      "Run episode 939 with rewards 10.0\n",
      "origin 1.3790736457273445e-05 new 1.3790736612702304e-05 not updated\n",
      "============ 940 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=0.07787436544895172\n",
      "   +0.0000 if cp<=0.052323675155639654\n",
      "   +0.0000 if cp>=0.13375325798988344\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.013526160269975664\n",
      "--------------\n",
      "  -13.7676 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -7.5791 if cp>=-0.0417468436062336\n",
      "  -26.2363 if \n",
      "   -8.8838 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.03262781873345375\n",
      "Run episode 940 with rewards 9.0\n",
      "============ 941 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=0.07787436544895172\n",
      "   +0.0000 if cp<=0.052323675155639654\n",
      "   +0.0000 if cp>=0.13375325798988344\n",
      "   +0.0000 if \n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +13.7676 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +7.5791 if cp>=-0.0417468436062336\n",
      "  +26.2363 if \n",
      "   +8.8838 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.041728127747774124\n",
      "Run episode 941 with rewards 9.0\n",
      "============ 942 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=0.07787436544895172\n",
      "   -0.0000 if cp<=0.052323675155639654\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.023248720541596414\n",
      "   +0.0000 if cp>=0.03365621119737625\n",
      "--------------\n",
      "   -5.1041 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -2.8972 if cp>=-0.0417468436062336\n",
      "   -9.8140 if \n",
      "   -3.3809 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.03365621119737625\n",
      "Run episode 942 with rewards 10.0\n",
      "============ 943 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=0.07787436544895172\n",
      "   -0.0001 if cp<=0.052323675155639654\n",
      "   -0.0001 if \n",
      "   +0.0000 if cp>=0.023248720541596414\n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "--------------\n",
      "   +5.7494 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +2.3897 if cp>=-0.0417468436062336\n",
      "  +10.3823 if \n",
      "   +3.3256 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.04288899749517441 & cp>=-0.12402833402156829\n",
      "Run episode 943 with rewards 10.0\n",
      "============ 944 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp<=0.052323675155639654\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.023248720541596414\n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp<=0.07551568001508713\n",
      "--------------\n",
      "  -13.8316 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -5.8148 if cp>=-0.0417468436062336\n",
      "  -25.0525 if \n",
      "   -8.0743 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.07551568001508713\n",
      "Run episode 944 with rewards 9.0\n",
      "============ 945 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp<=0.052323675155639654\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.023248720541596414\n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +13.8316 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +5.8148 if cp>=-0.0417468436062336\n",
      "  +25.0525 if \n",
      "   +8.0743 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.08664461523294449\n",
      "Run episode 945 with rewards 10.0\n",
      "============ 946 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.023248720541596414\n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=0.07026785910129547\n",
      "   +0.0000 if cp>=0.030876000225543983\n",
      "--------------\n",
      "   -5.0855 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -2.8433 if cp>=-0.0417468436062336\n",
      "  -10.5304 if \n",
      "   -4.0632 if cp>=-0.011055708117783069\n",
      "   +1.0093 if cp<=0.07026785910129547\n",
      "Run episode 946 with rewards 9.0\n",
      "============ 947 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp>=0.023248720541596414\n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=0.07026785910129547\n",
      "   +0.0000 if cp>=-0.027729899063706397\n",
      "--------------\n",
      "   +5.0855 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +2.8433 if cp>=-0.0417468436062336\n",
      "  +10.5304 if \n",
      "   +4.0632 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.03465619832277298\n",
      "Run episode 947 with rewards 10.0\n",
      "============ 948 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=0.023248720541596414\n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.027729899063706397\n",
      "   +0.0000 if cp<=0.06422427147626877\n",
      "--------------\n",
      "  -12.3348 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -6.9127 if cp>=-0.0417468436062336\n",
      "  -25.5576 if \n",
      "   -9.8715 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.06422427147626877\n",
      "Run episode 948 with rewards 9.0\n",
      "============ 949 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.023248720541596414\n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=-0.027729899063706397\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +12.3348 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +6.9127 if cp>=-0.0417468436062336\n",
      "  +25.5576 if \n",
      "   +9.8715 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.03584125190973282\n",
      "Run episode 949 with rewards 8.0\n",
      "============ 950 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=-0.027729899063706397\n",
      "   -0.0000 if cp<=-0.0021090394468046706\n",
      "   +0.0000 if cp>=0.03744957298040391\n",
      "--------------\n",
      "   -4.7094 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -2.8110 if cp>=-0.0417468436062336\n",
      "   -9.9847 if \n",
      "   -3.9910 if cp>=-0.011055708117783069\n",
      "   +0.9745 if cp<=0.03744957298040391\n",
      "Run episode 950 with rewards 10.0\n",
      "============ 951 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0001 if \n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=-0.027729899063706397\n",
      "   -0.0001 if cp<=-0.0021090394468046706\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "--------------\n",
      "   +5.7637 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +1.7385 if cp>=-0.0417468436062336\n",
      "  +10.9102 if \n",
      "   +3.8936 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.04901122227311134 & cp>=-0.12081197798252105\n",
      "Run episode 951 with rewards 10.0\n",
      "============ 952 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp<=-0.0021090394468046706\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if cp<=0.02725728154182435\n",
      "--------------\n",
      "  -14.2192 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -4.3276 if cp>=-0.0417468436062336\n",
      "  -26.9638 if \n",
      "   -9.6524 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.06906987130641938\n",
      "Run episode 952 with rewards 8.0\n",
      "============ 953 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp<=-0.0021090394468046706\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +14.2192 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +4.3276 if cp>=-0.0417468436062336\n",
      "  +26.9638 if \n",
      "   +9.6524 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.03652787283062935\n",
      "Run episode 953 with rewards 9.0\n",
      "============ 954 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.0017773238767404128\n",
      "   +0.0000 if cp<=0.0017773238767404128\n",
      "--------------\n",
      "   -5.7339 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -1.7950 if cp>=-0.0417468436062336\n",
      "  -10.9547 if \n",
      "   -3.9579 if cp>=-0.011055708117783069\n",
      "   +1.0000 if pa>=-0.009421331807971\n",
      "Run episode 954 with rewards 10.0\n",
      "============ 955 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=-0.03349980637431144\n",
      "   +0.0000 if cp<=-0.007097758539021011 & cp>=-0.03349980637431144\n",
      "--------------\n",
      "   +5.7339 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +1.7950 if cp>=-0.0417468436062336\n",
      "  +10.9547 if \n",
      "   +3.9579 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.07238788157701492\n",
      "Run episode 955 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 956 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if cp<=-0.03349980637431144\n",
      "   +0.0000 if cp<=0.05884182304143906\n",
      "--------------\n",
      "  -14.1856 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -4.4634 if cp>=-0.0417468436062336\n",
      "  -27.1246 if \n",
      "   -9.8146 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.05884182304143906\n",
      "Run episode 956 with rewards 10.0\n",
      "============ 957 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if cp<=0.05884182304143906\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +14.1856 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +4.4634 if cp>=-0.0417468436062336\n",
      "  +27.1246 if \n",
      "   +9.8146 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.04629026651382446 & cp>=-0.11172670125961304\n",
      "Run episode 957 with rewards 11.0\n",
      "============ 958 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.052884843200445175\n",
      "   +0.0000 if pa>=0.017271123826503768\n",
      "--------------\n",
      "   -5.5898 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -1.7588 if cp>=-0.0417468436062336\n",
      "  -10.6885 if \n",
      "   -3.8675 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.052884843200445175\n",
      "Run episode 958 with rewards 11.0\n",
      "origin 1.0618052361034422e-05 new 1.0618057960999538e-05 not updated\n",
      "============ 959 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.052884843200445175\n",
      "   +0.0000 if pa>=0.017271123826503768\n",
      "--------------\n",
      "  +23.1097 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -6.8926 if cp>=-0.0417468436062336\n",
      "  +17.1096 if \n",
      "   -6.7975 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.026223866268992424 & cp>=-0.07688234001398087\n",
      "Run episode 959 with rewards 9.0\n",
      "============ 960 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "  +11.4971 if \n",
      "  +11.4971 if cp>=-0.08445569425821305\n",
      "  +11.4971 if cp>=-0.12081197798252105\n",
      "   +6.6670 if cp<=0.052884843200445175\n",
      "   +1.0000 if cp<=-0.03007323816418648\n",
      "--------------\n",
      "  -15.7168 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -4.6876 if cp>=-0.0417468436062336\n",
      "  -11.6361 if \n",
      "   -4.6229 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-5.8554857969273476e-05\n",
      "Run episode 960 with rewards 10.0\n",
      "============ 961 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.052884843200445175\n",
      "   +0.0000 if cp<=-0.024724196270108224\n",
      "--------------\n",
      "  +20.4651 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +4.0473 if cp>=-0.0417468436062336\n",
      "  +16.9413 if \n",
      "   +3.9920 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.038469403982162476 & cp>=-0.10372947454452515\n",
      "Run episode 961 with rewards 9.0\n",
      "origin 1.627797241392732e-05 new 1.6277972413927924e-05 not updated\n",
      "============ 962 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.052884843200445175\n",
      "   +0.0000 if cp<=-0.024724196270108224\n",
      "--------------\n",
      "  -15.8651 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -4.5149 if cp>=-0.0417468436062336\n",
      "  -14.9070 if \n",
      "   -4.4703 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.0406044788658619\n",
      "Run episode 962 with rewards 10.0\n",
      "============ 963 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.052884843200445175\n",
      "   +0.0000 if cp<=-0.030108211934566496\n",
      "--------------\n",
      "  +15.8651 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +4.5149 if cp>=-0.0417468436062336\n",
      "  +14.9070 if \n",
      "   +4.4703 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.044464156031608575 & cp>=-0.1109386146068573\n",
      "Run episode 963 with rewards 10.0\n",
      "origin 1.5028776328157154e-05 new 1.5028776328160728e-05 not updated\n",
      "============ 964 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.052884843200445175\n",
      "   +0.0000 if cp<=-0.030108211934566496\n",
      "--------------\n",
      "  -12.3559 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.5162 if cp>=-0.0417468436062336\n",
      "  -11.6096 if \n",
      "   -3.4815 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.03794231787323952\n",
      "Run episode 964 with rewards 9.0\n",
      "============ 965 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if cp<=0.052884843200445175\n",
      "   +0.0000 if cp<=-0.028475760295987126\n",
      "--------------\n",
      "  +12.3559 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.5162 if cp>=-0.0417468436062336\n",
      "  +11.6096 if \n",
      "   +3.4815 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.035057643055915834\n",
      "Run episode 965 with rewards 9.0\n",
      "============ 966 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if cp<=0.052884843200445175\n",
      "   +0.0000 if cp<=-0.031001512706279752\n",
      "--------------\n",
      "  -10.8369 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.3035 if cp>=-0.0417468436062336\n",
      "  -10.3813 if \n",
      "   -3.2719 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.031001512706279752\n",
      "Run episode 966 with rewards 9.0\n",
      "============ 967 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.052884843200445175\n",
      "   +0.0000 if cp<=0.005657285358756782\n",
      "--------------\n",
      "  +10.8369 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.3035 if cp>=-0.0417468436062336\n",
      "  +10.3813 if \n",
      "   +3.2719 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.058768171817064285\n",
      "Run episode 967 with rewards 9.0\n",
      "============ 968 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if cp<=0.052884843200445175\n",
      "   +0.0000 if cp<=0.026709198206663134\n",
      "--------------\n",
      "   -9.9824 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.4562 if cp>=-0.0417468436062336\n",
      "  -10.0771 if \n",
      "   -3.4267 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.048956332355737694\n",
      "Run episode 968 with rewards 8.0\n",
      "============ 969 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.052884843200445175\n",
      "   +0.0000 if cp>=0.0019266627263277779\n",
      "--------------\n",
      "   +9.9824 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.4562 if cp>=-0.0417468436062336\n",
      "  +10.0771 if \n",
      "   +3.4267 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.0019266627263277779\n",
      "Run episode 969 with rewards 9.0\n",
      "============ 970 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.052884843200445175\n",
      "   +0.0000 if cp<=0.047785384207963945\n",
      "--------------\n",
      "   -9.4295 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.3305 if cp>=-0.0417468436062336\n",
      "   -9.5847 if \n",
      "   -3.3026 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.047785384207963945\n",
      "Run episode 970 with rewards 9.0\n",
      "============ 971 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.052884843200445175\n",
      "   +0.0000 if cp<=-0.06879594847559929\n",
      "--------------\n",
      "   +9.4295 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.3305 if cp>=-0.0417468436062336\n",
      "   +9.5847 if \n",
      "   +3.3026 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.1018165871500969\n",
      "Run episode 971 with rewards 10.0\n",
      "============ 972 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if cp<=0.052884843200445175\n",
      "   +0.0000 if cp<=0.006780007667839528\n",
      "--------------\n",
      "  -24.4744 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -8.6785 if cp>=-0.0417468436062336\n",
      "  -24.9115 if \n",
      "   -8.6063 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.07484680265188218\n",
      "Run episode 972 with rewards 9.0\n",
      "============ 973 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if cp<=0.052884843200445175\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +24.4744 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +8.6785 if cp>=-0.0417468436062336\n",
      "  +24.9115 if \n",
      "   +8.6063 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.09443235993385315\n",
      "Run episode 973 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 974 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.0361582413315773\n",
      "   +0.0000 if cp<=0.0361582413315773\n",
      "--------------\n",
      "  -11.5571 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -5.3298 if cp>=-0.0417468436062336\n",
      "  -12.9952 if \n",
      "   -5.2957 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.0361582413315773\n",
      "Run episode 974 with rewards 10.0\n",
      "origin 1.3400960409629748e-05 new 1.3400960410224367e-05 not updated\n",
      "============ 975 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.0361582413315773\n",
      "   +0.0000 if cp<=0.0361582413315773\n",
      "--------------\n",
      "  +11.5571 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +5.3298 if cp>=-0.0417468436062336\n",
      "  +12.9952 if \n",
      "   +5.2957 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.04520869627594948\n",
      "Run episode 975 with rewards 9.0\n",
      "origin 1.645172134984259e-05 new 1.645172134984498e-05 not updated\n",
      "============ 976 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.0361582413315773\n",
      "   +0.0000 if cp<=0.0361582413315773\n",
      "--------------\n",
      "   -9.7870 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -4.5135 if cp>=-0.0417468436062336\n",
      "  -11.0049 if \n",
      "   -4.4847 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.04821448698639871\n",
      "Run episode 976 with rewards 10.0\n",
      "============ 977 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.0361582413315773\n",
      "   -0.0000 if cp<=-0.0518541119992733\n",
      "   +0.0000 if pa>=0.20420466363430023\n",
      "--------------\n",
      "   +9.7870 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +4.5135 if cp>=-0.0417468436062336\n",
      "  +11.0049 if \n",
      "   +4.4847 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.09580563753843307\n",
      "Run episode 977 with rewards 10.0\n",
      "============ 978 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if cp<=0.0361582413315773\n",
      "   +0.0000 if cp<=-0.0518541119992733\n",
      "   +0.0000 if cp<=0.08769316822290421\n",
      "--------------\n",
      "   -8.5276 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.9331 if cp>=-0.0417468436062336\n",
      "   -9.5891 if \n",
      "   -3.9079 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.058565668761730194\n",
      "Run episode 978 with rewards 10.0\n",
      "============ 979 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=-0.0518541119992733\n",
      "   -0.0000 if cp<=0.08769316822290421\n",
      "   +0.0000 if cp<=-0.014376525580883022\n",
      "--------------\n",
      "   +8.5276 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.9331 if cp>=-0.0417468436062336\n",
      "   +9.5891 if \n",
      "   +3.9079 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.0854839488863945\n",
      "Run episode 979 with rewards 8.0\n",
      "============ 980 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if cp<=-0.0518541119992733\n",
      "   +0.0000 if cp<=0.08769316822290421\n",
      "   +0.0000 if cp<=0.005957419984042646\n",
      "--------------\n",
      "  -21.9099 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  -10.1181 if cp>=-0.0417468436062336\n",
      "  -24.6501 if \n",
      "  -10.0535 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.04439392089843751\n",
      "Run episode 980 with rewards 9.0\n",
      "============ 981 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=-0.08445569425821305\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if cp<=0.08769316822290421\n",
      "   +0.0000 if cp<=0.005957419984042646\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +21.9099 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "  +10.1181 if cp>=-0.0417468436062336\n",
      "  +24.6501 if \n",
      "  +10.0535 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.047439257800579074\n",
      "Run episode 981 with rewards 10.0\n",
      "============ 982 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.08769316822290421\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp<=0.09892480224370957\n",
      "--------------\n",
      "   -7.3133 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.7944 if cp>=-0.0417468436062336\n",
      "   -8.6451 if \n",
      "   -3.7729 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.06955996304750442\n",
      "Run episode 982 with rewards 9.0\n",
      "============ 983 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp>=-0.08445569425821305\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if cp<=0.08769316822290421\n",
      "   -0.0000 if \n",
      "   +0.0000 if \n",
      "--------------\n",
      "   +7.4370 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.6863 if cp>=-0.0417468436062336\n",
      "   +8.7645 if \n",
      "   +3.7607 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.09200784713029861\n",
      "Run episode 983 with rewards 9.0\n",
      "============ 984 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if cp<=0.08769316822290421\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.13233260810375214\n",
      "   +0.0000 if cp>=0.09074382334947587\n",
      "--------------\n",
      "  -17.9838 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -8.9508 if cp>=-0.0417468436062336\n",
      "  -21.2306 if \n",
      "   -9.1306 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.036579555273056036\n",
      "Run episode 984 with rewards 9.0\n",
      "============ 985 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if cp<=0.08769316822290421\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp>=0.13233260810375214\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +17.9838 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +8.9508 if cp>=-0.0417468436062336\n",
      "  +21.2306 if \n",
      "   +9.1306 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.02736170366406441\n",
      "Run episode 985 with rewards 9.0\n",
      "============ 986 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp>=0.13233260810375214\n",
      "   -0.0000 if cp<=0.00343504697084428\n",
      "   +0.0000 if cp<=0.03609177954494954\n",
      "--------------\n",
      "   -6.4793 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.8756 if cp>=-0.0417468436062336\n",
      "   -8.3946 if \n",
      "   -4.2576 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.01905557960271835\n",
      "Run episode 986 with rewards 10.0\n",
      "============ 987 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if \n",
      "   +0.0000 if cp>=0.13233260810375214\n",
      "   -0.0000 if cp<=0.00343504697084428\n",
      "   -0.0000 if cp<=-0.04474673569202423\n",
      "--------------\n",
      "   +7.3059 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.7824 if cp>=-0.0417468436062336\n",
      "   +8.7819 if \n",
      "   +3.8601 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.04000912606716156\n",
      "Run episode 987 with rewards 10.0\n",
      "============ 988 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp<=0.00343504697084428\n",
      "   +0.0000 if cp<=-0.04474673569202423\n",
      "   +0.0000 if cp<=0.07148492634296418 & cp>=-0.014466169103980065\n",
      "--------------\n",
      "  -17.6585 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -9.1951 if cp>=-0.0417468436062336\n",
      "  -21.2809 if \n",
      "   -9.3857 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.07148492634296418\n",
      "Run episode 988 with rewards 10.0\n",
      "============ 989 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.00343504697084428\n",
      "   +0.0000 if cp<=0.07148492634296418 & cp>=-0.014466169103980065\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +17.6585 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +9.1951 if cp>=-0.0417468436062336\n",
      "  +21.2809 if \n",
      "   +9.3857 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.08512559980154037\n",
      "Run episode 989 with rewards 9.0\n",
      "============ 990 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp<=0.00343504697084428\n",
      "   +0.0000 if cp<=0.03274189643561841\n",
      "   +0.0000 if cp<=0.03274189643561841 & cp>=-0.028807778283953665\n",
      "--------------\n",
      "   -7.4836 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.8968 if cp>=-0.0417468436062336\n",
      "   -9.0187 if \n",
      "   -3.9776 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.018671831674873827\n",
      "Run episode 990 with rewards 9.0\n",
      "============ 991 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.00343504697084428\n",
      "   -0.0000 if cp<=0.03274189643561841\n",
      "   +0.0000 if cp<=-0.0446807861328125\n",
      "--------------\n",
      "   +7.4836 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.8968 if cp>=-0.0417468436062336\n",
      "   +9.0187 if \n",
      "   +3.9776 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.019135314226150515\n",
      "Run episode 991 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 992 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if \n",
      "   -0.0000 if cp<=0.00343504697084428\n",
      "   -0.0000 if cp<=0.03274189643561841\n",
      "   +0.0000 if cp<=0.07958149611949922 & cp>=0.026817317306995395\n",
      "--------------\n",
      "  -18.3988 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -9.6110 if cp>=-0.0417468436062336\n",
      "  -22.2035 if \n",
      "   -9.8096 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.04810818880796434\n",
      "Run episode 992 with rewards 9.0\n",
      "============ 993 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.03274189643561841\n",
      "   +0.0000 if cp<=0.07958149611949922 & cp>=0.026817317306995395\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +18.3988 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +9.6110 if cp>=-0.0417468436062336\n",
      "  +22.2035 if \n",
      "   +9.8096 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=-0.061570990830659866\n",
      "Run episode 993 with rewards 9.0\n",
      "============ 994 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.03274189643561841\n",
      "   -0.0000 if cp<=-0.005436258530244221\n",
      "   +0.0000 if cp>=0.06551872193813324\n",
      "--------------\n",
      "   -6.2182 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -4.0982 if cp>=-0.0417468436062336\n",
      "   -8.5564 if \n",
      "   -4.4642 if cp>=-0.011055708117783069\n",
      "   +0.9165 if cp<=0.025334397330880172 & cp>=-0.005436258530244221\n",
      "Run episode 994 with rewards 10.0\n",
      "============ 995 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.03274189643561841\n",
      "   -0.0000 if cp<=-0.005436258530244221\n",
      "   +0.0000 if cp>=-0.009588232077658172\n",
      "--------------\n",
      "   +7.1465 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.2490 if cp>=-0.0417468436062336\n",
      "   +9.4314 if \n",
      "   +3.4289 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=-0.08031314760446548\n",
      "Run episode 995 with rewards 9.0\n",
      "============ 996 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.03274189643561841\n",
      "   +0.0000 if cp<=-0.005436258530244221\n",
      "   +0.0000 if cp<=0.07175994515419007\n",
      "--------------\n",
      "  -17.3681 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -7.9314 if cp>=-0.0417468436062336\n",
      "  -22.9564 if \n",
      "   -8.3687 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp<=0.050704315304756165\n",
      "Run episode 996 with rewards 9.0\n",
      "============ 997 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=-0.005436258530244221\n",
      "   +0.0000 if cp<=0.07175994515419007\n",
      "   +0.0000 if \n",
      "--------------\n",
      "  +17.3681 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +7.9314 if cp>=-0.0417468436062336\n",
      "  +22.9564 if \n",
      "   +8.3687 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.03947742357850075\n",
      "Run episode 997 with rewards 9.0\n",
      "============ 998 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0000 if cp>=-0.12081197798252105\n",
      "   +0.0000 if \n",
      "   +0.0000 if cp<=0.07175994515419007\n",
      "   -0.0000 if cp<=0.014693167060613643\n",
      "   +0.0000 if cp<=0.014693167060613643\n",
      "--------------\n",
      "   -7.2701 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   -3.5376 if cp>=-0.0417468436062336\n",
      "   -9.8927 if \n",
      "   -3.8171 if cp>=-0.011055708117783069\n",
      "   +0.9833 if cp<=0.047245201468467724\n",
      "Run episode 998 with rewards 10.0\n",
      "============ 999 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.0000 if cp>=-0.12081197798252105\n",
      "   -0.0000 if \n",
      "   -0.0000 if cp<=0.07175994515419007\n",
      "   +0.0000 if cp>=0.009427319094538693\n",
      "   +0.0000 if cp>=0.009427319094538693\n",
      "--------------\n",
      "   +7.2701 if cp<=0.014357964508235455 & pa>=-0.06876160800457001\n",
      "   +3.5376 if cp>=-0.0417468436062336\n",
      "   +9.8927 if \n",
      "   +3.8171 if cp>=-0.011055708117783069\n",
      "   +1.0000 if cp>=0.026162701472640038\n",
      "Run episode 999 with rewards 9.0\n",
      "\n",
      "Done\n"
     ]
    }
   ],
   "source": [
    "rewards = train()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "id": "3d20e8e0",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-------------------------\n",
      "   +4.4005 if cp>=-0.034614034742116925 & cv>=-0.3133296966552734\n",
      "   -1.4219 if cv<=-0.38871951699256896 & pa<=0.017361655458807947\n",
      "   -0.0000 if cv>=0.9960935115814209\n",
      "   -0.0000 if cp<=-0.027831528335809708 & pa<=0.04310643374919893\n",
      "   +3.8268 if cp<=0.04204743355512619 & cp>=0.025603938847780228 & cv>=0.17478539049625397 & pa<=0.032073907554149635 & pa>=0.013494865968823433\n",
      "-------------------------\n",
      "   +6.9184 if cv<=-0.355834037065506\n",
      "   +7.0150 if pa>=0.016492818668484694\n",
      "   +0.0000 if cv>=0.9960935115814209\n",
      "   +5.6943 if cp>=-0.013536681979894634 & cv>=0.07957192165777191 & pa>=0.02368280179798603\n",
      "   -4.0822 if cp<=0.04204743355512619 & cp>=0.025603938847780228 & cv>=0.17478539049625397 & pa<=0.032073907554149635 & pa>=0.013494865968823433\n"
     ]
    }
   ],
   "source": [
    "for i in range(2):\n",
    "    print('-------------------------')\n",
    "    print(actor.best_model[i].rules_)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "id": "0b443f87",
   "metadata": {},
   "outputs": [],
   "source": [
    "def test(num_test_episodes=100):\n",
    "    \"\"\"\n",
    "    Test the learned policy using the trained actor model.\n",
    "\n",
    "    Args:\n",
    "        num_test_episodes (int): Number of episodes to test the model.\n",
    "\n",
    "    Returns:\n",
    "        float: Average reward over the test episodes.\n",
    "    \"\"\"\n",
    "    total_reward = 0\n",
    "\n",
    "    for episode in range(num_test_episodes):\n",
    "        state = env.reset()[0]  # Reset the environment and get the initial state\n",
    "        episode_reward = 0\n",
    "\n",
    "        for t in range(1, 10000):  # Limit the number of time steps\n",
    "            # Convert state to tensor and predict action probabilities\n",
    "            #             state_tensor = torch.tensor(state, dtype=torch.float32).to(device)\n",
    "            action_probs = actor.predict(pd.DataFrame(np.array([state]), columns=column_names))\n",
    "            # Select action based on the highest probability\n",
    "            action = np.argmax(action_probs)\n",
    "            # Take the chosen action\n",
    "            next_state, reward, done, trunc, _ = env.step(action)\n",
    "            # Accumulate reward\n",
    "            episode_reward += reward\n",
    "            if done or trunc:\n",
    "                break\n",
    "            # Update state\n",
    "            state = next_state\n",
    "        total_reward += episode_reward\n",
    "        print(f\"Test Episode {episode + 1}, Reward: {episode_reward}\")\n",
    "    avg_reward = total_reward / num_test_episodes\n",
    "    print(f\"\\nAverage Reward over {num_test_episodes} Test Episodes: {avg_reward}\")\n",
    "    return avg_reward"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "id": "ef9e3e26",
   "metadata": {
    "scrolled": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Test Episode 1, Reward: 152.0\n",
      "Test Episode 2, Reward: 315.0\n",
      "Test Episode 3, Reward: 91.0\n",
      "Test Episode 4, Reward: 500.0\n",
      "Test Episode 5, Reward: 43.0\n",
      "Test Episode 6, Reward: 47.0\n",
      "Test Episode 7, Reward: 59.0\n",
      "Test Episode 8, Reward: 360.0\n",
      "Test Episode 9, Reward: 50.0\n",
      "Test Episode 10, Reward: 500.0\n",
      "Test Episode 11, Reward: 172.0\n",
      "Test Episode 12, Reward: 27.0\n",
      "Test Episode 13, Reward: 47.0\n",
      "Test Episode 14, Reward: 298.0\n",
      "Test Episode 15, Reward: 37.0\n",
      "Test Episode 16, Reward: 78.0\n",
      "Test Episode 17, Reward: 34.0\n",
      "Test Episode 18, Reward: 500.0\n",
      "Test Episode 19, Reward: 170.0\n",
      "Test Episode 20, Reward: 98.0\n",
      "Test Episode 21, Reward: 500.0\n",
      "Test Episode 22, Reward: 80.0\n",
      "Test Episode 23, Reward: 125.0\n",
      "Test Episode 24, Reward: 500.0\n",
      "Test Episode 25, Reward: 90.0\n",
      "Test Episode 26, Reward: 500.0\n",
      "Test Episode 27, Reward: 57.0\n",
      "Test Episode 28, Reward: 122.0\n",
      "Test Episode 29, Reward: 301.0\n",
      "Test Episode 30, Reward: 75.0\n",
      "Test Episode 31, Reward: 60.0\n",
      "Test Episode 32, Reward: 500.0\n",
      "Test Episode 33, Reward: 95.0\n",
      "Test Episode 34, Reward: 265.0\n",
      "Test Episode 35, Reward: 129.0\n",
      "Test Episode 36, Reward: 35.0\n",
      "Test Episode 37, Reward: 26.0\n",
      "Test Episode 38, Reward: 500.0\n",
      "Test Episode 39, Reward: 432.0\n",
      "Test Episode 40, Reward: 51.0\n",
      "Test Episode 41, Reward: 46.0\n",
      "Test Episode 42, Reward: 175.0\n",
      "Test Episode 43, Reward: 306.0\n",
      "Test Episode 44, Reward: 500.0\n",
      "Test Episode 45, Reward: 234.0\n",
      "Test Episode 46, Reward: 57.0\n",
      "Test Episode 47, Reward: 342.0\n",
      "Test Episode 48, Reward: 500.0\n",
      "Test Episode 49, Reward: 139.0\n",
      "Test Episode 50, Reward: 500.0\n",
      "Test Episode 51, Reward: 449.0\n",
      "Test Episode 52, Reward: 29.0\n",
      "Test Episode 53, Reward: 500.0\n",
      "Test Episode 54, Reward: 426.0\n",
      "Test Episode 55, Reward: 500.0\n",
      "Test Episode 56, Reward: 500.0\n",
      "Test Episode 57, Reward: 37.0\n",
      "Test Episode 58, Reward: 500.0\n",
      "Test Episode 59, Reward: 54.0\n",
      "Test Episode 60, Reward: 500.0\n",
      "Test Episode 61, Reward: 278.0\n",
      "Test Episode 62, Reward: 500.0\n",
      "Test Episode 63, Reward: 120.0\n",
      "Test Episode 64, Reward: 79.0\n",
      "Test Episode 65, Reward: 500.0\n",
      "Test Episode 66, Reward: 158.0\n",
      "Test Episode 67, Reward: 500.0\n",
      "Test Episode 68, Reward: 245.0\n",
      "Test Episode 69, Reward: 105.0\n",
      "Test Episode 70, Reward: 500.0\n",
      "Test Episode 71, Reward: 64.0\n",
      "Test Episode 72, Reward: 99.0\n",
      "Test Episode 73, Reward: 168.0\n",
      "Test Episode 74, Reward: 71.0\n",
      "Test Episode 75, Reward: 69.0\n",
      "Test Episode 76, Reward: 104.0\n",
      "Test Episode 77, Reward: 100.0\n",
      "Test Episode 78, Reward: 116.0\n",
      "Test Episode 79, Reward: 70.0\n",
      "Test Episode 80, Reward: 105.0\n",
      "Test Episode 81, Reward: 67.0\n",
      "Test Episode 82, Reward: 247.0\n",
      "Test Episode 83, Reward: 53.0\n",
      "Test Episode 84, Reward: 500.0\n",
      "Test Episode 85, Reward: 500.0\n",
      "Test Episode 86, Reward: 50.0\n",
      "Test Episode 87, Reward: 52.0\n",
      "Test Episode 88, Reward: 20.0\n",
      "Test Episode 89, Reward: 403.0\n",
      "Test Episode 90, Reward: 434.0\n",
      "Test Episode 91, Reward: 500.0\n",
      "Test Episode 92, Reward: 157.0\n",
      "Test Episode 93, Reward: 500.0\n",
      "Test Episode 94, Reward: 214.0\n",
      "Test Episode 95, Reward: 500.0\n",
      "Test Episode 96, Reward: 500.0\n",
      "Test Episode 97, Reward: 47.0\n",
      "Test Episode 98, Reward: 74.0\n",
      "Test Episode 99, Reward: 62.0\n",
      "Test Episode 100, Reward: 177.0\n",
      "\n",
      "Average Reward over 100 Test Episodes: 233.23\n"
     ]
    }
   ],
   "source": [
    "avg_test_reward = test(num_test_episodes=100)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "id": "31340922",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<matplotlib.lines.Line2D at 0x7f324ef4b760>]"
      ]
     },
     "execution_count": 30,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXcAAAD4CAYAAAAXUaZHAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8qNh9FAAAACXBIWXMAAAsTAAALEwEAmpwYAABBB0lEQVR4nO2dd5wdVfn/38/cti3Z3Ww2PaSR0EnAAAFCDSBFCf4ERFBQUSwoiny/CgpW9IvSFQRBmqCoFCkhoQVCCSWdJKT3bNr23u69c35/zNy2JbvZezfZvfd5v1772pkz5545c2fu5zzznOecI8YYFEVRlPTCOtAVUBRFUVKPiruiKEoaouKuKIqShqi4K4qipCEq7oqiKGmI90BXAGDw4MFm7NixB7oaiqIo/YrFixeXG2OKOzrWJ8R97NixLFq06EBXQ1EUpV8hIls7O6ZuGUVRlDRExV1RFCUNUXFXFEVJQ1TcFUVR0hAVd0VRlDSkW+IuIltEZIWILBORRW7aIBF5Q0TWu/8L3XQRkT+JyAYRWS4ix/bmBSiKoijt2RfL/QxjzBRjzFR3/0ZgrjFmIjDX3Qc4D5jo/l0DPJCqyiqKoijdIxm3zEzgCXf7CeCiuPS/G4ePgAIRGZ7EeRRFSTHzN5SzubzhQFdD6UW6K+4GeF1EFovINW7aUGPMLnd7NzDU3R4JbI/7bImbloCIXCMii0RkUVlZWQ+qrihKT7nibx9zxh3zDnQ1lF6kuyNUpxtjdojIEOANEVkTf9AYY0Rkn1b9MMY8BDwEMHXqVF0xRFEUJYV0y3I3xuxw/5cC/wWOB/ZE3C3u/1I3+w5gdNzHR7lpiqIoyn6iS3EXkVwRGRDZBs4BVgIvAVe52a4CXnS3XwKudKNmpgE1ce4bRVEUZT/QHbfMUOC/IhLJ/09jzKsishD4j4hcDWwFLnXzzwbOBzYAjcDXU15rRVEUZa90Ke7GmE3A5A7SK4AZHaQb4NqU1E5RFEXpETpCVVEUJQ1RcVcURUlDVNwVRVHSEBV3RVGUNETFXVEUJQ1RcVcURUlDVNwVRVHSEBV3RVGUNETFXVEUJQ1RcVcURUlDVNwVRVHSEBV3RVGUNETFXVEUJQ1RcVcURUlDVNwVRVHSEBV3RVGUNETFXVEUJQ1RcVcURUlDVNwVRVHSEBV3RVGUNETFXVEUJQ1RcVcURUlDVNwVRVHSEBV3RVGUNETFXVEUJQ1RcVcURUlDVNwVRVHSEBV3RVGUNETFXVEUJQ1RcVcURUlDVNwVRVHSkG6Lu4h4RGSpiMxy98eJyMciskFE/i0ifjc94O5vcI+P7aW6K4qiKJ2wL5b7D4HVcft/AO42xhwMVAFXu+lXA1Vu+t1uPkVRFGU/0i1xF5FRwAXA39x9Ac4EnnWzPAFc5G7PdPdxj89w8yuKoij7ie5a7vcAPwFsd78IqDbGhNz9EmCkuz0S2A7gHq9x8ycgIteIyCIRWVRWVtaz2iuKoigd0qW4i8jngFJjzOJUntgY85AxZqoxZmpxcXEqi1YURcl4vN3IczJwoYicD2QBA4F7gQIR8brW+Shgh5t/BzAaKBERL5APVKS85oqiKEqndGm5G2NuMsaMMsaMBS4D3jLGXAG8DVzsZrsKeNHdfsndxz3+ljHGpLTWiqIoyl5JJs79p8CPRWQDjk/9ETf9EaDITf8xcGNyVVQURVH2le64ZaIYY+YB89ztTcDxHeRpBi5JQd0URVGUHqIjVBVFUdIQFXdFUZQ0RMVdURQlDVFxVxRFSUNU3BVFUdIQFXdFUZQ0RMVdURQlDVFxVxRFSUNU3BVFUdIQFXdFUZQ0RMVdURQlDVFxVxRFSUNU3BVFUdIQFXdFUZQ0RMVdURQlDVFxVxRFSUNU3BVFUdIQFXdFUZQ0RMVdUTIMXa8+M1BxVxRFSUNU3BUlw1DDPTNQcVcURUlDVNwVJcNQwz0zUHFXFEVJQ1TcFUVR0hAVd0XJ
MDQUMjNQcVcURUlDVNwVJcNQuz0zUHFXlAxm0ZbKA10FpZdQcVeUDCPe5X7xgx+yelftgauM0muouCtKhlPV0Hqgq6D0Al2Ku4hkicgCEflERD4VkV+76eNE5GMR2SAi/xYRv5secPc3uMfH9vI1KIqyD5g2XncROUA1UXqT7ljuLcCZxpjJwBTgXBGZBvwBuNsYczBQBVzt5r8aqHLT73bzKYrSR1FtT0+6FHfjUO/u+tw/A5wJPOumPwFc5G7PdPdxj88QNQ0Upc+iP870pFs+dxHxiMgyoBR4A9gIVBtjQm6WEmCkuz0S2A7gHq8BilJYZ0VRkqDtGCa1vdKTbom7MSZsjJkCjAKOBw5N9sQico2ILBKRRWVlZckWpyhKD7FU29OSfYqWMcZUA28DJwIFIuJ1D40CdrjbO4DRAO7xfKCig7IeMsZMNcZMLS4u7lntFUVJmr5muFc3tvKTZz+hqTV8oKvSr+lOtEyxiBS429nA2cBqHJG/2M12FfCiu/2Su497/C2jk1koSh+mb6n7PW+u5z+LSvjXwm0Huir9Gm/XWRgOPCEiHpzG4D/GmFkisgr4l4jcCiwFHnHzPwI8KSIbgErgsl6ot6IoPaS9z/3A1EPpXboUd2PMcuCYDtI34fjf26Y3A5ekpHaKovQ6Vh9Vd33fTw4doaooGU7flHYlWVTcFSXDaD9C9QBVpBMi9VHDPTlU3BVF6VOI+y6hcRjJoeKuKBlGW83sqz53JTlU3BVF6VNoW5MaVNwVJcNo6+zoa2IaqY56ZZJDxV1RMhzpY/EysQ5VVfdkUHFXlAxDOyozAxV3Rclw+qqFrG1Qcqi4K0qG09dEVKcgTg0q7oqSYfQxLW9HtEP1gNai/6PirihK3yLSoarqnhQq7oqSYbQVzb4qon21L6C/oOKuKBlOXxPRvhaa2V9RcVeUTKNvaXk7RN0yKUHFXVEynGRFtCUU5sL73mfhlsqU1Eft9tSg4q4oGU6yBvKG0nqWl9RwywsrU1IfJTWouCtKhtHWx56qEaupjk/XkbTJoeKuKEpSpFqDdQxTalBxV5QMo10oZIrKTZUmxxbrSFGBGYqKu6JkOH1NRHWZvdTgPdAVUBRl/xIRzenWCoqoAU5MSbmpdqf0tUanv6HirigZylP+/wNgMf97gGuSiLrcU4O6ZRQlw0nWQk65he2+AvS1kbP9DRV3Rckw2oYYpqxDNUUmty6zlxpU3BUlw0nacu8lC1u1PTlU3BUlw0i1aEYaB53wq2+h4q4oGU7qRqimpBgdxJQiVNwVJcNI9SCmlPen6modKUHFXVEyHGPbKSknZSNUdRBTSlBxV5QMo20HqNjBA1STvaOGe3KouCtKpmO3JvXxVM/eqC731NCluIvIaBF5W0RWicinIvJDN32QiLwhIuvd/4VuuojIn0Rkg4gsF5Fje/siFEXpOVY4RZZ7inpCY24ZNd2ToTuWewi4wRhzODANuFZEDgduBOYaYyYCc919gPOAie7fNcADKa+1oig9p61mJinuqR+gqrNCpoIuxd0Ys8sYs8TdrgNWAyOBmcATbrYngIvc7ZnA343DR0CBiAxPdcUVRUmGmHJaSfrcY3HuqUW1PTn2yecuImOBY4CPgaHGmF3uod3AUHd7JLA97mMlblrbsq4RkUUisqisrGxf660oSg8xgJdwLCGcnM89gsan9y26Le4ikgc8B/zIGFMbf8w4PSr71NAaYx4yxkw1xkwtLi7el48qipIkPkLRbUmyQ1Vt7L5Jt8RdRHw4wv4PY8zzbvKeiLvF/V/qpu8ARsd9fJSbpihKH8AY8MeLe6os95SUEtehqm1GUnQnWkaAR4DVxpi74g69BFzlbl8FvBiXfqUbNTMNqIlz3yiK0gdIEPc+FuceXWZP3wiSojuLdZwMfBVYISLL3LSfAbcB/xGRq4GtwKXusdnA+cAGoBH4eiorrChK8viJCXqy4t5rFrZqe1J0Ke7GmPfp/I1rRgf5DXBt
kvVSFKWXMBj80gtumRTHuSvJoSNUFSUD8fVpt4yDGu7JoeKuKBmG06GaQrdMpJykSokR61BVeU8GFXdFyUASo2WSE3fbdkQ41e4U1fbkUHFXlAzDQKLPPdmJw5KsT1t0RafUoOKuKBlIvFsm2ekHbNfEVlHuW6i4K0qGYYxhqFRF95OOlkmx6a6LdaQGFXdFyUAmyM7othVsSqqsXgtzV3VPiu4MYlIUJc3Ip4HdphA/QXLqNydVlt1L00LqCNXkUMtdUTIMY8AvQVqNl81mONn125IuL5VEyhtVvwJaG1JbeAah4q4oGUiAEEG8NBk/nnBLUmWlOs4doJgqrl77bXhRB7v3FBV3RclA/ARpxUcrvqQ7VKPRMilSd4NhoDQ6O7tXpKbQDETFXVEyED8hWvDSii/pUMhUu8aNAV9kMRHLl9rCMwgVdyUpfvSvpYy98ZUDXQ1lH3DEM+Ra7l6sJAcxpTrO3QAB3Dp5NOajp6i4K0nxwrKdXWdS+hyRDlXHck9yhGovWO454vYDqOXeY1TcFSUD8bsdqq3Gi5Wkz703AhZzaHY2LLXce4qKu6JkGAYT7VBtSYHl3hsdqrm4lrtHLfeeouKuKBmInxCteFPic+8Nt0x21C2jlntPUXFXlAzDGAhILBTSCrfy6Pub+cHTS3taYkrrB5Abccuo5d5jVNyVlKALK/QvvIQJGg9B40Ww+d2sFbz8Sc86x+3I7AMpHMWU7bpltlWnZgnATETFXUkJtmp7v8EAFgYbi1Z3eqn4KYD3ubzo1DIpCoU0hlxxLPcNpXUpKTMTUXFXUkJY1b1fIdjYCEFX3KODhnpAyjtUTcxy95pQF7mVzlBxV1KCrW6ZfoMxJmq5B/EAjpumx+WlqmJx5eW44h6QvrV4d39CxV1JCWq59y8ccRfCrrh7khH3FDfsxhB1y8Sv9arsGyruSkoIq+Xer7CwMUjUck/GLdMbtz4y/UAyfQGZjoq7khLCYRX3/oIBxHXLhIzrlpFk3DIpttwxBFxR96nl3mNU3JWUoJZ7/8LjdqiGoh2qPRdR205VrRwicfigbplkUHFXUoKtPvd+gzExn3sqO1QlReEyhpio+7VDtceouCspQS33/kUkWiYUFfeem98mOuVv6oj42tta7rtqmrjkwQ+obNDBTV2h4q6kBI2W6U+YaJx7TNx77v4wqR6hakzMcm/Tofrwu5tZuKWK55eUpOhk6YuKu5ISVNz7F+0t90S3TElVI2t213arrNR3qMZHy6jPvafolGtKSlBx719EfO4RcfdJOGE00vQ/vA3Altsu6LKs3pgV0i8Ryz3kJLivBZGGJFX+/XSmS8tdRB4VkVIRWRmXNkhE3hCR9e7/QjddRORPIrJBRJaLyLG9WfnOWLa9mir1yfU69S0xq0pHqPYfjG2wxDhx7ib5DtVUt+uR+eYBLDFgx56z2Dw2Sld0xy3zOHBum7QbgbnGmInAXHcf4Dxgovt3DfBAaqq5b1x0/3wu/euHB+LUGcVrK3dHt8MpDofbH9Q0BXnwnY0ZOKOlc722saKhkMn43COd6VYKrekEd0yoOWXlZhJdirsx5l2gsk3yTOAJd/sJ4KK49L8bh4+AAhEZnqK67hPrS+sPxGkzlv7olvnliyu5bc4a3ltffqCrsl8xxmmJE0Mhk4+WsVI4cZifILUmx0lobWyXR70yXdPTDtWhxphd7vZuYKi7PRLYHpevxE1rh4hcIyKLRGRRWVlZD6vRHo23Tj2tIZu65s7jjWdYi7Fqtnd6vK9S2+xYh8H++NqRDHHiHk5BnDvBZub5r+fIpoWpqB3G2PglTJXJc8tvSEm5mUbS0TLGabb3WVGNMQ8ZY6YaY6YWFxcnW40oGm+deq56dAFH/er1Do/5CPGI/07GvXLpfq5V8pgUT1Xbb3CHlJq4WSGTGaHqby5jrLWHq8ruTEn1PO6yf1W44t4aE/fMc6H1nJ6K+56Iu8X9X+qm7wBGx+Ub5abtN/qje6Cv
8+Gmig7TDTBSnLcuX+Oe/Vgjx18+9sZXeHXlrq4zd0J0BaFM655zBdKx3B0J8LhumZ6IpzHO95cf7vg52Vc8tvOWWG0GOAmt7S33DLtjPaKn4v4ScJW7fRXwYlz6lW7UzDSgJs59s19Qcd9/GGMYI067HgwM2q/n3ljm9Kk88M6mHpcRfVIyTCmM64LpWNzb51+zu5aK+pbOy3PF2MJAffIuVss45+rQck+69MyhO6GQTwMfAoeISImIXA3cBpwtIuuBs9x9gNnAJmAD8DDwvV6pdQfUt4QI20bdMvuZ0a64t/gL9+t5UxES1xvD5vsDEu9zd0MhLXHTOvj9nHvPe5z/p/c6Lc/EhSry/l1J188bdtwy1aa9uEfQOPeu6XIQkzHmy50cmtFBXgNcm2yluktLKMxNz63gR2dN4tTb3+Yr0w7ihrMP2V+nV4gTdytrP585df7yjBMK41juBitquUc6VB+bv4XBA/yxrK7Y76nt3HKXcJy4Z+UnXb2IW6ZqL24ZpWv69QjVeWvLeH7pDvbUOXGwzywq4UdnTTrAtcocDDCAJgA8rft3IePUWO6dlxEM24RtQ5bPk8QZ+ih2zOdut3HL/G726oSsNU3dmJUx3nIPDEi6epbtNCRZ+YOhEWiNhTXri3n36ddzy0SsilA4MijDqM99PxMQ5xW6sGFTSvyt3SUV08yavVj/F943n0NvebXHZfdpEkIhHQmwOolzn/KbN7pRXJy4dxCTvq94jdOgFBS5EdZBjXPvCf1a3G0DeTRGBd022qHam3QUSRFZMUcwUJ/aiJnFW6v4qLNInZRa7u1LWb2re5Nm9RaNrYmhiQ0tqZtAy9gRcbcItbHc4/mq53W2ZF0encSrMyRB3JMfPOhxfe7N3oEAvPfpVj73Z8fnn+pJytKZfi3uWfUlrMz6Jqc3zAHUcu9t2n21BrLif/gdWFjJ8MUHPuCyhz5KaZnxpHyq2hTxzroyDv/FayzY7AwMn7NiF0f88jVW7qhJSfniCvm5R45o55aJ5wbvMwAMYu8utwTLPQXPgGWcZypsBWgkizXbdrFyRy1PL9gWzdPHblmfpF+Le6DeGRV5btMrgPNjVXHvPdp+t/FrXQIpsdq6SyoGIEWswL72zHyw0ZkOYfHWKgDedadHWLa9OiXlR6Yf8Ho97UIh44nM71Ige7+vYsc/A8l3fnrcxsK2fDSSRS5On9pNz69IuuxMol+Lu93kWDK5JvbwaShk79E2TC5kG7Kklcq9hKz1Fqm4y5HL6avPTKTx8XmcFiyUqmkSXHFHrL1a7r5uiPvGsnoam2KRNHUNyT8DlnHOaywvTQTIllj5ffRW9Un6tbh7mhyLJjJCDvqeFZZOtBX3sO1Y7rGQtX17JQ/bpsfzutjRGPVkOlQdnv54217nztlXWkLhpOY4antNXsv5mYZS9GxLnLhH5nP3dDC3jE+ctL25ZWbc+Q4frI/NDvrump0pqJ9bF/EkWO6JmdQx0xX9WtytkBOGF//I76u427bhVy99yuZyjaXtirbfbShsyKKVSiLivm9umS8+8AETfz4nubok1aPq/Ht91R5ueWHl3vN2k9aQzSE3v8r/zVnddeYuKK1tYVdNE17Xcg+GUyPukQ5VJBbn7pH2jWyz8QFwirV8r+XFTzrmT2YCMpeouFseGk0WOXHiHo2SSvos6U+/FvdpV/yCF73nUWiqoz36+yrua3bX8fgHW/j+P5f0RhXTCrvN7z9sO+Ietdz3sTMtGR9yxIpNTttjz0pFihZ3aQ45wvTPj7d1kbNrHv9gCyf+31t4rb27ZeZvKOeoX75GbTffPiIdqoiFE+ck7UIh/QTJEqe8w6y9X0tE3JuMP6l54SNYkUFW4qWRALkduGXUcO+afi3uAMv9k8mhmROtT4Geu2VCKbKK0o34CI22vumt5TUMlSq2mGFOwn70uYfDPe9Q3VXTRGld4qt+qkapxuqVOvXxeZyfabCTZ/veN9dT1xJi1c5uhm9G
FdIp14innc99rDiuliqTxzjZxd56OSJzwTfhT2p2yQiRxkcsD40EyKbz0bFK5/R7cX+r6WAAxsoewOyzX1KXh9s7lzz4IVm08BXPG4RDiZbhRwsXEJAQq+wxtEpgv0bLxN/nfW3QT/y/tzj+d3MTOudStdBEq2tdp9Kw7KpD1Rs9vvfvIRS2nb4A1+duXHG3xYOPMMfL6qgFf4g4kWhzwscxUJq40Pqg03Ij/vomAlE/fXcxxrS7LrFdy93y0GDa+tz199pd+r24b27KpsEE+JXv79zvuxfbGAK0siXrcljwMFsrGvb6utoSisyzoQ9NR9jG8Bvv49zqewzvlncSjg2yHEu9nHxaJCsloxM7oqYpyLaKxLIjjfJHmyqZ8LPZPSrX3rGU9YGvsiXrcia1rEq6nuD43FON17P3DlVv1LLf+7kP/vkcfvyfZcxZ4czCLa64t4ThC573+E/gt1ztmc3Dvjv4s/8+AN61JwPwJ//9ndfPFfRm41ju+zJt8J2vr+Pgn8+J/g4BhJjPvcFkkSO6zF5P6PfiDkKV26F3gWcBobBhlDvHOLP/h9Nun8cX/9K51dHU2vkP4nevrMp4X7zHEsZYzshTaUocLXpQnvMjbDBZVIf8NDX2zqjOi+6fz6m3v52QFrJjiyj3lLP5MGppnlbvNBDGGP6zsPNVpbZXNvL2mtJOj0ejf1Jountk75Z5xCcf3ovlHhHcF5bt5JVPHHHP8jtTS4WxKBbn3p3lWcLZHueZr/EN4XV7KjtMkVOInWiVRyKCBuI08tXk4SXc5ZvUgs2VfLK9mn8t2Maj8zcD0NASJ+7RNwsP9cZPLs3k0MwZ1tJov4++cHdNGog71EXWWgSkpYYRkihCna2n+sGGcv767kag44fl4fc2M2v5fp2Ovs9hDNSbbGenbnfCMZ/bgVpHNg1kMW/FlpQOk4/QUSST1VLNuqyruMH7nx6XW2tyo9tlvhEAzFtXxk+e6zw65Px73+Prj3e+nNxbrvCn0i0TeUvp6O1ye2UjTa2OMIb2Yrm3xL1RWG45eVnO7I92nAxMlJLodp2vmKIB2dwfushNSPwtRPpgxkgptSaHCjMQH+Euxw1c+tcPmXn/fG58fgWNbt3jp1uIxLkv2lpDo8kiS4I84b+Nx/y3k9XqGG66IlPXpIW41xITd0/9LoZLx/ORtOXyv32ccYsj7ythOyYp/p2OqL29ppQt5Q34w47oWoEBNBEgl+YuXWDPLNre4xjw5mDMuvM2OCL6A+8LPSoLIF9ijUbAXSCirnnvjVOd23j9+uVP+emzy9tdy62vOCGQqexQ3Vs/0il/fDu6UtbeQiUjIgqxScKKBmQzoTg3GusOMChuwFKTdyB+j8U6210GefO7CWVGLPQxsoctZiitePER6tBy7+qeN7W2t9xrWwwNOFNJH2etA8DX4nTw63CWrkkPcY+z3L2NexIs9wF07Qc+11rA/fXX79dZDfsLQdsm141W8Jc6Fu3XH1/I6XfMI2A74rin1U+1yaVIarE6EbWVO2o45OZX+d9nlzNrRc/ehuKF19MacwFNkn1vMPJoZLJspMzkU2nyyLedof5tLcLOLMTH5m/h34u2c+H97+/TeXtCRCy7Mlb3ZrnHv1GJ21znBnyccciQBMs9nvrAELweYamZSJnJh0WPdlivg2QP28xQQng6dMtsKK1n/M9m89qniW9+DoZzrIUEK7ZGUyKhkEEsGklcJ8AbrGOGtZiBdes7vVbFIS3E/fbQl6hzXQfehlKGUxk9dp33+ej2N59YxEOuGyaer3lfY5K9Ed69vfcr2wWvrtxFVYpirlOBMZDtdmh5GkshbmGGgaYOGw91doDNZjjjZDehcMfREou2xO5JeV3PQtsio0ht2/CPd2LzjJxjLSJoO5Egzy4u6dYw/Vu8T3GiZxV5NJFPAyfVzmH1209T28Zy78p/vHJH+36GCbKDg83WDnJ3j7btY8g2jl/bTqxbrOFx/gdD3bPcx4jT
h+IvHEFeljc6kKktnwz7f85kfHh4zz4K02bWz5Bt8BBmlJSz1QwhaLz4JJQwHmJ5STVn3eV0xM9bW5rQceoEPlzBQ/67GfPGN+MuzMkTNhaNJpBwzmPq5vGI/06+8OHFULWl0+tV0kTc15nRnNDi9OZ7G/ckuGXiZy18c/Uefj97TbvPD8L5gVbu6Noa+O2sVYy98ZVkq9whZXUtfOepJZx777tdZ96PRCx3MWHCrt/9M7KWKzxzqct2ZhbcaEaQIy3Y1R2vh+6JizVs2YeIkjGym4ssxzqOWO6Vja0MjHsjO9TaTihseGbxdv7nmU94bP6WLss9zHLEd7Z9An8PnwPAlrceoaaxlTwa+afvVl71/7QHr/+GuYH/5Tn+J3W9fqEmlmd9i/O2x5aw21zewEebKjlCtrAl6woe9t1BdXUFJVWJb6r3v72BT3fW0BDn0z7WWk/ICsDQo8jxezoU9wnNT1JfeER0BaYak0tdVTlPfeR8b3NW7OLlT3YyQsrxSZitZihBnJDK+DeI+9/eEN3Oz/azvCQ2bmJSnH8/t2o11LpvdG7HbdBYNJIo7gXBuM7sVS/t/XvLcNJC3AEayaKebPxNZYyQCuaEj2ODPYKvet/kcs/chLxtLbth4rySb93ecZTEpztjD+Qj7zu9+z2dE2VvRKyaPbUt1DT2LBJkW0UjH27ce5/Dyh013R/wAmRLC/XGeT1ura+kmGqeC/yaQqmnLncMAJvMcACsyo4bSCtO3NuGC3bmUvET5J3Aj7nH/xemyppoo1BW10K+6xveaA+nWKoJhm3K652GvHwvizlHr4lWltnj+Vnwan4duop3w0cxQiqoagxyi/cpTvKs4lBrO/ZeXB2CzeetD3jm7h9G04qI+15rk5tnJZcmZvtv4ozNjqifUPECAKW1zZxxxzy+/PBHTLEc8Tzbs4Sid29m+h+cqKKXP9nJzPvnc/tra7ngT+/T2BLGR4infL/jm945VOUfAV4/fo9F2DgyEI6fowkPuQEv5x3pDFCrIZeB0kjuK9/F2Dbf/ccSbn5hJQe5yyxuM0MJ4sVPMKFDddzgPMBwkfU+RQGbT+JGJZ/jWQTAUyF3xc5dywAw7tthyFhRn3uE4lDMpff4O6tYEddYKImkjbgDlFGAv6mUYVLJbjOIO0OXAPAdT2ILf/DP57DQdRNk08xAcaydImkveP/PepeH77utXXp8516qiHcBdHcoeVtOvf1tvvzw3udA/9yf39/rgsfxnHXYUPJpYIcZDECwoZqzPIujx80AJ8pkk+2Iu6dqU4flOOF8hnt895G7/R0q41xPZZ2I8VESK+vZwG/IKXHqXFbXwjjZTaMJ8KkZy0gpjw4eAjoMVVm5oybqkvMQ5iDZw0f2EbTgRIxsMsMZJ7uobmhNuL5wY3WHdQO413c/f/bfxyU1j0dj/COGAtAuumTfMNzju5/Dra0cU/pCLHnVSyzZFjvHCIkFBEyWmMvxB08vTRDShtYQp1qfMN3jjORuHHoMAP64aX9rcKKHyo2zSIYlwu0XT+a6Mw+mxo0s+oJnPi3VsUZrKE5ddplBbDdDKJAGPFtiz1a2z8N0ayX3+P/CSVv/QkvIZpq1ismyge94Xua18FSWjP0WAOGaHWwpb8C4lntzGNbaBwHwl9CFbLeLGR+KXWNzYz33zl3X7W800+j34v7IVVOZNDSPmVNGUGUG4G+tIk+amXHMIcyxT2CZPYHtZki7z/3OjWo4TJx5M3aaQRRK+9nv7vI/yD3+v0AwcSBFUy+Ie3MwJlDxvskDiWW3MkCa2G6KAWhtrOFw2UqT8fNA6POETvoh4wbnUkoBrcaDVVvSYTk/++8KiqnhIs8HfHPrDXz29tejx074/dx2+W3bcLSV2FBkVazi5U92smZ3LYfKNjaa4SyxJzJKypGdy6L5Opop8nN/fp/fz16DMYZJ/koCEmKj+7YBsNkMZ6A0YdeXJkyEZco7d9Vd6Pkwuh3a+YlzLQNjfQvJ
iPtIyqPx5vF8uOAjvvNULH287GKrPYS/hi5gnOyikNoO+xwaWkJc5Jkfd4KpAPi9FrWuqEcEvAVnwjDbGPxei+EF2XxkHx79aKg09p0Mcn8zlWYgb9ifASCw9sXocY8F+W4cfF7DdlpDNv/y38qLgV/gkzDv2JMZN3YcIWPxzqJPOP2OeTQ2O439jMOHU04+Rzc/zF2hi1lkEtdHzqYZv7ffS1iv0e+/mRmHDeX1609jWH4WdSaHrGYn4mVQYQEAO00REz27otYAwJGyiWt2/4qDpYRzPQsJGg+vho93ImtCMYsyO37Yc63jS454F1qCqXfLRN4GArRS35KcuKcqDjgQct5mIg3kM/M/5ThrLQvtQ/hw/HWMmXAEs687BYPFDjMYb23Hri3bxOYrAfhK6Nm9njdsDEdZmxPSGrct4QdPL+WO2Sv4jGc9C+zDeCF8MrYRnn7qYW5/bW2X19MSshlrnAZoQyTED9jszo8zuG4V+dLII6HzALjr8X/w438vSyjjOFnDF6z3CBmLJbYz/cUbr7/Cr176lM80vkvIdXNQ1fNO1UlW+0ayBR/LN2xJSDtCtrDCjGdu+Fg8YjjNWp4wICjClopGToub3TF33PGAI+57TCEQs9xbTETcnbzZPg+rzRg+13IrAKGymLgXSS2txkMd2Ww1w1huj8MT18CHbBM1msSE2vW3lJoCBg3IZg+F1O1xrq25tZUwFr/4/BEA1JJLCC9r7dHRz1WZPLJpxe/p9xLWa6TNN+O1hFqTTVaLI+6W3wmP/Ng+jCFUEtrm+PcsbGYFbuZ8zwIe9d3ONd5XWGImstE47gWaHMvLGMPBEuczrXFEKxLq1zuWe5hRUsrarK+Rs3rv4tcV+9JpuTeygtUAlLiWe/OudUyUEkYceQp//8bxWJaQ7fdE8/jqO+5QBaL+YYBplvPmVEw1o6SUN1clRmJU1LcyUsrZYg+Npg2vc6blPUy2EiDIQvsQqhnAcjOeU2UJuTRxr+8+JlXO67QOTa1hxuLU8Zdfv4h7L5vCfZcfE+0zOLTRsYqX2gezwxQxRTbw/NLYNY0MNPFM4Dfc7X8Ar9g8HT6TFfZYjiz5F89/sJIp1kZet6dSJflQ2n7a37rmYDQksDkYZk4nYaGjXV/2d1p/FE2rNrkU0BCNUxdshkklW80QVhun76NIarjlxcTpiy1sHpq7koHSyB3BS7j/yGcYPMpplPyemLg3uf0qEcv9sOHOyO8BWc5I1k/NWJqND6mI3cdiqaHZP4iIL6zEFFO9I9bIBsN21C9vhVt4e2XiDJNbzVCKcgPsNoMYbLt9RXYIGys6rUKE6NTSOOJ+hmcpI8LJzx+frqSNuHssi1qTQyDkdLRZAUfc37GPBiBc5kTJXO2JzUNykOU0BLvNICoj09Y2OD7MlpDNuZ4FsRPscPywkY7B+EEXqaIlZHO65bzeD139WFJlNaaofgVB5ztaZcZQY3K43vccHjE0DBjfLm+JKY4ufdgRJ1qr2GgP57/hkxnp+orv8/+J9wM/4rq/v5/QsbqprJ6BNLLejGJq8wP8MfglioM7GUIVMz3OdBJVBUcC8Gr4OKZYm3jafyszPR9w9pbbEyJV4t0UjcEw49hBva+IKZPGMnPKSD539Ai+cs7JtBgvU4JLAeeNb6l9MMdITMgAPutPHL26fOAZ/DF0GaOtMpZnXcNIqeCN8GcokWHQgYvq5hdW8u0nF7O8pJpDb3mV7/5jSdSH/vbaUmYtd8RqmFTRajy8Zk/l4pZf8JnmB6g2eRxvrWZT1lfYknU5n7c+xC9hykwBdWTTYrwMllpeXxV7Qyqgjo8D3+Nx/x8B2EMh1158TvR4wGvxTPg0ngufwt2hLwLQPGkmH9x4JidNcPpZjh5VAIDBYrMZRk1JrNGaJNtpKZwY3V9iT2R4eCfU7WZTWT3BsOFQ1/XZUllCQ6Vzfb8KXsk5LX/g2Vu+QVGen12mKBrlZuwwtsQGVgGcMG4Q1ZEVv4Dx
1m6KpZYv7WzfH6Y4pI24ey2hjuzofsRy326GEMQLpesYRC0/9/0TgBfDJ0XzFuTnM2zUOGen2nkQG1pCHGetZY09mrX2KMw2p5MyMs9HMh2qL32yM6GzK0JzMMzB4liJncUed5f44dzJUBR0LMtN9nC+1vpTWo2H1fZBHDF9ZkK+sw4bygozHn9zBexqP3zfQ5jjrLV8aB/OJns4I6hgMDWcYDmN7igpSwjXK61rIY8mph02hu9+7kTWGOeV/ArvXL7hfZWdZhAPfu9Crp4+jpXGuXdHu26cAcFy2BbrVF6wuZILrQ+Y7b+J4M6VjJddVGePSaif1+tlqxnKBOPc//EHH8pyezyjrTJe8N8CHzqhthPtmKvoH6EZHDR8CO/ZR3N78FLW2KO5ofU7/Nc+hWqTC01VtGWrOwHahffN5xDZxsWed2h0Qzy//thCvv/PpQRCtXzP+xJlFGCw+MQ6jAryqSaPcVbsDScymVeZKQCEcvKZbq0gGDYMp4LfeB/jJ95/USy10TelcpOfUB+/12KFGc8Nwe+ywBzGMc0PcswVtzKiIPZbKh4Q4J/fPIG7Lp3MZjOcYJzPfYzsoWHAuOh+ZPrn1evXcead7/DY/M0cYjkN/kFSytFup+9aM5p1ZjT5OT6Kcv2UmGJGSjkWNnY4jB03anbYwCxuvuDw2LoBcSSERioJpI24eyxJmGPGE3Ba+TAedlgjkIp1fNbjDJ+fFT6BWXJ6NO+c/C+xO2uCI6i7HWH667ubGEYla81oVpuDaN3hDJrxWoaveV4lb0PPYmxL65q57umlzLx/fju/eEtrazQ8LKux551xA2nAu+LfKYmzLgyXEcbiu587idbhn2FSy5Oc13ob3oGJndQ/OmsiH0Y63TpwRxwq2xkgTXxsH8Z8+0gsMcwK/Cx6/PXAT6lvivVxNLSGGCCNeLILmDllRFSUfuh9nnIzkK+0/ozCvABnHDKEXWZQ9HNTmx8gjAfWvxZNK6lu4jzPxxxubaVwzvcYJpXUZ8c6U8ERuc2uayYkXj5z5GGUuu6KKdZGeO1nbNpdyYDWPWy0h3Ni8595Zsh1/Gam4xe+P3wR57b+gcu//VO+OX0clXYeNCaK++6aZnZu38wHge+zIfAVXgvcyB2+vyLb57Mhbv6jUXXOM/hU6GwAXrx2Oj6PJMyFE0+ks/v18FSOsrYwwWzjh97nuNL7Bpd7Eydc++q509tddzxVDOxwkvyTDh7M8PxsNpthHCSlDKCRoVQygCZCgYJovkinbHOtY4XnhWsYKtU8F56OT8J83+t0tm6zY89PUV6ArWYIAQkxjErEhLHdGSuX3nI2c284DZ9XotcJcEbLnfw7dDr5rbuhpuNO/EwnvcQ9znL3+GNCv9MajtRs4yueN6kyefwg+ANqh5/ED1q/zyHNj1PmGwX+XMpkMFRspKk1zN/e3cBQqWbcuINZYx9EoHEXNFVxpucTfuX7O0d88CMo67oDry1byhs53/qI+YEfULtlGQB3vr6Wx+dvJlS+iRFSSakpIKelDHZ3b+m3H/9nGa9EJzgz/NP/O4a99SMatu99ebTukBWsodEzkK9Nn8CsH0zn26eO59aLjmyXz+exoiIb/9oOTv9FJGTv11+/kB25h1PFwMSwQcCsibnMGptD5NGENzcfv9dKsDjnhI9n6LijAMjP9kX7A+4MXszE8eMpkaFQ4ViI1/97Gbc++yEnu4u55NetY5SU0+wvalf/iLjX+wbjsTxUk5eQ5/Y/3cMwqWK3GcQuivjJBUcyPD+bLbddwD+/eQKfPWIoU0YXku33UBHOpam2nBk3PcRbS9dijOH9DeV80fMeI6QSb9yydhXzHuTsu95mELUMpIFA2BH61+ypbt0kYd6YWeFpXN/63ej+OjMKgDftYwGnobzMOw+AhfYkfhr8VjTvmSedmHBN+9IhmeVzviOfhJntv4mPs76PJQbbNzCaJzrPU1M14AwwA3ghPJ1SU8Dh1lZKTQE7GMxv
3edoYJaXneL0rRxkleLBxrjSVJjrJzfgxe+x2I1zz+aGj2GzGc7D4fOdc218q9vXkEmkjbh721ju+PNYcsvZTBldwJbmHKyGMiZKCS+HT8RgYSwvL9sn0YIfEefHvdMaiqnazJcenM+ywLcISBAz7CjWGCfWds+GpRzeGieY5fseY7u1ooErvW8wUirwvv9HKupbeOKtZWybfSfnvX8xAH8IXuZk3r1iLyU5tIZsnl+yg2vdqYnPtRZypLXFqe+jX8a0WR3JGMPp1jLu9d0Hn77QZfnZwRqavY6wigg3nX8YX5k2pl0+r0doJkCpKSBv4b1U7tnG0m1V1DUH2VnTHJ3vJ6doJBdMHs0q15VSGedHHTLvp9G3DdNQildsvHnFTqcfhdF8fw+fw2NfPw6AghwfLfiZ0Pwkl97wZ848dAirQyMpXTOf0uoG/ru0hD/4HmKgNCYIYqN/cEL9fR6LTa5LwcJgWRL18ZaZfHaaQTzgv5ep1jq2GkeIsnwx18FJBw/mr1+discSsnwe9pgCsk0jcwP/y5kvHs+bvzgT34vf5hrvLDbaw/lJ8Fuc3/J7ng6dwenWJzzsu5MlWd9haeAaAkEnQinyPEc6Fse40Ub/CM/gv/YpXNLyC77e+r80u6M459tH8oRr7QPcGryCS1p/xZthR/RXj7wYvIkjPvcllDAv4GWz7XxHo63YPEwmzj8eebtoqa/kYs87PO3/HQBr7NHRCeieDZ8KCKdOdO6BiFCT7TRQv/U+xpXeN9r53COrUR3e/CjfCV4PwAYzkgZrAOzI7Gm5OyNtxN2x3OPEfcBQBuX6Wba9mgry8TZX4JcwG8wITpk4uM3KO4LPY7GDIYQqtjBu9xwGSpMT0jbxHDbgiPuf//USI6WCqoggVXfeedgWYwwLNleyZO0mpopj8WdtfpMv/u5JnvP/ml/4niRLgjSaAB/6jnfL3/valcYYKhpamGEt5mbvk7B7Jef5llBp8lhtH8R4dtD82m8SRtO2hGx+6n2amZ4PMM99i8WbyxLKA2cw1azlO2kOhsmza2kNFLY7d1tG5Gdz4vgivtv6QzCGHfd/noqHv8Ci383glj/ewfe9/wXAO2AIAZ/FOtuJTlpuT2CLPZS54WPwtlRBpRPbnl/lvLVYI6Y4oyjxsMYNhfvqBTOiwjow24nsCONh9KAcpo4tZFZ4GkNMBate/Su3eh/lPM9Ctgw+nRftk3kw9Dn+EzqNt61pCfX3eYQtrnAhFh6L6JugZ9I53Bj8FrUmh7AR/hK+0Kmje+625Pg9LHNDJAFqTA5ne5Yw03qfQqlnzeSfUXfYlznttBnMsY9noDRylsfpyPWI4ZytdwKx8xfmOOf52D4MgJW20zAuNIfytn0MWb7Iz1h4NHxe9Lx/C18AQAX5jG3+JwuPvKVdXQtyOr6Gjhian9XhmJHhgdiUB9XkOh3Ta+/hDt9fo+llFET98a+GnYY5L+CNHm8IOMcmWk6f08Bw4ltdpJ6NZDl9aMCg3AC7PMOhOhZyaoyJ/sWndbSdamzb9HiZz97A23WW/oHXYyVa7rnOQzj94MGUb4690n/xszM45MSpfCNuTu7iAQFqm4KsaS7i8+Ey7vX/hWUcyrOTH+TmsaMpsR1xu9XnRLB8GD6ccdYumufcwyOvbWOEt45m46Vw4ECmHD2FzfZQ7A1vcciEcczb6aGpZCXZrWVMCG/mW7Idr2Xzm+BX+YXvSeYFbiBkLK5tvY637Cnk0EKTP5fdFDJs3u95ankdy2tzOGGEl0BTKfn5hSyyJ1JAHQvWbCVXmrnd9w8GST32Q3M5F5sl9iS+EryJW72P8uXFD/LWgo8o9Y1gfUshdeTwR992ak0OA+1GWh69kBcLJvNORT4TfJUUFhWzfk8tU6yNzLMM53pWsSXn3C6//2y/h6evmcY76yZw7xOf8mPfsxxqtuOTMGd4nAigZfYEJnt9BLwWa+xR4HHC9E5vvZtDZBszPEtZ+OTPWdwyiksa
/+VE1w2fHI1Qurz159z2xclceVxMOAe4AjGmyLn3U0YX8KF/Gsvs2Zy+5tfghefD0/nct5/HvuVVbgtd7pSVMyKh/h5L2OSGw64oOhdLhI1mJFe1/pTbzv0u7674gKktDyAYzpk8lqfOnsTYwR37wM88dAjPLT6eR7J/y4Ajz+PjrXXcMH0QX7v/VYb6W3jyi1dyAc5AtUPmHc1/wyczgEauC/6Ab3le4XrfcwA042f+jWdSkONnTFEOv634Kg+ELkw0YoAFPz+LG59bzuwVu9luhvB6+DMst51opitPHMP4wbn86uVVHU4JPDw/m3svm8LWikbuemPvb6IDAl7KiP2Wvtz6c341eB6HTP823veWELINTWRxb+j/8RNx5tl/OTyNdfYoQPif4Lc5Rjay3Dh1y8uKyc/68mbazDSQeO6sWCO06ffns6O6iaufWMiqyiLGb5zHM/ffQnPZJifsOWzTYLIYkJdH6biLWLV8AcXUkFtYTHPVbkb5agkUjCDkySIvJ4dDjzuT19fXcah3D0vWb6OlrpwheX5GZAcptCvxDTmEZ7dmk1+7jiFSRcvQY/B7oKW2nIq6JoqKh1Mf9uCp3MiR1haCuUMZcdiJVGSPZfYHSxjrKWdA3gAKh4wkHLYZ0FpK1qCRbK01DMzy8NkZZxMobh99lixpI+6ThuRFO1xKTDGjvM6w8r9dNZXpt2zkJOtTDjniGCafciGIcNCgHD7YWMFnxhRy/VkT+ew979LgxgrvMEWM/95/uHVoxP0g3Beayfe9L2Ib4anwWQTCrdzlf5Df8gDRNYGrgHdgSqRSuyDeO71NimnGz0s5X+Sxys/yec+HNJoALafdzKUHHcf1BdnUNge55YWVvF46lSu9b/CVyj+7H3YLKYNT3M2v+2NlPxD6PN/1vkxAwBoykTmXnsGldzdygrWao61NDAh/SsAXm9Lg6fAZfNv7Cid5VmHXrmam3/3hVwI+qDdZtODDRhh0wmXdvg8nTyjix4Ev8X7TkYw78njeWrGNL3jm8wvfkzwSOo8/i3Dc2EHcbB9Kpcnj3+EzAFhvRrHTDOK46jkc53zlvG8fyXS3Y/zNH59GfUuIKaMLEs5nWcI/vnkCE4c4+USEp797Gl+4+2fc6H2agiGj+ML3bke8Ht793zPYU9dMdWOQaeMHJZSTn+2jnHyOb76fHx09nSlDnMiMd+zJDMgbwM0XHMZ768t5Z10Zxx5U0KmwA4wpymXWdacCpwJwqevm/uXVF0cbIYCA18Mdl0zh+meu5d7LptD4r2X8M3wm13mfZ70ZxTWnTmCkG7Xy0Fen8tl73mUngzn/qGHMXuG4aF76/skMzPJxxQlj2FTWwJrddVwTvAFw4tN/M/NIjDEUD8jizEPbW90AM6eMxBjD8pIaLj9hdId5It/t9IlDOG79X6gijxBeqi+6GgYU8dCVn+GhdzdRUtXEM1Wncb33ORrI4sfB7/GFqWM5tbaFd9eBFI7jnrMn8dySEgLemOvloEE5nFJ1N15svuWZxSkzZtK2Jt+cPo4RBdlYljB6UA5Hjsjn32Wnc7a1mC+V/Ylm42OPKUTEkGc1Mai5HlbPgki7UA/4nDl0PNXu814BbL+La9wsp4JjVDRAuF6oJo+iypc5BuezjSZATkVsdDU+oDq2XW4GEmhaxYClTv/RDIAwUOP+RSiJ/Y7fCf+M0674aaffe0+R3nhNEZFzgXsBD/A3Y8xeg1GnTp1qFi1alNQ5Q2Gb389eQ27lSmYcexhTjjoqemxDaR2tIcPhI2IdP3XNQe59cz3XnTWRgVk+lm6r4urHF/LIJWPJHzyC8cUxX3BNU5BbX/6UBVurOKgwm8e/cQKzlu9kwZLFfH6CD98w53V5/Y5SyjcuYVpeGWXF03h03mquPdpQOOE4ho87jJCVRXl9C+MG5/LntzZwzmFDmDousWMPYFdNE9tKqzDNtSxZt5VjClvIzi/GXziSu597mxMDm9ktxVRXVzH+8OM4
edIQnt3k46zsNezYU8EZZ53P0OGjnUmVjCHg99DQ1MS/31nG6OwgI4YNY31jLhP9FXjzh7F20zYGh3Zz6DEnsmTdds46tIhA0RjK65oZOxCKBrWvY3fZUFrP8pJqHpj9MU9cex4jCh1x21PbzK6aZiaPymdzeQPbKhtZsWY9F42qo8w/kuxAFgVDRzE8P7uLM3TMprJ6DhqU024gTGfYtmFTeQMeSxhVmI3PY7G9spFg2E54FraUNzCmKCeli3FsKqtnTFEuxhi2VjZSVd/CkAEBDhqc2KFbUd+CxxIKcvxU1LdQXt/KIcMSwwONca4jP9uHz2N16jpKhu2VjeTn+Kisb+2wkZu3tpQPV23my9PGM3a4O/gtGKayoTUhxDKeuuYgy0tqEGDM4Nxoo7Y3mlrD7Khuory8jAkDWmnOGcnIwlw+KalmQJaXW/7+GqdYKxh7+HEsrCngokOzKRg0hEbPQBqrdpOf7ePDtSVQsoBjhngIDjuWVZUGf/YADh6WzxEHDaUq5OPtRSuxKzbw2VNP5qNdhpK1i5g+aRjZBcPYXB1k4fKVDPM2cubxR9OYNxaPwOqVSwjuXs2xh08iOPgI3li+jckDaxlZNJBg3nAa92xGsNlZG+LM4ycTGNhxw9sVIrLYGDO1w2OpFncR8QDrgLOBEmAh8GVjTKcrEKdC3BVFUTKNvYl7b3SoHg9sMMZsMsa0Av8CZnbxGUVRFCWF9Ia4jwTiw0hK3LQEROQaEVkkIovKynR5O0VRlFRywEIhjTEPGWOmGmOmFhcXd/0BRVEUpdv0hrjvgISO7lFumqIoirKf6A1xXwhMFJFxIuIHLgN0sUNFUZT9SMrj3I0xIRH5PvAaTijko8aYT1N9HkVRFKVzemUQkzFmNjC7y4yKoihKr5A2c8soiqIoMXplhOo+V0KkDOjpgpODgfIuc6UXes2ZgV5zZpDMNY8xxnQYbtgnxD0ZRGRRZyO00hW95sxArzkz6K1rVreMoihKGqLiriiKkoakg7g/dKArcADQa84M9Jozg1655n7vc1cURVHakw6Wu6IoitIGFXdFUZQ0pF+Lu4icKyJrRWSDiNx4oOuTKkRktIi8LSKrRORTEfmhmz5IRN4QkfXu/0I3XUTkT+73sFxEjj2wV9AzRMQjIktFZJa7P05EPnav69/uXEWISMDd3+AeH3tAK95DRKRARJ4VkTUislpETsyAe3y9+0yvFJGnRSQrHe+ziDwqIqUisjIubZ/vrYhc5eZfLyJX7Usd+q24uys+3Q+cBxwOfFlEDj+wtUoZIeAGY8zhwDTgWvfabgTmGmMmAnPdfXC+g4nu3zXAA/u/yinhh8DquP0/AHcbYw7GWaH2ajf9aqDKTb/bzdcfuRd41RhzKDAZ59rT9h6LyEjgOmCqMeZInLmnLiM97/PjQNuV5ffp3orIIOCXwAk4iyD9MtIgdAtjTL/8A04EXovbvwm46UDXq5eu9UWcZQvXAsPdtOHAWnf7rzhLGUbyR/P1lz+cqaHnAmcCs3CWKS4HvG3vN86kdCe62143nxzoa9jH680HNretd5rf48hCPoPc+zYL+Gy63mdgLLCyp/cW+DLw17j0hHxd/fVby51urvjU33FfRY8BPgaGGmN2uYd2A0Pd7XT4Lu4BfgLY7n4RUG2MCbn78dcUvV73eI2bvz8xDigDHnNdUX8TkVzS+B4bY3YAdwDbgF04920x6X2f49nXe5vUPe/P4p72iEge8BzwI2NMbfwx4zTlaRHHKiKfA0qNMYsPdF32I17gWOABY8wxQAOx13Qgve4xgOtSmInTsI0AcmnvusgI9se97c/intYrPomID0fY/2GMed5N3iMiw93jw4FSN72/fxcnAxeKyBacBdXPxPFHF4hIZFrq+GuKXq97PB+o2J8VTgElQIkx5mN3/1kcsU/XewxwFrDZGFNmjAkCz+Pc+3S+z/Hs671N6p73Z3FP2xWfRESAR4DVxpi74g69BER6zK/C
8cVH0q90e92nATVxr399HmPMTcaYUcaYsTj38S1jzBXA28DFbra21xv5Hi528/crC9cYsxvYLiKHuEkzgFWk6T122QZME5Ec9xmPXHPa3uc27Ou9fQ04R0QK3beec9y07nGgOx2S7LA4H1gHbAR+fqDrk8Lrmo7zyrYcWOb+nY/jb5wLrAfeBAa5+QUncmgjsAInGuGAX0cPr/10YJa7PR5YAGwAngECbnqWu7/BPT7+QNe7h9c6BVjk3ucXgMJ0v8fAr4E1wErgSSCQjvcZeBqnXyGI85Z2dU/uLfAN9/o3AF/flzro9AOKoihpSH92yyiKoiidoOKuKIqShqi4K4qipCEq7oqiKGmIiruiKEoaouKuKIqShqi4K4qipCH/H5e1qfGQxgMHAAAAAElFTkSuQmCC\n",
      "text/plain": [
       "<Figure size 432x288 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "# Generate recent 50 interval average\n",
    "average_reward = []\n",
    "for idx in range(len(rewards)):\n",
    "    avg_list = np.empty(shape=(1,), dtype=int)\n",
    "    if idx < 5:\n",
    "        avg_list = rewards[:idx+1]\n",
    "    else:\n",
    "        avg_list = rewards[idx-4:idx+1]\n",
    "    average_reward.append(np.average(avg_list))\n",
    "plt.plot(rewards)\n",
    "plt.plot(average_reward)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9f18bae5",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "44b0354e",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "58e2db1b",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8385f8b3",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c1d27da3",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "fb4df6e4",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
