{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "67576132",
   "metadata": {},
   "outputs": [],
   "source": [
    "from math import inf\n",
    "import numpy as np\n",
    "import scipy\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "import torch.optim as optim\n",
    "import gymnasium as gym\n",
    "import pandas as pd\n",
    "from datetime import datetime\n",
    "from sklearn.base import BaseEstimator\n",
    "from realkd.boosting import WeightUpdateMethod\n",
    "from pandas import qcut\n",
    "from realkd.rules import SquaredLoss, AdditiveRuleEnsemble, Rule\n",
    "from realkd.search import Context\n",
    "\n",
    "import warnings"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "8b8f01e2",
   "metadata": {},
   "outputs": [],
   "source": [
    "# warnings.filterwarnings('ignore')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "db545637",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n"
     ]
    }
   ],
   "source": [
    "# Create the CartPole-v1 environment; render_mode='rgb_array' is forwarded to gym.make.\n",
    "env = gym.make('CartPole-v1', render_mode='rgb_array')\n",
    "# Place torch modules and tensors on CUDA when it is available, otherwise on the CPU.\n",
    "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "print(device)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "7aa6c889",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Column labels of the DataFrame that wraps an observation before it is passed to the rule-based actor.\n",
    "# Presumably cart position, cart velocity, pole angle and pole angular velocity - TODO confirm.\n",
    "column_names = ['cp', 'cv', 'pa', 'pav']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "24f75485",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<torch._C.Generator at 0x7fa2de005430>"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Seed NumPy's global RNG; it is used further down to draw the seed of every env.reset call.\n",
    "np.random.seed(753894)\n",
    "# Seed torch's global RNG. As the last expression of the cell, the returned generator is displayed.\n",
    "torch.manual_seed(3921840)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "84732b72",
   "metadata": {},
   "outputs": [],
   "source": [
    "def orthonormalization(Q):\n",
    "    \"\"\"\n",
    "    Orthonormalise the columns of a matrix from left to right (classical Gram-Schmidt)\n",
    "\n",
    "    Every column has its projection onto the previously produced columns removed and is\n",
    "    then divided by its L-2 norm plus 1e-6, so a column that vanishes after the projection\n",
    "    becomes a (near) zero column instead of causing a division by zero.\n",
    "\n",
    "    :param Q: 2-d array of shape (n, k); k may be 0\n",
    "    :return: float array of shape (n, k); an empty (n, 0) array when Q has no columns\n",
    "    \"\"\"\n",
    "    n, k = Q.shape\n",
    "    O = np.zeros(shape=(n, k))\n",
    "    # Iterating over range(k) (instead of special-casing column 0 before the loop) makes a\n",
    "    # matrix without columns return an empty basis rather than raise IndexError on Q[:, 0].\n",
    "    for i in range(k):\n",
    "        q_orth = Q[:, i]\n",
    "        if i > 0:\n",
    "            # Subtract the component that lies in the span of the columns finished so far.\n",
    "            O_i = O[:, :i]\n",
    "            q_orth = q_orth - O_i.dot(O_i.T.dot(q_orth))\n",
    "        O[:, i] = q_orth / (norm(q_orth) + 1e-6)\n",
    "    return O"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "973f1f9b",
   "metadata": {},
   "outputs": [],
   "source": [
    "def softmax1(action, values, other_values, location):\n",
    "    \"\"\"\n",
    "    Softmax probability of the given action(s), evaluated row by row\n",
    "\n",
    "    The scores of the current model are inserted as column ``location`` into ``other_values``\n",
    "    to form the full score matrix; the softmax is taken over every row of that matrix.\n",
    "\n",
    "    :param action: column index (scalar) or one column index per row whose probability is returned\n",
    "    :param values: 1-d array with the scores of the current model, one per row\n",
    "    :param other_values: 2-d array with the scores of the remaining models, one row per sample\n",
    "    :param location: column position at which ``values`` is inserted\n",
    "    :return: 1-d array with the probability of ``action`` for every row\n",
    "    \"\"\"\n",
    "    all_values = np.insert(other_values, location, values, axis=1)\n",
    "    # exp() overflows to inf for large scores, which turned the ratio into inf / inf = nan.\n",
    "    # The softmax is invariant to a per-row shift, so subtract the row maximum first.\n",
    "    shifted = all_values - np.max(all_values, axis=1, keepdims=True)\n",
    "    exps = np.exp(shifted)\n",
    "    res = exps[np.arange(values.shape[0]), action] / np.sum(exps, axis=1)\n",
    "    return res\n",
    "\n",
    "def norm(x):\n",
    "    \"\"\"\n",
    "    Euclidean (L-2) length of an array\n",
    "    :param x: array supporting elementwise ``*`` and ``.sum()``\n",
    "    :return: square root of the sum of the squared entries of x\n",
    "    \"\"\"\n",
    "    squared_total = (x * x).sum()\n",
    "    return squared_total ** 0.5\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "5b0af6ac",
   "metadata": {},
   "outputs": [],
   "source": [
    "class PiLoss:\n",
    "    \"\"\"\n",
    "    Policy loss ``-log(pi(action)) * advantage`` seen from the score model of one action\n",
    "\n",
    "    The class is a singleton: every ``PiLoss()`` call returns the same object. All methods are\n",
    "    static; ``g`` and ``h`` are the first and second derivative terms with respect to the\n",
    "    score of the action identified by ``current``.\n",
    "    \"\"\"\n",
    "    _instance = None\n",
    "\n",
    "    def __new__(cls):\n",
    "        # Create the shared instance lazily on first use and hand it out ever after.\n",
    "        if cls._instance is None:\n",
    "            cls._instance = super().__new__(cls)\n",
    "        return cls._instance\n",
    "\n",
    "    @staticmethod\n",
    "    def __call__(action, values, advantage, other_values, current):\n",
    "        \"\"\"\n",
    "        :param action: the action chosen\n",
    "        :param values: the scores produced by the current model\n",
    "        :param advantage: the advantage each loss term is multiplied with\n",
    "        :param other_values: the scores produced by the other models\n",
    "        :param current: the action represented by the current model\n",
    "        :return: ``-log(p + 1e-6) * advantage`` where p is the softmax probability of ``action``\n",
    "        \"\"\"\n",
    "        likelihood = softmax1(action, values, other_values, current) + 1e-6\n",
    "        return -np.log(likelihood) * advantage\n",
    "\n",
    "    @staticmethod\n",
    "    def g(action, values, advantage, other_values, current):\n",
    "        \"\"\"First derivative term: ``-advantage * (1 - p)`` where action == current, else ``advantage * p``.\"\"\"\n",
    "        # p is the softmax probability of the action represented by the current model.\n",
    "        prob_current = softmax1(current, values, other_values, current)\n",
    "        when_taken = -advantage * (1 - prob_current)\n",
    "        when_not_taken = advantage * prob_current\n",
    "        return np.where(action == current, when_taken, when_not_taken)\n",
    "\n",
    "    @staticmethod\n",
    "    def h(action, values, advantage, other_values, current):\n",
    "        \"\"\"Second derivative term: ``advantage * p * (1 - p)`` (``action`` is not used).\"\"\"\n",
    "        prob_current = softmax1(current, values, other_values, current)\n",
    "        return advantage * prob_current * (1 - prob_current)\n",
    "\n",
    "    @staticmethod\n",
    "    def __repr__():\n",
    "        return 'pi_loss'\n",
    "\n",
    "    # str() and repr() give the same identifier.\n",
    "    __str__ = __repr__"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "67942365",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Registry that maps a string identifier to its loss object.\n",
    "loss_functions = dict(pi_loss=PiLoss())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "693287f4",
   "metadata": {},
   "outputs": [],
   "source": [
    "def loss_function(loss):\n",
    "    \"\"\"Resolve a loss specification to a loss object.\n",
    "\n",
    "    :param loss: a callable loss (returned unchanged) or a key of ``loss_functions``\n",
    "    :return: the loss object that corresponds to the input\n",
    "    \"\"\"\n",
    "    return loss if callable(loss) else loss_functions[loss]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "ae0af97c",
   "metadata": {},
   "outputs": [],
   "source": [
    "def calc_risk(loss, action, rules, states, reg, advantage, others, current):\n",
    "    \"\"\"Regularised risk of a rule ensemble: summed loss plus ``reg / 2`` times the squared rule weights.\n",
    "\n",
    "    :param loss: callable ``loss(action, scores, advantage, others, current)`` returning one value per sample\n",
    "    :param action: the actions handed to the loss\n",
    "    :param rules: iterable of rules exposing ``y``; also called as ``rules(states)`` to obtain the scores\n",
    "    :param states: the data the ensemble is evaluated on\n",
    "    :param reg: regularisation strength\n",
    "    :param advantage: forwarded to the loss\n",
    "    :param others: forwarded to the loss\n",
    "    :param current: forwarded to the loss\n",
    "    :return: the regularised risk\n",
    "    \"\"\"\n",
    "    rule_weights = np.array([member.y for member in rules])\n",
    "    data_term = sum(loss(action, rules(states), advantage, others, current))\n",
    "    penalty = reg * sum(rule_weights * rule_weights) / 2\n",
    "    return data_term + penalty"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "d06dc96b",
   "metadata": {},
   "outputs": [],
   "source": [
    "class FullyCorrectiveA2C:\n",
    "    \"\"\"\n",
    "    Fully corrective weight update: re-optimises the weights of all rules of an ensemble jointly\n",
    "\n",
    "    The objective is the summed loss of the ensemble scores plus ``reg / 2`` times the squared\n",
    "    weights. ``solver`` selects the optimiser: 'GD' (up to 50 normalised gradient steps with a line\n",
    "    search), 'Line' (one such step) or any method name accepted by ``scipy.optimize.minimize``.\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, loss='pi_loss', reg=1.0, solver='L-BFGS-B'):\n",
    "        \"\"\"\n",
    "        :param loss: loss object or string identifier resolved through ``loss_function``\n",
    "        :param reg: regularisation strength\n",
    "        :param solver: 'GD', 'Line' or a ``scipy.optimize.minimize`` method name\n",
    "        \"\"\"\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        self.solver = solver\n",
    "\n",
    "    @staticmethod\n",
    "    def get_risk(loss, action, q_mat, reg, advantage, others, current):\n",
    "        \"\"\"Return a function of the weights that evaluates the regularised risk for scores ``q_mat.dot(weights)``.\"\"\"\n",
    "        def sum_loss(weights):\n",
    "            return sum(loss(action, q_mat.dot(weights), advantage, others, current)) + reg * sum(weights * weights) / 2\n",
    "\n",
    "        return sum_loss\n",
    "\n",
    "    @staticmethod\n",
    "    def get_gradient(g, action, q_mat, reg, advantage, other, current):\n",
    "        \"\"\"Return a function of the weights that evaluates ``q_mat.T.dot(g(...)) + reg * weights``.\"\"\"\n",
    "        def gradient(weights):\n",
    "            grad_vec = g(action, q_mat.dot(weights), advantage, other, current)\n",
    "            return q_mat.T.dot(grad_vec) + reg * weights\n",
    "\n",
    "        return gradient\n",
    "\n",
    "    @staticmethod\n",
    "    def get_hessian(h, action, q_mat, reg, advantage, other, current):\n",
    "        \"\"\"Return a function of the weights that evaluates ``q_mat.T diag(h(...)) q_mat + reg * I``.\"\"\"\n",
    "        def hessian(weights):\n",
    "            h_vec = h(action, q_mat.dot(weights), advantage, other, current)\n",
    "            # Scale the columns of q_mat.T by h_vec instead of materialising a dense n x n diagonal\n",
    "            # matrix; the product is the same but needs O(n * k) instead of O(n * n) memory.\n",
    "            return (q_mat.T * h_vec).dot(q_mat) + reg * np.eye(len(weights))\n",
    "\n",
    "        return hessian\n",
    "\n",
    "    def calc_weight(self, data, action, rules, advantage, other, current):\n",
    "        \"\"\"\n",
    "        Compute new weights for all rules, starting from their current weights\n",
    "\n",
    "        :param data: the data every rule query is evaluated on\n",
    "        :param action: the actions handed to the loss (converted with ``np.array``)\n",
    "        :param rules: indexable collection of rules exposing ``q`` (callable on data) and ``y``\n",
    "        :param advantage: forwarded to the loss\n",
    "        :param other: forwarded to the loss\n",
    "        :param current: forwarded to the loss\n",
    "        :return: array with one weight per rule\n",
    "        \"\"\"\n",
    "        loss = self.loss\n",
    "        y = np.array(action)\n",
    "        # One column per rule; adding zeros turns the query output into a float vector.\n",
    "        q_mat = np.column_stack(\n",
    "            [rules[i].q(data) + np.zeros(len(data)) for i in range(len(rules))])\n",
    "        sum_loss = self.get_risk(loss, y, q_mat, self.reg, advantage, other, current)\n",
    "        gradient = self.get_gradient(loss.g, y, q_mat, self.reg, advantage, other, current)\n",
    "        # Start from the current rule weights. The explicit float dtype keeps the in-place updates\n",
    "        # below valid when the stored weights are integers.\n",
    "        w = np.array([r.y for r in rules], dtype=float)\n",
    "        # NOTE(review): GoldenRatioSearch is not defined or imported in the visible part of this\n",
    "        # notebook - confirm it is in scope before selecting the 'GD' or 'Line' solver.\n",
    "        if self.solver == 'GD':  # Gradient descent\n",
    "            # Pick a starting old_w that differs from w so that the loop is entered.\n",
    "            old_w = np.ones_like(w) * (1.0 if len(w) - sum(w) > 1e-5 else 2.0)\n",
    "            i = 0\n",
    "            while norm(old_w - w) > 1e-3 and i < 50:\n",
    "                old_w = np.array(w)\n",
    "                grad = gradient(w)\n",
    "                grad_norm = norm(grad)\n",
    "                if grad_norm == 0:\n",
    "                    break\n",
    "                p = -grad / grad_norm\n",
    "                w += GoldenRatioSearch(sum_loss, old_w, p, gradient).run() * p\n",
    "                i += 1\n",
    "        elif self.solver == 'Line':\n",
    "            grad = gradient(w)\n",
    "            grad_norm = norm(grad)\n",
    "            if grad_norm != 0:\n",
    "                p = -grad / grad_norm\n",
    "                distance = GoldenRatioSearch(sum_loss, w, p, gradient).run()\n",
    "                w += distance * p\n",
    "        else:\n",
    "            # Only the gradient is supplied; get_hessian(loss.h, ...) is available for solvers\n",
    "            # that accept a hess argument.\n",
    "            w = scipy.optimize.minimize(sum_loss, w, method=self.solver, jac=gradient,\n",
    "                                        options={'disp': False}).x\n",
    "\n",
    "        return w"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "2d0c04a8",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ObjectFunction:\n",
    "    \"\"\"\n",
    "    Base class of rule-search objectives built from the per-sample loss derivatives\n",
    "\n",
    "    The constructor evaluates the derivative terms ``g`` and ``h`` (plus 1e-6) of the loss and\n",
    "    stores them, the data and the target sorted by descending ``g / h``. Subclasses implement\n",
    "    ``__call__`` (objective value of an extension) and ``bound``.\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, data, target, predictions, loss, reg, advantage, other_values, current, rules=None):\n",
    "        \"\"\"\n",
    "        :param data: DataFrame with one row per sample\n",
    "        :param target: pandas Series aligned with data\n",
    "        :param predictions: current scores, or None for zeros shaped like target\n",
    "        :param loss: loss object or identifier resolved through ``loss_function``\n",
    "        :param reg: regularisation strength\n",
    "        :param advantage: forwarded to the loss derivatives\n",
    "        :param other_values: forwarded to the loss derivatives\n",
    "        :param current: forwarded to the loss derivatives\n",
    "        :param rules: accepted for signature compatibility; not used here\n",
    "        \"\"\"\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        if predictions is None:\n",
    "            predictions = np.zeros_like(target)\n",
    "        grad = np.array(self.loss.g(target, predictions, advantage, other_values, current))\n",
    "        hess = np.array(self.loss.h(target, predictions, advantage, other_values, current)) + 1e-6\n",
    "        # Indices that sort the samples by descending ratio g / h.\n",
    "        descending = np.argsort(grad / hess)[::-1]\n",
    "        self.g = grad[descending]\n",
    "        self.h = hess[descending]\n",
    "        self.data = data.iloc[descending].reset_index(drop=True)\n",
    "        self.target = target.iloc[descending].reset_index(drop=True)\n",
    "        self.n = len(target)\n",
    "\n",
    "    def __call__(self, ext):\n",
    "        raise NotImplementedError()\n",
    "\n",
    "    def bound(self, ext):\n",
    "        raise NotImplementedError()\n",
    "\n",
    "    def search(self, method='greedy', verbose=False, **search_params):\n",
    "        \"\"\"Build a realkd search context from the sorted data and run the selected search method.\n",
    "\n",
    "        :param method: key of ``realkd.search.search_methods``\n",
    "        :param verbose: verbosity; a value of 2 or more also reports the size of the context\n",
    "        :param search_params: forwarded to ``Context.from_df`` and to the search method\n",
    "        :return: whatever the ``run()`` method of the search returns\n",
    "        \"\"\"\n",
    "        from realkd.search import search_methods\n",
    "        context = Context.from_df(self.data, **search_params)\n",
    "        if verbose >= 2:\n",
    "            print(\n",
    "                f'Created search context with {len(context.attributes)} attributes')\n",
    "        searcher = search_methods[method](context, self, self.bound, verbose=verbose, **search_params)\n",
    "        return searcher.run()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "eaec4413",
   "metadata": {},
   "outputs": [],
   "source": [
    "class OrthogonalBoostingObjective(ObjectFunction):\n",
    "    \"\"\"\n",
    "    Search objective that relates the loss gradient captured by a query to the part of the query\n",
    "    that is orthogonal to the rules already in the ensemble\n",
    "\n",
    "    Samples are sorted by descending gradient. When rules are present, the gradient is projected\n",
    "    onto the orthogonal complement of the span of ``orth_basis`` (passed as keyword argument, one\n",
    "    row per sample in the original order).\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, data, target, advantage, other_values, current, predictions=None, loss=SquaredLoss, reg=1.0,\n",
    "                 rules=None,\n",
    "                 epsilon=1e-4, **kwargs):\n",
    "        \"\"\"\n",
    "        :param data: DataFrame with one row per sample\n",
    "        :param target: pandas Series aligned with data\n",
    "        :param advantage: forwarded to the loss derivatives\n",
    "        :param other_values: forwarded to the loss derivatives\n",
    "        :param current: forwarded to the loss derivatives\n",
    "        :param predictions: current scores, or None for zeros shaped like target\n",
    "        :param loss: loss object or identifier resolved through ``loss_function``\n",
    "        :param reg: regularisation strength\n",
    "        :param rules: rules already selected, or None for no rules\n",
    "        :param epsilon: constant added to the denominator of the objective when rules are present\n",
    "        :param kwargs: must contain ``orth_basis`` when rules is not empty\n",
    "        \"\"\"\n",
    "        super().__init__(data, target, predictions, loss, reg, advantage, other_values, current, rules)\n",
    "        self.rules = [] if rules is None else rules\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        self.epsilon = epsilon\n",
    "        predictions = np.zeros_like(\n",
    "            target) if predictions is None else predictions\n",
    "        g = np.array(self.loss.g(target, predictions, advantage, other_values, current))\n",
    "        h = np.array(self.loss.h(target, predictions, advantage, other_values, current)) + 1e-6\n",
    "        self.n = len(target)\n",
    "        order = np.argsort(g)[::-1]\n",
    "        self.g = g[order]\n",
    "        # The base class stored h sorted by g / h; re-sort it with the order used here so that\n",
    "        # self.h[ext] refers to the same rows as self.g[ext] and self.data.\n",
    "        self.h = h[order]\n",
    "        self.data = data.iloc[order].reset_index(drop=True)\n",
    "        self.target = target.iloc[order].reset_index(drop=True)\n",
    "        # Test self.rules (never None) rather than the raw argument, which defaults to None.\n",
    "        if len(self.rules) != 0:\n",
    "            orth_basis = kwargs['orth_basis']\n",
    "            self.orth_basis = orth_basis[order]\n",
    "            # Bracketing B @ (B.T @ g) avoids forming the n x n matrix B @ B.T.\n",
    "            self.g = self.g - self.orth_basis @ (self.orth_basis.T @ self.g)\n",
    "        else:\n",
    "            self.orth_basis = np.zeros(self.n)\n",
    "\n",
    "    def __call__(self, ext):\n",
    "        \"\"\"\n",
    "        Objective value of an extension (row indices into the sorted data)\n",
    "\n",
    "        Returns -inf for an empty extension. Without rules the value is ``|sum g| / sqrt(sum h)``;\n",
    "        with rules it is ``|sum g| / (orthogonal norm + epsilon)``, or 0 when that norm is at most 1e-4.\n",
    "        \"\"\"\n",
    "        if len(ext) == 0:\n",
    "            return -inf\n",
    "        g_q = self.g[ext]\n",
    "        if len(self.rules) == 0:\n",
    "            h_q = self.h[ext]\n",
    "            return abs(g_q.sum()) / np.sqrt(h_q.sum())\n",
    "        length = self.fast_orth_norm(ext)\n",
    "        if length > 1e-4:\n",
    "            obj = abs(g_q.sum()) / (length + self.epsilon)\n",
    "        else:\n",
    "            obj = 0\n",
    "        return obj\n",
    "\n",
    "    def fast_orth_norm(self, ext):\n",
    "        \"\"\"Return ``sqrt(|len(ext) - sum_j (sum of basis column j over ext) ** 2|)``.\"\"\"\n",
    "        deltas = self.orth_basis[ext]\n",
    "        length = len(ext)\n",
    "        okqi = abs(np.sum(deltas, axis=0))\n",
    "        q_para_norms = (okqi ** 2).sum()\n",
    "        q_orth_norms_sq = np.abs(length - q_para_norms)\n",
    "        return np.sqrt(q_orth_norms_sq)\n",
    "\n",
    "    def fast_para_norms_prefix(self, ext):\n",
    "        \"\"\"Return the quantity of ``fast_orth_norm`` for every prefix of ``ext``, using cumulative sums.\"\"\"\n",
    "        deltas = self.orth_basis[ext]\n",
    "        length = len(ext)\n",
    "        okqi = np.cumsum(deltas, axis=0)\n",
    "        q_para_norms = (okqi ** 2).sum(axis=1)\n",
    "        q_orth_norms_sq = np.abs(np.arange(1, length + 1) - q_para_norms)\n",
    "        q_orth_norms = np.sqrt(q_orth_norms_sq)\n",
    "        return q_orth_norms\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "626cceb7",
   "metadata": {},
   "outputs": [],
   "source": [
    "class GeneralRuleBoostingEstimator(BaseEstimator):\n",
    "    \"\"\"\n",
    "    Boosting estimator that grows an additive rule ensemble one rule at a time\n",
    "\n",
    "    Every round searches a query with the objective, appends it as a rule, extends an orthonormal\n",
    "    basis of the query vectors and lets the weight update method recompute all rule weights.\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, num_rules, objective_function, weight_update_method, loss='squared', reg=1.0,\n",
    "                 search='greedy', max_col_attr=10,\n",
    "                 search_params=None, verbose=False):\n",
    "        \"\"\"\n",
    "        :param num_rules: number of rules at which fitting stops\n",
    "        :param objective_function: objective class instantiated in every boosting round\n",
    "        :param weight_update_method: object providing ``calc_weight``; its ``loss`` and ``reg`` are overwritten\n",
    "        :param loss: loss object or identifier resolved through ``loss_function``\n",
    "        :param reg: regularisation strength\n",
    "        :param search: name of the search method handed to the objective\n",
    "        :param max_col_attr: used in the default search parameters\n",
    "        :param search_params: search parameters; None selects the defaults built below\n",
    "        :param verbose: print every rule as it is added\n",
    "        \"\"\"\n",
    "        if search_params is None:\n",
    "            search_params = {'order': 'bestboundfirst', 'apx': 1.0, 'max_depth': None, 'discretization': qcut,\n",
    "                             'max_col_attr': max_col_attr}\n",
    "        self.num_rules = num_rules\n",
    "        # Upper limit for the accumulated component count (1 + len(query) per rule) in fit.\n",
    "        self.num_components = 500\n",
    "        self.objective = objective_function\n",
    "        self.objective_function = objective_function\n",
    "        self.max_col_attr = max_col_attr\n",
    "        self.weight_update_method = weight_update_method\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        # Hand over the resolved loss object: the weight update reads loss.g, which a raw string\n",
    "        # identifier does not provide.\n",
    "        self.weight_update_method.loss = self.loss\n",
    "        self.weight_update_method.reg = reg\n",
    "        self.verbose = verbose\n",
    "        self.search = search\n",
    "        self.rules_ = AdditiveRuleEnsemble([])\n",
    "        self.search_params = search_params\n",
    "        self.history = []\n",
    "        self.time = []\n",
    "\n",
    "    def set_reg(self, reg):\n",
    "        \"\"\"Set the regularisation strength on the estimator, the objective and the weight update method.\"\"\"\n",
    "        self.reg = reg\n",
    "        self.objective.reg = reg\n",
    "        self.weight_update_method.reg = reg\n",
    "\n",
    "    def fit(self, data, target, advantage, other_values, current, has_origin_rules=False, verbose=False):\n",
    "        \"\"\"\n",
    "        Add rules until ``num_rules`` rules or ``num_components`` components are reached\n",
    "\n",
    "        :param data: DataFrame with one row per sample\n",
    "        :param target: target values handed to the objective and the weight update\n",
    "        :param advantage: forwarded to the objective and the weight update\n",
    "        :param other_values: forwarded to the objective and the weight update\n",
    "        :param current: forwarded to the objective and the weight update\n",
    "        :param has_origin_rules: keep the rules already in ``rules_`` and continue from them\n",
    "        :param verbose: verbosity of the rule search\n",
    "        :return: self\n",
    "        \"\"\"\n",
    "        if has_origin_rules and len(self.rules_) > 0:\n",
    "            q_mat = np.column_stack(\n",
    "                [self.rules_[i].q(data) + np.zeros(len(data)) for i in range(len(self.rules_))])\n",
    "            orth_basis = orthonormalization(q_mat)\n",
    "        else:\n",
    "            if not has_origin_rules:\n",
    "                self.history = []\n",
    "                self.time = []\n",
    "                self.rules_.members = []\n",
    "            # Also reached when has_origin_rules is set but the ensemble is empty, where\n",
    "            # np.column_stack would fail on an empty list.\n",
    "            orth_basis = np.array([])\n",
    "        num_components = 0\n",
    "        while len(self.rules_) < self.num_rules and num_components < self.num_components:\n",
    "            start_time = datetime.now()\n",
    "            # Search for a rule\n",
    "            scores = self.rules_(data)\n",
    "            obj = self.objective(data, target, advantage, other_values, current, predictions=scores,\n",
    "                                 loss=self.loss, reg=self.reg, rules=self.rules_, orth_basis=orth_basis)\n",
    "            q = obj.search(method=self.search, verbose=verbose,\n",
    "                           **self.search_params)\n",
    "            if hasattr(self.objective, 'opt_weight') and callable(getattr(self.objective, 'opt_weight')):\n",
    "                y = obj.opt_weight(q)\n",
    "            else:\n",
    "                # Placeholder weight; all weights are recomputed below.\n",
    "                y = 1.0\n",
    "            q_vec = q(data)\n",
    "            num_components += (1 + len(q))\n",
    "            # Extend the orthonormal basis with the normalised part of q_vec that is orthogonal to it.\n",
    "            if len(orth_basis) == 0:\n",
    "                basis = q_vec / norm(q_vec)\n",
    "                orth_basis = np.array([basis]).T\n",
    "            else:\n",
    "                basis = q_vec - orth_basis.dot(orth_basis.T.dot(q_vec))\n",
    "                basis = basis / (norm(basis) + 1e-6)\n",
    "                orth_basis = np.hstack((orth_basis, np.array([basis]).T))\n",
    "            rule = Rule(q, y)\n",
    "            if self.verbose:\n",
    "                print(rule)\n",
    "            self.rules_.append(rule)\n",
    "            # Calculate weights\n",
    "            weights = self.weight_update_method.calc_weight(\n",
    "                data, target, self.rules_, advantage, other_values, current)\n",
    "            for i in range(len(self.rules_)):\n",
    "                self.rules_[i].y = weights[i]\n",
    "            # Keep a snapshot of the ensemble and the duration of this round.\n",
    "            self.history.append(AdditiveRuleEnsemble(\n",
    "                [Rule(q=rule.q, y=rule.y) for rule in self.rules_.members]))\n",
    "            end_time = datetime.now()\n",
    "            self.time.append(str(end_time - start_time))\n",
    "        return self\n",
    "\n",
    "    def predict(self, data):\n",
    "        \"\"\"Map the ensemble scores to predictions through ``loss.predictions``.\n",
    "\n",
    "        The loss must provide a ``predictions`` method; the PiLoss defined in this notebook does not.\n",
    "        \"\"\"\n",
    "        loss = loss_function(self.loss)\n",
    "        # The method name was misspelled as 'preidictions', which no loss provides.\n",
    "        return loss.predictions(self.rules_(data))\n",
    "\n",
    "    def decision_function(self, data):\n",
    "        \"\"\"Return the raw ensemble scores for data.\"\"\"\n",
    "        return self.rules_(data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "b50ce787",
   "metadata": {},
   "outputs": [],
   "source": [
    "# class Actor(nn.Module):\n",
    "#     def __init__(self, action_space, node=16):\n",
    "#         super(Actor, self).__init__()\n",
    "#         self.fc1 = nn.Linear(4, node)  \n",
    "# #         self.fc1_ = nn.Linear(node, node)\n",
    "#         self.fc2 = nn.Linear(node, action_space)\n",
    "\n",
    "#     def forward(self, state):\n",
    "#         x = F.relu(self.fc1(state))\n",
    "# #         x = F.relu(self.fc1_(x))\n",
    "#         x = self.fc2(x)\n",
    "#         return x"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "84b0ee0a",
   "metadata": {},
   "outputs": [],
   "source": [
    "def copy_rules(origin_rules):\n",
    "    \"\"\"Return a new AdditiveRuleEnsemble holding a fresh Rule (same q and y) for every rule of the input.\"\"\"\n",
    "    originals = (origin_rules[pos] for pos in range(len(origin_rules)))\n",
    "    return AdditiveRuleEnsemble([Rule(q=member.q, y=member.y) for member in originals])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "bb3fcc8c",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ActorRule():\n",
    "    \"\"\"\n",
    "    Rule-based actor: one boosted rule ensemble per action whose scores act as the action logits\n",
    "\n",
    "    ``model`` holds the estimators used by ``__call__`` (reg=0.3, max_col_attr=10); ``best_model``\n",
    "    holds a second set used by ``predict`` (reg=0.01, max_col_attr=20).\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, action_space=2, num_rules=12):\n",
    "        self.action_space = action_space\n",
    "        self.model = [self._new_estimator(num_rules, reg=0.3, max_col_attr=10)\n",
    "                      for _ in range(action_space)]\n",
    "        self.best_model = [self._new_estimator(num_rules, reg=0.01, max_col_attr=20)\n",
    "                           for _ in range(action_space)]\n",
    "\n",
    "    @staticmethod\n",
    "    def _new_estimator(num_rules, reg, max_col_attr):\n",
    "        \"\"\"Build one greedy-search estimator with the orthogonal objective and the PiLoss.\"\"\"\n",
    "        return GeneralRuleBoostingEstimator(num_rules=num_rules, objective_function=OrthogonalBoostingObjective,\n",
    "                                            weight_update_method=FullyCorrectiveA2C(), loss=PiLoss(),\n",
    "                                            reg=reg, search='greedy', max_col_attr=max_col_attr, verbose=False)\n",
    "\n",
    "    def __call__(self, state):\n",
    "        \"\"\"Scores of the ``model`` ensembles for state, stacked with one row per action.\"\"\"\n",
    "        return np.array([self.model[idx].rules_(state) for idx in range(len(self.model))])\n",
    "\n",
    "    def predict(self, state):\n",
    "        \"\"\"Scores of the ``best_model`` ensembles for state, stacked with one row per action.\"\"\"\n",
    "        return np.array([self.best_model[idx].rules_(state) for idx in range(len(self.model))])\n",
    "\n",
    "\n",
    "def update_rules(estimator: GeneralRuleBoostingEstimator, x, y, adv, other_values, current):\n",
    "    \"\"\"\n",
    "    Replace the weakest rule of an estimator and keep the result only if the risk does not increase\n",
    "\n",
    "    Rules with the same query text are merged by summing their weights. The query with the smallest\n",
    "    absolute merged weight is dropped, the remaining weights are refitted, the estimator is fitted\n",
    "    further starting from the remaining rules and all weights are refitted again. If the resulting\n",
    "    risk exceeds the risk of the original ensemble, the original rules are restored.\n",
    "\n",
    "    :param estimator: the estimator whose ``rules_`` are updated in place\n",
    "    :param x: the data\n",
    "    :param y: the actions used as target\n",
    "    :param adv: the advantages\n",
    "    :param other_values: the scores of the other models\n",
    "    :param current: the action represented by this estimator\n",
    "    :return: the estimator\n",
    "    \"\"\"\n",
    "    def refit_weights(ensemble):\n",
    "        # Recompute all weights of the ensemble jointly and store them on its rules.\n",
    "        fitted = FullyCorrectiveA2C(loss_function('pi_loss'), estimator.reg).calc_weight(\n",
    "            x, y, ensemble, adv, other_values, current)\n",
    "        for pos in range(len(ensemble)):\n",
    "            ensemble[pos].y = fitted[pos]\n",
    "\n",
    "    backup = copy_rules(estimator.rules_)\n",
    "    origin_risk = calc_risk(PiLoss(), y, backup, x, estimator.reg, adv, other_values, current)\n",
    "\n",
    "    # Merge rules that share a query text; remember the distinct queries in first-seen order.\n",
    "    merged = {}\n",
    "    distinct = []\n",
    "    for pos in range(len(estimator.rules_)):\n",
    "        key = str(estimator.rules_[pos].q)\n",
    "        if key in merged:\n",
    "            merged[key] += estimator.rules_[pos].y\n",
    "        else:\n",
    "            merged[key] = estimator.rules_[pos].y\n",
    "            distinct.append(estimator.rules_[pos].q)\n",
    "    merged = {key: abs(weight) for key, weight in merged.items()}\n",
    "\n",
    "    # Drop the query with the smallest absolute weight, but never end up with no rule at all.\n",
    "    weakest = min(merged, key=merged.get)\n",
    "    kept = [Rule(q=query, y=merged[str(query)]) for query in distinct if str(query) != weakest]\n",
    "    if len(kept) == 0:\n",
    "        kept = [Rule(q=distinct[0], y=merged[str(distinct[0])])]\n",
    "\n",
    "    pruned = AdditiveRuleEnsemble(kept)\n",
    "    refit_weights(pruned)\n",
    "    estimator.rules_ = pruned\n",
    "    estimator.fit(x, y, adv, other_values, current, has_origin_rules=True)\n",
    "    refit_weights(estimator.rules_)\n",
    "\n",
    "    new_risk = calc_risk(PiLoss(), y, estimator.rules_, x, estimator.reg, adv, other_values, current)\n",
    "    if new_risk > origin_risk:\n",
    "        estimator.rules_ = copy_rules(backup)\n",
    "        print(\"origin\", origin_risk, 'new', new_risk, 'not updated')\n",
    "    return estimator"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "2824981f",
   "metadata": {},
   "outputs": [],
   "source": [
    "class Critic(nn.Module):\n",
    "    \"\"\"State-value network: Linear(4, node) -> ReLU -> Linear(node, 1).\"\"\"\n",
    "\n",
    "    def __init__(self, node=16):\n",
    "        \"\"\"\n",
    "        :param node: width of the hidden layer\n",
    "        \"\"\"\n",
    "        super().__init__()\n",
    "        self.fc1 = nn.Linear(4, node)\n",
    "        self.fc2 = nn.Linear(node, 1)\n",
    "\n",
    "    def forward(self, state):\n",
    "        \"\"\"Return one value per input row; ``state`` has 4 features in its last dimension.\"\"\"\n",
    "        hidden = self.fc1(state)\n",
    "        hidden = F.relu(hidden)\n",
    "        return self.fc2(hidden)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "6b6e2dd7",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Discount factor applied when the discounted returns are accumulated in the training loops.\n",
    "gamma = 0.99\n",
    "# Rule-based actor with its default settings (2 actions, 12 rules per action).\n",
    "actor = ActorRule()\n",
    "# Value network on the selected device, with its own AdamW optimizer.\n",
    "critic = Critic().to(device)\n",
    "critic_optimizer = optim.AdamW(critic.parameters(), lr=0.001)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "ae072cc5",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ActorNet(nn.Module):\n",
    "    \"\"\"Policy network that maps a 4-feature state to 2 action logits through one hidden ReLU layer.\"\"\"\n",
    "\n",
    "    def __init__(self, hidden_dim=16):\n",
    "        \"\"\"\n",
    "        :param hidden_dim: width of the hidden layer\n",
    "        \"\"\"\n",
    "        super().__init__()\n",
    "        self.hidden = nn.Linear(4, hidden_dim)\n",
    "        self.output = nn.Linear(hidden_dim, 2)\n",
    "\n",
    "    def forward(self, s):\n",
    "        \"\"\"Return the unnormalised action logits for the state(s) s.\"\"\"\n",
    "        activated = F.relu(self.hidden(s))\n",
    "        return self.output(activated)\n",
    "\n",
    "\n",
    "# Neural actor used by the torch training loop of the next cell.\n",
    "actor_func = ActorNet().to(device)\n",
    "# value_func is an alias of the critic created above, not a second network.\n",
    "value_func = critic"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "c565d5ef",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 0 with rewards 22.0\n",
      "Run episode 1 with rewards 11.0\n",
      "Run episode 2 with rewards 13.0\n",
      "Run episode 3 with rewards 13.0\n",
      "Run episode 4 with rewards 13.0\n",
      "Run episode 5 with rewards 13.0\n",
      "Run episode 6 with rewards 14.0\n",
      "Run episode 7 with rewards 9.0\n",
      "Run episode 8 with rewards 10.0\n",
      "Run episode 9 with rewards 11.0\n",
      "Run episode 10 with rewards 12.0\n",
      "Run episode 11 with rewards 53.0\n",
      "Run episode 12 with rewards 12.0\n",
      "Run episode 13 with rewards 10.0\n",
      "Run episode 14 with rewards 18.0\n",
      "Run episode 15 with rewards 18.0\n",
      "Run episode 16 with rewards 12.0\n",
      "Run episode 17 with rewards 15.0\n",
      "Run episode 18 with rewards 13.0\n",
      "Run episode 19 with rewards 14.0\n",
      "Run episode 20 with rewards 12.0\n",
      "Run episode 21 with rewards 18.0\n",
      "Run episode 22 with rewards 26.0\n",
      "Run episode 23 with rewards 18.0\n",
      "Run episode 24 with rewards 10.0\n",
      "Run episode 25 with rewards 14.0\n",
      "Run episode 26 with rewards 21.0\n",
      "Run episode 27 with rewards 12.0\n",
      "Run episode 28 with rewards 16.0\n",
      "Run episode 29 with rewards 14.0\n",
      "Run episode 30 with rewards 19.0\n",
      "Run episode 31 with rewards 10.0\n",
      "Run episode 32 with rewards 24.0\n",
      "Run episode 33 with rewards 18.0\n",
      "Run episode 34 with rewards 14.0\n",
      "Run episode 35 with rewards 9.0\n",
      "Run episode 36 with rewards 13.0\n",
      "Run episode 37 with rewards 13.0\n",
      "Run episode 38 with rewards 24.0\n",
      "Run episode 39 with rewards 11.0\n",
      "Run episode 40 with rewards 15.0\n",
      "Run episode 41 with rewards 12.0\n",
      "Run episode 42 with rewards 17.0\n",
      "Run episode 43 with rewards 10.0\n",
      "Run episode 44 with rewards 13.0\n",
      "Run episode 45 with rewards 12.0\n",
      "Run episode 46 with rewards 10.0\n",
      "Run episode 47 with rewards 23.0\n",
      "Run episode 48 with rewards 18.0\n",
      "Run episode 49 with rewards 15.0\n",
      "Run episode 50 with rewards 16.0\n",
      "Run episode 51 with rewards 12.0\n",
      "Run episode 52 with rewards 22.0\n",
      "Run episode 53 with rewards 11.0\n",
      "Run episode 54 with rewards 13.0\n",
      "Run episode 55 with rewards 13.0\n",
      "Run episode 56 with rewards 12.0\n",
      "Run episode 57 with rewards 30.0\n",
      "Run episode 58 with rewards 16.0\n",
      "Run episode 59 with rewards 21.0\n",
      "Run episode 60 with rewards 13.0\n",
      "Run episode 61 with rewards 9.0\n",
      "Run episode 62 with rewards 13.0\n",
      "Run episode 63 with rewards 10.0\n",
      "Run episode 64 with rewards 11.0\n",
      "Run episode 65 with rewards 12.0\n",
      "Run episode 66 with rewards 14.0\n",
      "Run episode 67 with rewards 15.0\n",
      "Run episode 68 with rewards 18.0\n",
      "Run episode 69 with rewards 13.0\n",
      "Run episode 70 with rewards 11.0\n",
      "Run episode 71 with rewards 14.0\n",
      "Run episode 72 with rewards 12.0\n",
      "Run episode 73 with rewards 9.0\n",
      "Run episode 74 with rewards 9.0\n",
      "Run episode 75 with rewards 12.0\n",
      "Run episode 76 with rewards 17.0\n",
      "Run episode 77 with rewards 8.0\n",
      "Run episode 78 with rewards 22.0\n",
      "Run episode 79 with rewards 20.0\n"
     ]
    }
   ],
   "source": [
    "# opt1 updates value_func, which is the same network as critic; critic_optimizer already covers\n",
    "# these parameters, so the critic ends up with two independent AdamW optimizers.\n",
    "opt1 = torch.optim.AdamW(value_func.parameters(), lr=0.001)\n",
    "# opt2 updates the neural actor.\n",
    "opt2 = torch.optim.AdamW(actor_func.parameters(), lr=0.001)\n",
    "def pick_sample(s):\n",
    "    \"\"\"Sample one action for state s from the softmax policy of the neural actor ``actor_func``.\n",
    "\n",
    "    A later cell of this notebook defines another ``pick_sample`` that rebinds this name.\n",
    "\n",
    "    :param s: a single state with 4 features\n",
    "    :return: the sampled action index as a Python int\n",
    "    \"\"\"\n",
    "    with torch.no_grad():\n",
    "        # Add a batch dimension: (4,) --> (1, 4)\n",
    "        batch = torch.tensor(np.expand_dims(s, axis=0), dtype=torch.float).to(device)\n",
    "        # Logits of the single batch entry: (1, 2) --> (2,)\n",
    "        logits = actor_func(batch).squeeze(dim=0)\n",
    "        # Turn the logits into probabilities and draw one action from them\n",
    "        probs = F.softmax(logits, dim=-1)\n",
    "        choice = torch.multinomial(probs, num_samples=1)\n",
    "        return choice.tolist()[0]\n",
    "# Total reward of every episode, in episode order.\n",
    "reward_records = []\n",
    "for i in range(80):\n",
    "    #\n",
    "    # Run episode till done\n",
    "    #\n",
    "    done = False\n",
    "    states = []\n",
    "    actions = []\n",
    "    rewards = []\n",
    "    # Every episode is reset with a seed drawn from the NumPy RNG seeded at the top of the notebook.\n",
    "    s, _ = env.reset(seed=np.random.randint(0, 1e6))\n",
    "    while not done:\n",
    "        states.append(s.tolist())\n",
    "        a = pick_sample(s)\n",
    "        s, r, term, trunc, _ = env.step(a)\n",
    "        # The episode ends on termination as well as on truncation.\n",
    "        done = term or trunc\n",
    "        actions.append(a)\n",
    "        rewards.append(r)\n",
    "\n",
    "    #\n",
    "    # Get cumulative rewards\n",
    "    #\n",
    "    # Discounted return, accumulated backwards: G[j] = r[j] + gamma * G[j+1], with G = 0 after the last step.\n",
    "    cum_rewards = np.zeros_like(rewards)\n",
    "    reward_len = len(rewards)\n",
    "    for j in reversed(range(reward_len)):\n",
    "        cum_rewards[j] = rewards[j] + (cum_rewards[j+1]*gamma if j+1 < reward_len else 0)\n",
    "\n",
    "    #\n",
    "    # Train (optimize parameters)\n",
    "    #\n",
    "\n",
    "    # Optimize value loss (Critic): summed squared error between the predicted values and the returns\n",
    "    opt1.zero_grad()\n",
    "    states = torch.tensor(states, dtype=torch.float).to(device)\n",
    "    cum_rewards = torch.tensor(cum_rewards, dtype=torch.float).to(device)\n",
    "    values = value_func(states)\n",
    "    values = values.squeeze(dim=1)\n",
    "    vf_loss = F.mse_loss(\n",
    "        values,\n",
    "        cum_rewards,\n",
    "        reduction=\"none\")\n",
    "    vf_loss.sum().backward()\n",
    "    opt1.step()\n",
    "\n",
    "    # Todo 2; RULE BASED UPDATES\n",
    "    # Optimize policy loss (Actor). The values are re-evaluated with the critic updated just above,\n",
    "    # without gradient tracking, so the advantages are constants for the actor update.\n",
    "    with torch.no_grad():\n",
    "        values = value_func(states).squeeze(dim=1)\n",
    "    opt2.zero_grad()\n",
    "    actions = torch.tensor(actions, dtype=torch.int64).to(device)\n",
    "    advantages = cum_rewards - values\n",
    "#     print(advantages)\n",
    "    logits = actor_func(states)\n",
    "    # cross_entropy with reduction=\"none\" is -log softmax(logits)[action]; negating it gives the log-probability.\n",
    "    log_probs = -F.cross_entropy(logits, actions, reduction=\"none\")\n",
    "    pi_loss = -log_probs * advantages\n",
    "    pi_loss.sum().backward()\n",
    "    opt2.step()\n",
    "\n",
    "    # Output total rewards in episode (max 500)\n",
    "    print(\"Run episode {} with rewards {}\".format(i, sum(rewards)))#, end=\"\\r\")\n",
    "    reward_records.append(sum(rewards))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "73589768",
   "metadata": {},
   "outputs": [],
   "source": [
    "def softmax(logits):\n",
    "    \"\"\"Softmax over all entries of ``logits``, returned as a flat 1-d array.\n",
    "\n",
    "    :param logits: array-like of scores of any shape\n",
    "    :return: 1-d array of probabilities that sum to 1 (empty for empty input)\n",
    "    \"\"\"\n",
    "    logits = np.asarray(logits)\n",
    "    if logits.size == 0:\n",
    "        # np.max has no identity for empty input; an empty score set yields an empty result.\n",
    "        return np.exp(logits).reshape([-1])\n",
    "    # exp() overflows to inf for large scores, which turned the ratio into inf / inf = nan.\n",
    "    # The softmax is invariant to a constant shift, so subtract the maximum first.\n",
    "    exp_logits = np.exp(logits - np.max(logits))\n",
    "    sum_logits = np.sum(exp_logits)\n",
    "    return (exp_logits / sum_logits).reshape([-1])\n",
    "\n",
    "def pick_sample(s):\n",
    "    \"\"\"Draw one action index for state `s` from the actor's current policy.\n",
    "\n",
    "    The state is wrapped as a one-row DataFrame with columns `column_names`,\n",
    "    scored by the global `actor`, converted to probabilities with `softmax`,\n",
    "    and a single index is sampled with torch.multinomial.\n",
    "\n",
    "    Args:\n",
    "        s: One environment observation (array-like with one value per column).\n",
    "\n",
    "    Returns:\n",
    "        The sampled action index.\n",
    "    \"\"\"\n",
    "    with torch.no_grad():\n",
    "        state_frame = pd.DataFrame(np.expand_dims(s, axis=0), columns=column_names)\n",
    "        action_probs = torch.tensor(softmax(actor(state_frame)))\n",
    "        drawn = torch.multinomial(action_probs, num_samples=1)\n",
    "    return drawn.tolist()[0]\n",
    "\n",
    "\n",
    "def _discounted_returns(rewards, discount):\n",
    "    \"\"\"Compute the discounted reward-to-go for each step of one episode.\n",
    "\n",
    "    Args:\n",
    "        rewards: Per-step rewards in time order.\n",
    "        discount: Factor applied to the return of the following step.\n",
    "\n",
    "    Returns:\n",
    "        float64 np.ndarray g with g[t] = rewards[t] + discount * g[t + 1] and\n",
    "        g[-1] = rewards[-1]; empty when `rewards` is empty.\n",
    "    \"\"\"\n",
    "    # Allocate floats explicitly: np.zeros_like on integer rewards would give\n",
    "    # an integer buffer and silently truncate every discounted value.\n",
    "    returns = np.zeros(len(rewards), dtype=float)\n",
    "    running = 0.0\n",
    "    for t in reversed(range(len(rewards))):\n",
    "        running = rewards[t] + running * discount\n",
    "        returns[t] = running\n",
    "    return returns\n",
    "\n",
    "\n",
    "def train(num_episodes=1000, reward_threshold=475.0, window=5, verbose=True):\n",
    "    \"\"\"Run the actor-critic training loop and return the per-episode rewards.\n",
    "\n",
    "    Each episode is rolled out on the global `env` with `pick_sample`. The\n",
    "    critic is then regressed onto the discounted returns, and every per-action\n",
    "    rule model in `actor.model` is either fitted (while it has no rules) or\n",
    "    passed to `update_rules`, using the advantages (returns minus critic\n",
    "    values) of the episode.\n",
    "\n",
    "    Relies on notebook globals: env, gamma, device, critic, critic_optimizer,\n",
    "    actor, column_names, pick_sample and update_rules.\n",
    "\n",
    "    Args:\n",
    "        num_episodes: Maximum number of episodes to play.\n",
    "        reward_threshold: Training stops once the mean total reward of the\n",
    "            last `window` episodes exceeds this value.\n",
    "        window: Number of most recent episodes averaged for the stop check;\n",
    "            should be a positive integer. No stop happens before `window`\n",
    "            episodes have been played.\n",
    "        verbose: When True, print the per-episode log (actions, current rules\n",
    "            of actor.model[0] and actor.model[1], total reward).\n",
    "\n",
    "    Returns:\n",
    "        List with the total reward of every episode played, including the\n",
    "        episode that triggered early stopping.\n",
    "\n",
    "    Side effects:\n",
    "        Steps `critic_optimizer`, modifies the rule models of `actor`, may\n",
    "        overwrite the rules stored in `actor.best_model`, and closes `env`\n",
    "        before returning.\n",
    "    \"\"\"\n",
    "    reward_records = []\n",
    "    best_rewards = 0\n",
    "    for i in range(num_episodes):\n",
    "        # Roll out one episode with the current policy.\n",
    "        states = []\n",
    "        actions = []\n",
    "        rewards = []\n",
    "        s, _ = env.reset(seed=np.random.randint(0, 1000000))\n",
    "        done = False\n",
    "        while not done:\n",
    "            states.append(s.tolist())\n",
    "            a = pick_sample(s)\n",
    "            s, r, term, trunc, _ = env.step(a)\n",
    "            done = term or trunc\n",
    "            actions.append(a)\n",
    "            rewards.append(r)\n",
    "        episode_reward = sum(rewards)\n",
    "\n",
    "        # Critic step: regress the state values onto the discounted returns.\n",
    "        critic_optimizer.zero_grad()\n",
    "        states = torch.tensor(states, dtype=torch.float).to(device)\n",
    "        cum_rewards = torch.tensor(\n",
    "            _discounted_returns(rewards, gamma), dtype=torch.float).to(device)\n",
    "        values = critic(states).squeeze(dim=1)\n",
    "        F.mse_loss(values, cum_rewards, reduction=\"sum\").backward()\n",
    "        critic_optimizer.step()\n",
    "\n",
    "        if verbose:\n",
    "            # The log prints the rules of the first two action models only.\n",
    "            print('============', i, '===========')\n",
    "            print(len(actions), 'actions', actions)\n",
    "            print(\"{}\\n--------------\\n{}\\nRun episode {} with rewards {}\".format(\n",
    "                actor.model[0].rules_, actor.model[1].rules_, i, episode_reward))\n",
    "\n",
    "        # Snapshot the rules that produced the best episode so far. Episode 0\n",
    "        # is skipped, as in the original loop.\n",
    "        if i > 0 and episode_reward >= best_rewards:\n",
    "            best_rewards = episode_reward\n",
    "            for rr in range(actor.action_space):\n",
    "                current = actor.model[rr].rules_\n",
    "                rules = [Rule(q=current[n].q, y=current[n].y) for n in range(len(current))]\n",
    "                actor.best_model[rr].rules_ = AdditiveRuleEnsemble(rules)\n",
    "            if verbose:\n",
    "                print('best')\n",
    "\n",
    "        # Record the episode BEFORE the stop check so that the check sees the\n",
    "        # current episode, never averages an empty list, and the returned\n",
    "        # history contains the final episode.\n",
    "        reward_records.append(episode_reward)\n",
    "        if len(reward_records) >= window and np.average(reward_records[-window:]) > reward_threshold:\n",
    "            break\n",
    "\n",
    "        # Rule-based actor update driven by the advantages.\n",
    "        with torch.no_grad():\n",
    "            values = critic(states).squeeze(dim=1)\n",
    "        advantages = cum_rewards - values\n",
    "        x = pd.DataFrame(states.cpu().detach().numpy(), columns=column_names)\n",
    "        y = pd.Series(np.asarray(actions, dtype=np.int64))\n",
    "        adv = pd.Series(advantages.cpu().detach().numpy())\n",
    "        # NOTE(review): outputs is computed once, so other_values for later\n",
    "        # models does not reflect updates made to earlier models within the\n",
    "        # same episode - confirm this is intended.\n",
    "        outputs = actor(x).T\n",
    "        for j in range(len(actor.model)):\n",
    "            m = actor.model[j]\n",
    "            # Keep the score columns of every action except j.\n",
    "            masks = np.ones_like(outputs, dtype=bool)\n",
    "            masks[:, j] = False\n",
    "            other_values = outputs[masks].reshape(-1, outputs.shape[1] - 1)\n",
    "\n",
    "            if len(m.rules_) == 0:\n",
    "                m.fit(x, y, adv, other_values, j)\n",
    "            else:\n",
    "                update_rules(m, x, y, adv, other_values, j)\n",
    "\n",
    "    if verbose:\n",
    "        print(\"\\nDone\")\n",
    "    env.close()\n",
    "    return reward_records"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "id": "b411aa5d",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 0 ===========\n",
      "67 actions [1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0]\n",
      "\n",
      "--------------\n",
      "\n",
      "Run episode 0 with rewards 67.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/lib/function_base.py:518: RuntimeWarning: Mean of empty slice.\n",
      "  avg = a.mean(axis, **keepdims_kw)\n",
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/core/_methods.py:190: RuntimeWarning: invalid value encountered in double_scalars\n",
      "  ret = ret.dtype.type(ret / rcount)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 1 ===========\n",
      "41 actions [1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0]\n",
      "   +0.5219 if cp>=0.025326931476593054 & cv>=-0.17492903470993043 & pa<=-0.029433537274599072\n",
      "   -6.2703 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +2.1582 if cp<=0.025326931476593054 & cp>=-0.015411880426108835 & cv>=-0.17492903470993043 & pa>=-0.029433537274599072\n",
      "   +3.9683 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   -3.2642 if pav>=1.2673492431640625\n",
      "   +4.5905 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   +1.7283 if cp<=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226\n",
      "   -5.1032 if cp>=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226 & pa>=-0.029433537274599072 & pa>=0.009568695165216926\n",
      "   +2.8643 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -1.8633 if cp<=0.052692229300737393 & cv<=0.4088188290596008 & pa<=0.009568695165216926 & pav<=-0.29077954292297364\n",
      "   -2.5238 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +3.7224 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "--------------\n",
      "   -0.5219 if cp>=0.025326931476593054 & cv>=-0.17492903470993043 & pa<=-0.029433537274599072\n",
      "   +6.2705 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -2.1582 if cp<=0.025326931476593054 & cp>=-0.015411880426108835 & cv>=-0.17492903470993043 & pa>=-0.029433537274599072\n",
      "   -3.9686 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   +3.2644 if pav>=1.2673492431640625\n",
      "   -4.5906 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   -1.7284 if cp<=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226\n",
      "   +5.1030 if cp>=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226 & pa>=-0.029433537274599072 & pa>=0.009568695165216926\n",
      "   -2.8645 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +1.8632 if cp<=0.052692229300737393 & cv<=0.4088188290596008 & pa<=0.009568695165216926 & pav<=-0.29077954292297364\n",
      "   +2.5239 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   -3.7224 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "Run episode 1 with rewards 41.0\n",
      "best\n",
      "stop here\n",
      "============ 2 ===========\n",
      "14 actions [0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0]\n",
      "   -2.3368 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.3052 if cp<=0.025326931476593054 & cp>=-0.015411880426108835 & cv>=-0.17492903470993043 & pa>=-0.029433537274599072\n",
      "   +1.0344 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   +0.0000 if pav>=1.2673492431640625\n",
      "   +3.4938 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   +2.1702 if cp<=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226\n",
      "   +2.4179 if cp>=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226 & pa>=-0.029433537274599072 & pa>=0.009568695165216926\n",
      "   -0.9283 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cv<=0.4088188290596008 & pa<=0.009568695165216926 & pav<=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0000 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   +4.2344 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "--------------\n",
      "   +2.3371 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.3044 if cp<=0.025326931476593054 & cp>=-0.015411880426108835 & cv>=-0.17492903470993043 & pa>=-0.029433537274599072\n",
      "   -1.0355 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   +0.0006 if pav>=1.2673492431640625\n",
      "   -3.4937 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   -2.1703 if cp<=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226\n",
      "   -2.4181 if cp>=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226 & pa>=-0.029433537274599072 & pa>=0.009568695165216926\n",
      "   +0.9273 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0003 if cp<=0.052692229300737393 & cv<=0.4088188290596008 & pa<=0.009568695165216926 & pav<=-0.29077954292297364\n",
      "   +0.0005 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0007 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   -4.2345 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "Run episode 2 with rewards 14.0\n",
      "============ 3 ===========\n",
      "12 actions [0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1]\n",
      "   -1.9831 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0000 if cp<=0.025326931476593054 & cp>=-0.015411880426108835 & cv>=-0.17492903470993043 & pa>=-0.029433537274599072\n",
      "   -0.0000 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   -0.0000 if pav>=1.2673492431640625\n",
      "   -0.0000 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   -0.0000 if cp<=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226\n",
      "   -0.0000 if cp>=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226 & pa>=-0.029433537274599072 & pa>=0.009568695165216926\n",
      "   +2.3786 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -3.7161 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +1.4731 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   -0.0000 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "   -3.2237 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "--------------\n",
      "   +1.9832 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0000 if cp<=0.025326931476593054 & cp>=-0.015411880426108835 & cv>=-0.17492903470993043 & pa>=-0.029433537274599072\n",
      "   -0.0000 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   -0.0000 if pav>=1.2673492431640625\n",
      "   -0.0000 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   -0.0000 if cp<=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226\n",
      "   -0.0000 if cp>=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226 & pa>=-0.029433537274599072 & pa>=0.009568695165216926\n",
      "   -2.3795 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +3.7163 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   -1.4724 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   -0.0000 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "   +3.2238 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "Run episode 3 with rewards 12.0\n",
      "============ 4 ===========\n",
      "11 actions [0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0]\n",
      "   +1.4442 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0000 if cp<=0.025326931476593054 & cp>=-0.015411880426108835 & cv>=-0.17492903470993043 & pa>=-0.029433537274599072\n",
      "   -0.0000 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   -0.0000 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   -0.0000 if cp<=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226\n",
      "   -0.0000 if cp>=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226 & pa>=-0.029433537274599072 & pa>=0.009568695165216926\n",
      "   +1.4442 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   -0.0000 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   -0.0000 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "   -0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   -3.8166 if cv<=-0.6254599928855896\n",
      "--------------\n",
      "   -1.4445 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0000 if cp<=0.025326931476593054 & cp>=-0.015411880426108835 & cv>=-0.17492903470993043 & pa>=-0.029433537274599072\n",
      "   -0.0000 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   -0.0000 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   -0.0000 if cp<=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226\n",
      "   -0.0000 if cp>=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226 & pa>=-0.029433537274599072 & pa>=0.009568695165216926\n",
      "   -1.4445 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   -0.0000 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   -0.0000 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "   -0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   +3.8166 if cv<=-0.6254599928855896\n",
      "Run episode 4 with rewards 11.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 5 ===========\n",
      "10 actions [0, 0, 0, 1, 0, 0, 1, 0, 1, 0]\n",
      "   +0.5535 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.0000 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   +0.0000 if cp<=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226\n",
      "   +0.0000 if cp>=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226 & pa>=-0.029433537274599072 & pa>=0.009568695165216926\n",
      "   +0.5535 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0000 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   +0.0000 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "   +0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   -2.4678 if cv<=-0.6254599928855896\n",
      "   -0.1282 if cp>=-0.09483367949724197\n",
      "--------------\n",
      "   -0.5538 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.0000 if cp>=-0.015411880426108835 & cv>=0.019291881844401358 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   +0.0000 if cp<=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226\n",
      "   +0.0000 if cp>=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226 & pa>=-0.029433537274599072 & pa>=0.009568695165216926\n",
      "   -0.5538 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0000 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   +0.0000 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "   +0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   +2.4677 if cv<=-0.6254599928855896\n",
      "   +0.1280 if cp>=-0.09483367949724197\n",
      "Run episode 5 with rewards 10.0\n",
      "============ 6 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0]\n",
      "   -0.0780 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.0000 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   +0.0000 if cp<=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226\n",
      "   +0.0000 if cp>=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226 & pa>=-0.029433537274599072 & pa>=0.009568695165216926\n",
      "   -0.0780 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0000 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   +0.0000 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "   +0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   -0.7939 if cv<=-0.6254599928855896\n",
      "   -0.4827 if cp>=-0.09483367949724197\n",
      "   +3.1037 if cv>=-0.5116368293762207\n",
      "--------------\n",
      "   +0.0778 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.0000 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   +0.0000 if cp<=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226\n",
      "   +0.0000 if cp>=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226 & pa>=-0.029433537274599072 & pa>=0.009568695165216926\n",
      "   +0.0778 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0000 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   +0.0000 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "   +0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   +0.7938 if cv<=-0.6254599928855896\n",
      "   +0.4825 if cp>=-0.09483367949724197\n",
      "   -3.1037 if cv>=-0.5116368293762207\n",
      "Run episode 6 with rewards 12.0\n",
      "============ 7 ===========\n",
      "15 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0]\n",
      "   +0.4445 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.0000 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   +0.0000 if cp>=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226 & pa>=-0.029433537274599072 & pa>=0.009568695165216926\n",
      "   +0.4445 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0000 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   +0.0000 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "   +0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   -0.0329 if cv<=-0.6254599928855896\n",
      "   -2.3499 if cp>=-0.09483367949724197\n",
      "   +2.8805 if cv>=-0.5116368293762207\n",
      "   -1.9180 if cv<=-0.6210723280906677\n",
      "--------------\n",
      "   -0.4447 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.0000 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   +0.0000 if cp>=-0.0011798852123320073 & cv<=0.4088188290596008 & cv>=0.213888081908226 & pa>=-0.029433537274599072 & pa>=0.009568695165216926\n",
      "   -0.4447 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0000 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   +0.0000 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "   +0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   +0.0329 if cv<=-0.6254599928855896\n",
      "   +2.3498 if cp>=-0.09483367949724197\n",
      "   -2.8805 if cv>=-0.5116368293762207\n",
      "   +1.9180 if cv<=-0.6210723280906677\n",
      "Run episode 7 with rewards 15.0\n",
      "============ 8 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 1, 0, 0, 1, 1]\n",
      "   +0.1924 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.0000 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   +0.1924 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.4883 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0000 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   +0.0000 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "   +0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   -0.3803 if cv<=-0.6254599928855896\n",
      "   +0.1924 if cp>=-0.09483367949724197\n",
      "   +2.9881 if cv>=-0.5116368293762207\n",
      "   -0.3803 if cv<=-0.6210723280906677\n",
      "   -1.8459 if cp<=0.03204101100564004 & cp>=0.003031891118735101\n",
      "--------------\n",
      "   -0.1926 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.0000 if cp<=0.025326931476593054 & cp>=-0.0011798852123320073 & cv<=0.019291881844401358 & cv>=-0.17492903470993043 & pa>=-0.06770601868629456\n",
      "   -0.1926 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.4883 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0000 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   +0.0000 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "   +0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   +0.3802 if cv<=-0.6254599928855896\n",
      "   -0.1926 if cp>=-0.09483367949724197\n",
      "   -2.9882 if cv>=-0.5116368293762207\n",
      "   +0.3802 if cv<=-0.6210723280906677\n",
      "   +1.8459 if cp<=0.03204101100564004 & cp>=0.003031891118735101\n",
      "Run episode 8 with rewards 10.0\n",
      "============ 9 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0]\n",
      "   +0.7108 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.5891 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0000 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   +0.0000 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "   +0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   -0.3986 if cv<=-0.6254599928855896\n",
      "   +1.2276 if cp>=-0.09483367949724197\n",
      "   +0.2155 if cv>=-0.5116368293762207\n",
      "   -0.3986 if cv<=-0.6210723280906677\n",
      "   +0.0000 if cp<=0.03204101100564004 & cp>=0.003031891118735101\n",
      "   -2.8927 if cp>=-0.04866652190685272 & cv<=-0.8220348358154297\n",
      "--------------\n",
      "   -0.7108 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.5894 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0000 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   +0.0000 if cv<=0.03999288007616997 & cv>=0.03999288007616997\n",
      "   +0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   +0.3986 if cv<=-0.6254599928855896\n",
      "   -1.2278 if cp>=-0.09483367949724197\n",
      "   -0.2154 if cv>=-0.5116368293762207\n",
      "   +0.3986 if cv<=-0.6210723280906677\n",
      "   +0.0000 if cp<=0.03204101100564004 & cp>=0.003031891118735101\n",
      "   +2.8927 if cp>=-0.04866652190685272 & cv<=-0.8220348358154297\n",
      "Run episode 9 with rewards 11.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 10 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   -0.2165 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.0781 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0000 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   +0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   -0.3887 if cv<=-0.6254599928855896\n",
      "   +2.5388 if cp>=-0.09483367949724197\n",
      "   +0.6261 if cv>=-0.5116368293762207\n",
      "   -0.3887 if cv<=-0.6210723280906677\n",
      "   +0.0000 if cp<=0.03204101100564004 & cp>=0.003031891118735101\n",
      "   +0.0000 if cp>=-0.04866652190685272 & cv<=-0.8220348358154297\n",
      "   +1.9770 if cp<=-0.13380591571331024\n",
      "--------------\n",
      "   +0.2164 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0782 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0000 if cp>=0.025326931476593054 & cv>=0.4088188290596008\n",
      "   +0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   +0.3886 if cv<=-0.6254599928855896\n",
      "   -2.5390 if cp>=-0.09483367949724197\n",
      "   -0.6261 if cv>=-0.5116368293762207\n",
      "   +0.3886 if cv<=-0.6210723280906677\n",
      "   +0.0000 if cp<=0.03204101100564004 & cp>=0.003031891118735101\n",
      "   +0.0000 if cp>=-0.04866652190685272 & cv<=-0.8220348358154297\n",
      "   -1.9770 if cp<=-0.13380591571331024\n",
      "Run episode 10 with rewards 9.0\n",
      "============ 11 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.6893 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.6893 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   +0.3917 if cv<=-0.6254599928855896\n",
      "   +0.7962 if cp>=-0.09483367949724197\n",
      "   +0.2976 if cv>=-0.5116368293762207\n",
      "   +0.3917 if cv<=-0.6210723280906677\n",
      "   +0.0000 if cp<=0.03204101100564004 & cp>=0.003031891118735101\n",
      "   +0.2061 if cp>=-0.04866652190685272 & cv<=-0.8220348358154297\n",
      "   +0.0000 if cp<=-0.13380591571331024\n",
      "   -0.0667 if cp<=-0.07414135038852691\n",
      "--------------\n",
      "   -0.6894 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.6894 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.0000 if cv<=0.5419640362262728 & cv>=0.11055615544319154\n",
      "   -0.3918 if cv<=-0.6254599928855896\n",
      "   -0.7962 if cp>=-0.09483367949724197\n",
      "   -0.2977 if cv>=-0.5116368293762207\n",
      "   -0.3918 if cv<=-0.6210723280906677\n",
      "   +0.0000 if cp<=0.03204101100564004 & cp>=0.003031891118735101\n",
      "   -0.2062 if cp>=-0.04866652190685272 & cv<=-0.8220348358154297\n",
      "   +0.0000 if cp<=-0.13380591571331024\n",
      "   +0.0667 if cp<=-0.07414135038852691\n",
      "Run episode 11 with rewards 8.0\n",
      "============ 12 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7443 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.7443 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   +0.1569 if cv<=-0.6254599928855896\n",
      "   +0.6669 if cp>=-0.09483367949724197\n",
      "   +0.3993 if cv>=-0.5116368293762207\n",
      "   +0.1569 if cv<=-0.6210723280906677\n",
      "   +0.0000 if cp<=0.03204101100564004 & cp>=0.003031891118735101\n",
      "   +0.0000 if cp>=-0.04866652190685272 & cv<=-0.8220348358154297\n",
      "   +0.0000 if cp<=-0.13380591571331024\n",
      "   +0.1088 if cp<=-0.07414135038852691\n",
      "   +0.1231 if cp>=-0.046753622591495514\n",
      "--------------\n",
      "   -0.7444 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.7444 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cp<=0.052692229300737393 & cp>=0.025326931476593054 & cv<=-0.17492903470993043\n",
      "   -0.1569 if cv<=-0.6254599928855896\n",
      "   -0.6670 if cp>=-0.09483367949724197\n",
      "   -0.3993 if cv>=-0.5116368293762207\n",
      "   -0.1569 if cv<=-0.6210723280906677\n",
      "   +0.0000 if cp<=0.03204101100564004 & cp>=0.003031891118735101\n",
      "   +0.0000 if cp>=-0.04866652190685272 & cv<=-0.8220348358154297\n",
      "   +0.0000 if cp<=-0.13380591571331024\n",
      "   -0.1088 if cp<=-0.07414135038852691\n",
      "   -0.1231 if cp>=-0.046753622591495514\n",
      "Run episode 12 with rewards 10.0\n",
      "============ 13 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8642 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.6045 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.3219 if cv<=-0.6254599928855896\n",
      "   +0.7081 if cp>=-0.09483367949724197\n",
      "   +0.4085 if cv>=-0.5116368293762207\n",
      "   +0.3219 if cv<=-0.6210723280906677\n",
      "   +0.0000 if cp<=0.03204101100564004 & cp>=0.003031891118735101\n",
      "   +0.0000 if cp>=-0.04866652190685272 & cv<=-0.8220348358154297\n",
      "   -0.0016 if cp<=-0.13380591571331024\n",
      "   +0.1561 if cp<=-0.07414135038852691\n",
      "   +0.5854 if cp>=-0.046753622591495514\n",
      "   +0.2597 if cv>=0.023790350183844566\n",
      "--------------\n",
      "   -0.8642 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.6045 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.3219 if cv<=-0.6254599928855896\n",
      "   -0.7081 if cp>=-0.09483367949724197\n",
      "   -0.4085 if cv>=-0.5116368293762207\n",
      "   -0.3219 if cv<=-0.6210723280906677\n",
      "   +0.0000 if cp<=0.03204101100564004 & cp>=0.003031891118735101\n",
      "   +0.0000 if cp>=-0.04866652190685272 & cv<=-0.8220348358154297\n",
      "   +0.0016 if cp<=-0.13380591571331024\n",
      "   -0.1561 if cp<=-0.07414135038852691\n",
      "   -0.5854 if cp>=-0.046753622591495514\n",
      "   -0.2597 if cv>=0.023790350183844566\n",
      "Run episode 13 with rewards 9.0\n",
      "============ 14 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 1, 0]\n",
      "   +0.6019 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.6019 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.2124 if cv<=-0.6254599928855896\n",
      "   +0.5350 if cp>=-0.09483367949724197\n",
      "   +0.2626 if cv>=-0.5116368293762207\n",
      "   +0.2124 if cv<=-0.6210723280906677\n",
      "   +0.0000 if cp>=-0.04866652190685272 & cv<=-0.8220348358154297\n",
      "   +0.0000 if cp<=-0.13380591571331024\n",
      "   +0.1045 if cp<=-0.07414135038852691\n",
      "   +0.4247 if cp>=-0.046753622591495514\n",
      "   +0.0000 if cv>=0.023790350183844566\n",
      "   +0.0831 if cp>=-0.018449416384100914\n",
      "--------------\n",
      "   -0.6019 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.6019 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.2124 if cv<=-0.6254599928855896\n",
      "   -0.5351 if cp>=-0.09483367949724197\n",
      "   -0.2626 if cv>=-0.5116368293762207\n",
      "   -0.2124 if cv<=-0.6210723280906677\n",
      "   +0.0000 if cp>=-0.04866652190685272 & cv<=-0.8220348358154297\n",
      "   +0.0000 if cp<=-0.13380591571331024\n",
      "   -0.1045 if cp<=-0.07414135038852691\n",
      "   -0.4247 if cp>=-0.046753622591495514\n",
      "   +0.0000 if cv>=0.023790350183844566\n",
      "   -0.0831 if cp>=-0.018449416384100914\n",
      "Run episode 14 with rewards 9.0\n",
      "============ 15 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.2286 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.2286 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.2882 if cv<=-0.6254599928855896\n",
      "   +1.4090 if cp>=-0.09483367949724197\n",
      "   +0.3572 if cv>=-0.5116368293762207\n",
      "   -0.2882 if cv<=-0.6210723280906677\n",
      "   +0.0000 if cp<=-0.13380591571331024\n",
      "   -0.7654 if cp<=-0.07414135038852691\n",
      "   +0.6660 if cp>=-0.046753622591495514\n",
      "   +0.0000 if cv>=0.023790350183844566\n",
      "   +0.0000 if cp>=-0.018449416384100914\n",
      "   -1.3637 if pav>=2.1502227783203125\n",
      "--------------\n",
      "   -0.2286 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.2286 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.2882 if cv<=-0.6254599928855896\n",
      "   -1.4090 if cp>=-0.09483367949724197\n",
      "   -0.3572 if cv>=-0.5116368293762207\n",
      "   +0.2882 if cv<=-0.6210723280906677\n",
      "   +0.0000 if cp<=-0.13380591571331024\n",
      "   +0.7654 if cp<=-0.07414135038852691\n",
      "   -0.6660 if cp>=-0.046753622591495514\n",
      "   +0.0000 if cv>=0.023790350183844566\n",
      "   +0.0000 if cp>=-0.018449416384100914\n",
      "   +1.3637 if pav>=2.1502227783203125\n",
      "Run episode 15 with rewards 8.0\n",
      "============ 16 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.4068 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.4068 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0299 if cv<=-0.6254599928855896\n",
      "   +0.4068 if cp>=-0.09483367949724197\n",
      "   +0.2626 if cv>=-0.5116368293762207\n",
      "   +0.0299 if cv<=-0.6210723280906677\n",
      "   -0.0000 if cp<=-0.07414135038852691\n",
      "   +0.4068 if cp>=-0.046753622591495514\n",
      "   -0.0000 if cv>=0.023790350183844566\n",
      "   +0.6705 if cp>=-0.018449416384100914\n",
      "   -0.2637 if pav>=2.1502227783203125\n",
      "   +0.0951 if cp>=0.043813955038785934\n",
      "--------------\n",
      "   -0.4068 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.4068 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.0299 if cv<=-0.6254599928855896\n",
      "   -0.4068 if cp>=-0.09483367949724197\n",
      "   -0.2626 if cv>=-0.5116368293762207\n",
      "   -0.0299 if cv<=-0.6210723280906677\n",
      "   +0.0000 if cp<=-0.07414135038852691\n",
      "   -0.4068 if cp>=-0.046753622591495514\n",
      "   +0.0000 if cv>=0.023790350183844566\n",
      "   -0.6705 if cp>=-0.018449416384100914\n",
      "   +0.2637 if pav>=2.1502227783203125\n",
      "   -0.0951 if cp>=0.043813955038785934\n",
      "Run episode 16 with rewards 8.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 17 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.8330 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.8330 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.1749 if cv<=-0.6254599928855896\n",
      "   +0.9234 if cp>=-0.09483367949724197\n",
      "   +0.3448 if cv>=-0.5116368293762207\n",
      "   +0.1749 if cv<=-0.6210723280906677\n",
      "   +0.0159 if cp<=-0.07414135038852691\n",
      "   +0.3448 if cp>=-0.046753622591495514\n",
      "   +0.0000 if cp>=-0.018449416384100914\n",
      "   -0.2928 if pav>=2.1502227783203125\n",
      "   +0.0000 if cp>=0.043813955038785934\n",
      "   +0.1226 if cp>=-0.03710911050438881\n",
      "--------------\n",
      "   -0.8330 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.8330 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.1749 if cv<=-0.6254599928855896\n",
      "   -0.9234 if cp>=-0.09483367949724197\n",
      "   -0.3448 if cv>=-0.5116368293762207\n",
      "   -0.1749 if cv<=-0.6210723280906677\n",
      "   -0.0159 if cp<=-0.07414135038852691\n",
      "   -0.3448 if cp>=-0.046753622591495514\n",
      "   +0.0000 if cp>=-0.018449416384100914\n",
      "   +0.2928 if pav>=2.1502227783203125\n",
      "   +0.0000 if cp>=0.043813955038785934\n",
      "   -0.1225 if cp>=-0.03710911050438881\n",
      "Run episode 17 with rewards 10.0\n",
      "============ 18 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.2674 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.5464 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.1640 if cv<=-0.6254599928855896\n",
      "   +0.5563 if cp>=-0.09483367949724197\n",
      "   +0.3179 if cv>=-0.5116368293762207\n",
      "   +0.1640 if cv<=-0.6210723280906677\n",
      "   +0.0303 if cp<=-0.07414135038852691\n",
      "   +0.4552 if cp>=-0.046753622591495514\n",
      "   +0.4318 if cp>=-0.018449416384100914\n",
      "   +0.0303 if pav>=2.1502227783203125\n",
      "   +0.4552 if cp>=-0.03710911050438881\n",
      "   +0.0843 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "--------------\n",
      "   -0.2674 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.5464 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.1640 if cv<=-0.6254599928855896\n",
      "   -0.5563 if cp>=-0.09483367949724197\n",
      "   -0.3179 if cv>=-0.5116368293762207\n",
      "   -0.1640 if cv<=-0.6210723280906677\n",
      "   -0.0303 if cp<=-0.07414135038852691\n",
      "   -0.4552 if cp>=-0.046753622591495514\n",
      "   -0.4318 if cp>=-0.018449416384100914\n",
      "   -0.0303 if pav>=2.1502227783203125\n",
      "   -0.4552 if cp>=-0.03710911050438881\n",
      "   -0.0843 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "Run episode 18 with rewards 10.0\n",
      "============ 19 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.5597 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.3944 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.2201 if cv<=-0.6254599928855896\n",
      "   +0.5728 if cp>=-0.09483367949724197\n",
      "   +0.2692 if cv>=-0.5116368293762207\n",
      "   +0.2201 if cv<=-0.6210723280906677\n",
      "   +0.4958 if cp>=-0.046753622591495514\n",
      "   +0.3949 if cp>=-0.018449416384100914\n",
      "   +0.0638 if pav>=2.1502227783203125\n",
      "   +0.4370 if cp>=-0.03710911050438881\n",
      "   +0.0588 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "   +0.1161 if cp<=0.03170740753412247 & cp>=0.017684276401996615\n",
      "--------------\n",
      "   -0.4919 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.3526 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.1892 if cv<=-0.6254599928855896\n",
      "   -0.5022 if cp>=-0.09483367949724197\n",
      "   -0.2355 if cv>=-0.5116368293762207\n",
      "   -0.1892 if cv<=-0.6210723280906677\n",
      "   +0.0104 if cp<=-0.07414135038852691\n",
      "   -0.4381 if cp>=-0.046753622591495514\n",
      "   -0.3526 if cp>=-0.018449416384100914\n",
      "   -0.3891 if cp>=-0.03710911050438881\n",
      "   -0.0491 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "   -0.4919 if \n",
      "Run episode 19 with rewards 8.0\n",
      "============ 20 ===========\n",
      "10 actions [0, 0, 1, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.2153 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.0944 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.1064 if cv<=-0.6254599928855896\n",
      "   +0.2153 if cp>=-0.09483367949724197\n",
      "   +0.2454 if cv>=-0.5116368293762207\n",
      "   -0.1064 if cv<=-0.6210723280906677\n",
      "   +0.4846 if cp>=-0.046753622591495514\n",
      "   +0.4349 if cp>=-0.018449416384100914\n",
      "   -0.2694 if pav>=2.1502227783203125\n",
      "   +0.4846 if cp>=-0.03710911050438881\n",
      "   +0.3216 if cp<=0.03170740753412247 & cp>=0.017684276401996615\n",
      "   -0.0301 if cp<=0.02058889977633954\n",
      "--------------\n",
      "   -0.2268 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0946 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.1175 if cv<=-0.6254599928855896\n",
      "   -0.2268 if cp>=-0.09483367949724197\n",
      "   -0.2627 if cv>=-0.5116368293762207\n",
      "   +0.1175 if cv<=-0.6210723280906677\n",
      "   -0.4928 if cp>=-0.046753622591495514\n",
      "   -0.4393 if cp>=-0.018449416384100914\n",
      "   -0.4928 if cp>=-0.03710911050438881\n",
      "   +0.2126 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "   -0.2268 if \n",
      "   +0.2660 if pa>=0.16887736320495605\n",
      "Run episode 20 with rewards 10.0\n",
      "============ 21 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0]\n",
      "   +0.7681 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.7681 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.4627 if cv<=-0.6254599928855896\n",
      "   +0.7309 if cp>=-0.09483367949724197\n",
      "   -0.3502 if cv>=-0.5116368293762207\n",
      "   +0.4627 if cv<=-0.6210723280906677\n",
      "   -2.7193 if cp>=-0.046753622591495514\n",
      "   +0.0000 if cp>=-0.018449416384100914\n",
      "   -0.1849 if pav>=2.1502227783203125\n",
      "   +0.0000 if cp>=-0.03710911050438881\n",
      "   +0.0000 if cp<=0.03170740753412247 & cp>=0.017684276401996615\n",
      "   +2.0943 if cp>=-0.03826036676764488\n",
      "--------------\n",
      "   -1.5645 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0504 if cv<=-0.6254599928855896\n",
      "   -1.6210 if cp>=-0.09483367949724197\n",
      "   +0.0199 if cv>=-0.5116368293762207\n",
      "   -0.0504 if cv<=-0.6210723280906677\n",
      "   +3.4906 if cp>=-0.046753622591495514\n",
      "   +0.0000 if cp>=-0.018449416384100914\n",
      "   +0.0000 if cp>=-0.03710911050438881\n",
      "   +0.0199 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "   -1.5645 if \n",
      "   +0.1918 if pa>=0.16887736320495605\n",
      "   +3.1205 if cp<=-0.04215016812086105 & cp>=-0.06877081394195557\n",
      "Run episode 21 with rewards 11.0\n",
      "============ 22 ===========\n",
      "21 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0]\n",
      "   +0.4766 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.4766 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.2308 if cv<=-0.6254599928855896\n",
      "   +0.2455 if cp>=-0.09483367949724197\n",
      "   +0.4982 if cv>=-0.5116368293762207\n",
      "   -0.2308 if cv<=-0.6210723280906677\n",
      "   -0.9006 if cp>=-0.046753622591495514\n",
      "   +0.7073 if cp>=-0.018449416384100914\n",
      "   +0.0000 if pav>=2.1502227783203125\n",
      "   +1.2309 if cp>=-0.03710911050438881\n",
      "   +1.2309 if cp>=-0.03826036676764488\n",
      "   +0.1462 if cp<=-0.09918037056922913 & cp>=-0.09918037056922913 & cv<=-0.9977253079414368\n",
      "--------------\n",
      "   -0.5720 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.4065 if cv<=-0.6254599928855896\n",
      "   -0.3094 if cp>=-0.09483367949724197\n",
      "   -0.7122 if cv>=-0.5116368293762207\n",
      "   +0.4065 if cv<=-0.6210723280906677\n",
      "   +0.3210 if cp>=-0.046753622591495514\n",
      "   -1.7084 if cp>=-0.03710911050438881\n",
      "   +1.2995 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "   -0.5720 if \n",
      "   -0.0000 if pa>=0.16887736320495605\n",
      "   +1.4926 if cp<=-0.04215016812086105 & cp>=-0.06877081394195557\n",
      "   -0.8930 if cp<=-0.06314399093389511\n",
      "Run episode 22 with rewards 21.0\n",
      "============ 23 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.7956 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.7489 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.1088 if cv<=-0.6254599928855896\n",
      "   +0.0500 if cp>=-0.09483367949724197\n",
      "   -1.0427 if cv>=-0.5116368293762207\n",
      "   -0.2142 if cv<=-0.6210723280906677\n",
      "   -1.4400 if cp>=-0.046753622591495514\n",
      "   +0.2238 if cp>=-0.018449416384100914\n",
      "   +2.5977 if cp>=-0.03710911050438881\n",
      "   +2.5977 if cp>=-0.03826036676764488\n",
      "   +0.0000 if cp<=-0.09918037056922913 & cp>=-0.09918037056922913 & cv<=-0.9977253079414368\n",
      "   +0.3617 if cp<=-0.043721359223127365 & cp>=-0.12945516407489777\n",
      "--------------\n",
      "   -0.7752 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.2464 if cv<=-0.6254599928855896\n",
      "   -0.2208 if cp>=-0.09483367949724197\n",
      "   +0.3229 if cv>=-0.5116368293762207\n",
      "   +0.1023 if cv<=-0.6210723280906677\n",
      "   +0.1920 if cp>=-0.046753622591495514\n",
      "   -2.6013 if cp>=-0.03710911050438881\n",
      "   +1.4511 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "   +0.4252 if \n",
      "   +3.8017 if cp<=-0.04215016812086105 & cp>=-0.06877081394195557\n",
      "   -0.7752 if cp<=-0.06314399093389511\n",
      "   -1.7097 if cp>=-0.12945516407489777\n",
      "Run episode 23 with rewards 11.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 24 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.9006 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.9754 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.8955 if cv<=-0.6254599928855896\n",
      "   +1.0938 if cp>=-0.09483367949724197\n",
      "   +0.1897 if cv>=-0.5116368293762207\n",
      "   +0.8955 if cv<=-0.6210723280906677\n",
      "   +0.2002 if cp>=-0.046753622591495514\n",
      "   +0.1966 if cp>=-0.018449416384100914\n",
      "   +0.2002 if cp>=-0.03710911050438881\n",
      "   +0.2002 if cp>=-0.03826036676764488\n",
      "   +0.8963 if cp<=-0.043721359223127365 & cp>=-0.12945516407489777\n",
      "   -0.0020 if cp<=-0.07953928411006927\n",
      "--------------\n",
      "   -0.3403 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.3337 if cv<=-0.6254599928855896\n",
      "   -0.6330 if cp>=-0.09483367949724197\n",
      "   -0.3434 if cv>=-0.5116368293762207\n",
      "   -0.3641 if cp>=-0.046753622591495514\n",
      "   -0.3641 if cp>=-0.03710911050438881\n",
      "   -0.1574 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "   -0.6837 if \n",
      "   -0.1534 if cp<=-0.04215016812086105 & cp>=-0.06877081394195557\n",
      "   -0.1661 if cp<=-0.06314399093389511\n",
      "   -0.7369 if cp>=-0.12945516407489777\n",
      "   +0.0532 if pa>=0.20813199877738953\n",
      "Run episode 24 with rewards 10.0\n",
      "============ 25 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.3050 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.4497 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.2482 if cv<=-0.6254599928855896\n",
      "   +0.5220 if cp>=-0.09483367949724197\n",
      "   +0.2787 if cv>=-0.5116368293762207\n",
      "   +0.2482 if cv<=-0.6210723280906677\n",
      "   +0.4010 if cp>=-0.046753622591495514\n",
      "   +0.3355 if cp>=-0.018449416384100914\n",
      "   +0.3602 if cp>=-0.03710911050438881\n",
      "   +0.4010 if cp>=-0.03826036676764488\n",
      "   +0.1997 if cp<=-0.043721359223127365 & cp>=-0.12945516407489777\n",
      "   -0.0170 if pa>=0.16569870710372925\n",
      "--------------\n",
      "   -0.0767 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0377 if cv<=-0.6254599928855896\n",
      "   -0.4683 if cp>=-0.09483367949724197\n",
      "   -0.3993 if cv>=-0.5116368293762207\n",
      "   -0.4557 if cp>=-0.046753622591495514\n",
      "   -0.4451 if cp>=-0.03710911050438881\n",
      "   -0.0250 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "   -0.4759 if \n",
      "   -0.0075 if cp<=-0.04215016812086105 & cp>=-0.06877081394195557\n",
      "   -0.0128 if cp<=-0.06314399093389511\n",
      "   -0.4799 if cp>=-0.12945516407489777\n",
      "   -0.1058 if cp<=-0.003624896984547376 & cp>=-0.018125452101230618\n",
      "Run episode 25 with rewards 9.0\n",
      "============ 26 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.4997 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.3965 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.1999 if cv<=-0.6254599928855896\n",
      "   +0.4997 if cp>=-0.09483367949724197\n",
      "   +0.2178 if cv>=-0.5116368293762207\n",
      "   +0.1999 if cv<=-0.6210723280906677\n",
      "   +0.3979 if cp>=-0.046753622591495514\n",
      "   +0.3695 if cp>=-0.018449416384100914\n",
      "   +0.3979 if cp>=-0.03710911050438881\n",
      "   +0.3979 if cp>=-0.03826036676764488\n",
      "   +0.1017 if cp<=-0.043721359223127365 & cp>=-0.12945516407489777\n",
      "   +0.0556 if cp<=-0.012256073206663129 & cp>=-0.0436529278755188\n",
      "--------------\n",
      "   -0.4557 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.1398 if cv<=-0.6254599928855896\n",
      "   -0.4557 if cp>=-0.09483367949724197\n",
      "   -0.2363 if cv>=-0.5116368293762207\n",
      "   -0.3964 if cp>=-0.046753622591495514\n",
      "   -0.3964 if cp>=-0.03710911050438881\n",
      "   -0.0833 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "   -0.4557 if \n",
      "   +0.0022 if cp<=-0.06314399093389511\n",
      "   -0.4557 if cp>=-0.12945516407489777\n",
      "   -0.0248 if cp<=-0.003624896984547376 & cp>=-0.018125452101230618\n",
      "   -0.0623 if cp>=0.022067468613386154\n",
      "Run episode 26 with rewards 10.0\n",
      "============ 27 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.2459 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.5110 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.2003 if cv<=-0.6254599928855896\n",
      "   +0.5323 if cp>=-0.09483367949724197\n",
      "   +0.2651 if cv>=-0.5116368293762207\n",
      "   +0.2459 if cv<=-0.6210723280906677\n",
      "   +0.3801 if cp>=-0.046753622591495514\n",
      "   +0.3588 if cp>=-0.018449416384100914\n",
      "   +0.3801 if cp>=-0.03710911050438881\n",
      "   +0.3801 if cp>=-0.03826036676764488\n",
      "   +0.1309 if cp<=-0.043721359223127365 & cp>=-0.12945516407489777\n",
      "   +0.4640 if cp>=-0.057790301740169525\n",
      "--------------\n",
      "   -0.2462 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.1981 if cv<=-0.6254599928855896\n",
      "   -0.5111 if cp>=-0.09483367949724197\n",
      "   -0.2433 if cv>=-0.5116368293762207\n",
      "   -0.3595 if cp>=-0.046753622591495514\n",
      "   -0.3595 if cp>=-0.03710911050438881\n",
      "   -0.1036 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "   -0.4895 if \n",
      "   -0.4895 if cp>=-0.12945516407489777\n",
      "   -0.0211 if cp<=-0.003624896984547376 & cp>=-0.018125452101230618\n",
      "   -0.2433 if cp>=0.022067468613386154\n",
      "   -0.4432 if cp>=-0.057790301740169525\n",
      "Run episode 27 with rewards 10.0\n",
      "============ 28 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7545 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.7545 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.5470 if cv<=-0.6254599928855896\n",
      "   +0.3045 if cp>=-0.09483367949724197\n",
      "   +0.1511 if cv>=-0.5116368293762207\n",
      "   +0.5470 if cv<=-0.6210723280906677\n",
      "   +0.2517 if cp>=-0.046753622591495514\n",
      "   +0.2203 if cp>=-0.018449416384100914\n",
      "   +0.2319 if cp>=-0.03710911050438881\n",
      "   +0.2319 if cp>=-0.03826036676764488\n",
      "   +0.2517 if cp>=-0.057790301740169525\n",
      "   +0.3940 if pa>=0.18111178278923035\n",
      "--------------\n",
      "   -0.7062 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.5568 if cv<=-0.6254599928855896\n",
      "   -0.2576 if cp>=-0.09483367949724197\n",
      "   -0.1107 if cv>=-0.5116368293762207\n",
      "   -0.2025 if cp>=-0.046753622591495514\n",
      "   -0.1760 if cp>=-0.03710911050438881\n",
      "   -0.0404 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "   -0.7062 if \n",
      "   -0.7062 if cp>=-0.12945516407489777\n",
      "   +0.0000 if cp>=0.022067468613386154\n",
      "   -0.2025 if cp>=-0.057790301740169525\n",
      "   -0.0696 if cp<=0.014167434349656106 & cp>=-0.0022994693368673285\n",
      "Run episode 28 with rewards 10.0\n",
      "============ 29 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7297 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.7297 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.3125 if cv<=-0.6254599928855896\n",
      "   +0.5369 if cp>=-0.09483367949724197\n",
      "   +0.3125 if cv<=-0.6210723280906677\n",
      "   +0.2833 if cp>=-0.046753622591495514\n",
      "   +0.0000 if cp>=-0.018449416384100914\n",
      "   +0.0000 if cp>=-0.03710911050438881\n",
      "   +0.0000 if cp>=-0.03826036676764488\n",
      "   +0.4173 if cp>=-0.057790301740169525\n",
      "   +0.0000 if pa>=0.18111178278923035\n",
      "   +0.0990 if cp>=-0.04137541353702545\n",
      "--------------\n",
      "   -0.6425 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.3003 if cv<=-0.6254599928855896\n",
      "   -0.4615 if cp>=-0.09483367949724197\n",
      "   -0.2166 if cv>=-0.5116368293762207\n",
      "   -0.2166 if cp>=-0.046753622591495514\n",
      "   -0.0000 if cp>=-0.03710911050438881\n",
      "   -0.3422 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "   -0.6425 if \n",
      "   -0.6020 if cp>=-0.12945516407489777\n",
      "   -0.3422 if cp>=-0.057790301740169525\n",
      "   -0.0000 if cp<=0.014167434349656106 & cp>=-0.0022994693368673285\n",
      "   -0.0404 if cp<=-0.1325063854455948\n",
      "Run episode 29 with rewards 9.0\n",
      "============ 30 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.3959 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.3959 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.1332 if cv<=-0.6254599928855896\n",
      "   +0.4016 if cp>=-0.09483367949724197\n",
      "   +0.1332 if cv<=-0.6210723280906677\n",
      "   +0.3049 if cp>=-0.046753622591495514\n",
      "   +0.3049 if cp>=-0.03710911050438881\n",
      "   +0.3049 if cp>=-0.03826036676764488\n",
      "   +0.3458 if cp>=-0.057790301740169525\n",
      "   -0.0000 if pa>=0.18111178278923035\n",
      "   +0.3049 if cp>=-0.04137541353702545\n",
      "   -0.0057 if pa>=0.16756385564804077\n",
      "--------------\n",
      "   -0.3999 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.1043 if cv<=-0.6254599928855896\n",
      "   -0.4039 if cp>=-0.09483367949724197\n",
      "   -0.2348 if cv>=-0.5116368293762207\n",
      "   -0.3359 if cp>=-0.046753622591495514\n",
      "   -0.3359 if cp>=-0.03710911050438881\n",
      "   -0.0488 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "   -0.3999 if \n",
      "   -0.3999 if cp>=-0.12945516407489777\n",
      "   -0.3679 if cp>=-0.057790301740169525\n",
      "   +0.0000 if cp<=-0.1325063854455948\n",
      "   -0.2225 if cp<=0.002532805188093336\n",
      "Run episode 30 with rewards 9.0\n",
      "============ 31 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.3910 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.3910 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.1147 if cv<=-0.6254599928855896\n",
      "   +0.3910 if cp>=-0.09483367949724197\n",
      "   +0.1147 if cv<=-0.6210723280906677\n",
      "   +0.3470 if cp>=-0.046753622591495514\n",
      "   +0.3470 if cp>=-0.03710911050438881\n",
      "   +0.3470 if cp>=-0.03826036676764488\n",
      "   +0.3966 if cp>=-0.057790301740169525\n",
      "   +0.3470 if cp>=-0.04137541353702545\n",
      "   -0.0055 if pa>=0.16756385564804077\n",
      "   +0.0776 if cp<=-0.005939542315900323\n",
      "--------------\n",
      "   -0.4117 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.1247 if cv<=-0.6254599928855896\n",
      "   -0.4117 if cp>=-0.09483367949724197\n",
      "   -0.2194 if cv>=-0.5116368293762207\n",
      "   -0.3646 if cp>=-0.046753622591495514\n",
      "   -0.3646 if cp>=-0.03710911050438881\n",
      "   -0.0688 if cp<=-0.021443277597427368 & cp>=-0.06261669993400573\n",
      "   -0.4117 if \n",
      "   -0.4117 if cp>=-0.12945516407489777\n",
      "   -0.4178 if cp>=-0.057790301740169525\n",
      "   -0.0880 if cp<=0.002532805188093336\n",
      "   -0.0788 if cp>=0.030468126758933067\n",
      "Run episode 31 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 32 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.5124 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.5124 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.3153 if cv<=-0.6254599928855896\n",
      "   +0.4317 if cp>=-0.09483367949724197\n",
      "   +0.3153 if cv<=-0.6210723280906677\n",
      "   +0.2398 if cp>=-0.046753622591495514\n",
      "   +0.1971 if cp>=-0.03710911050438881\n",
      "   +0.1971 if cp>=-0.03826036676764488\n",
      "   +0.2398 if cp>=-0.057790301740169525\n",
      "   +0.1971 if cp>=-0.04137541353702545\n",
      "   +0.5124 if cp<=-0.005939542315900323\n",
      "   -0.0083 if pa>=0.18114443123340607\n",
      "--------------\n",
      "   -0.5230 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.3558 if cv<=-0.6254599928855896\n",
      "   -0.4379 if cp>=-0.09483367949724197\n",
      "   -0.1313 if cv>=-0.5116368293762207\n",
      "   -0.2209 if cp>=-0.046753622591495514\n",
      "   -0.1673 if cp>=-0.03710911050438881\n",
      "   -0.5230 if \n",
      "   -0.5330 if cp>=-0.12945516407489777\n",
      "   -0.2209 if cp>=-0.057790301740169525\n",
      "   -0.5230 if cp<=0.002532805188093336\n",
      "   -0.0000 if cp>=0.030468126758933067\n",
      "   +0.0100 if pa>=0.18114443123340607\n",
      "Run episode 32 with rewards 9.0\n",
      "============ 33 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.4144 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.2951 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0841 if cv<=-0.6254599928855896\n",
      "   +0.4144 if cp>=-0.09483367949724197\n",
      "   +0.0841 if cv<=-0.6210723280906677\n",
      "   +0.3697 if cp>=-0.046753622591495514\n",
      "   +0.3697 if cp>=-0.03710911050438881\n",
      "   +0.3697 if cp>=-0.03826036676764488\n",
      "   +0.3697 if cp>=-0.057790301740169525\n",
      "   +0.3697 if cp>=-0.04137541353702545\n",
      "   +0.0659 if cp<=-0.005939542315900323\n",
      "   -0.0030 if pa>=0.17611287534236908\n",
      "--------------\n",
      "   -0.4359 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0812 if cv<=-0.6254599928855896\n",
      "   -0.4359 if cp>=-0.09483367949724197\n",
      "   -0.2817 if cv>=-0.5116368293762207\n",
      "   -0.4011 if cp>=-0.046753622591495514\n",
      "   -0.4011 if cp>=-0.03710911050438881\n",
      "   -0.4359 if \n",
      "   -0.4359 if cp>=-0.12945516407489777\n",
      "   -0.4011 if cp>=-0.057790301740169525\n",
      "   -0.0812 if cp<=0.002532805188093336\n",
      "   +0.0000 if pa>=0.18114443123340607\n",
      "   -0.0714 if cp>=0.019454795867204666\n",
      "Run episode 33 with rewards 8.0\n",
      "============ 34 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.3731 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.3731 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.1703 if cv<=-0.6254599928855896\n",
      "   +0.3731 if cp>=-0.09483367949724197\n",
      "   +0.1703 if cv<=-0.6210723280906677\n",
      "   +0.2258 if cp>=-0.046753622591495514\n",
      "   +0.2258 if cp>=-0.03710911050438881\n",
      "   +0.2258 if cp>=-0.03826036676764488\n",
      "   +0.2988 if cp>=-0.057790301740169525\n",
      "   +0.2258 if cp>=-0.04137541353702545\n",
      "   +0.3731 if cp<=-0.005939542315900323\n",
      "   +0.1473 if cp<=-0.03657839298248291\n",
      "--------------\n",
      "   -0.4103 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.2137 if cv<=-0.6254599928855896\n",
      "   -0.4103 if cp>=-0.09483367949724197\n",
      "   -0.1551 if cv>=-0.5116368293762207\n",
      "   -0.2179 if cp>=-0.046753622591495514\n",
      "   -0.2179 if cp>=-0.03710911050438881\n",
      "   -0.4103 if \n",
      "   -0.4103 if cp>=-0.12945516407489777\n",
      "   -0.3141 if cp>=-0.057790301740169525\n",
      "   -0.4103 if cp<=0.002532805188093336\n",
      "   +0.0000 if cp>=0.019454795867204666\n",
      "   -0.0502 if cp>=-0.010642851702868938\n",
      "Run episode 34 with rewards 9.0\n",
      "============ 35 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.3893 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.3893 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0833 if cv<=-0.6254599928855896\n",
      "   +0.3893 if cp>=-0.09483367949724197\n",
      "   +0.0833 if cv<=-0.6210723280906677\n",
      "   +0.3961 if cp>=-0.046753622591495514\n",
      "   +0.3809 if cp>=-0.03710911050438881\n",
      "   +0.3809 if cp>=-0.03826036676764488\n",
      "   +0.3961 if cp>=-0.057790301740169525\n",
      "   +0.3961 if cp>=-0.04137541353702545\n",
      "   +0.0203 if cp<=-0.005939542315900323\n",
      "   +0.0466 if cp<=0.005921376449987295\n",
      "--------------\n",
      "   -0.3985 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0944 if cv<=-0.6254599928855896\n",
      "   -0.3985 if cp>=-0.09483367949724197\n",
      "   -0.2318 if cv>=-0.5116368293762207\n",
      "   -0.4050 if cp>=-0.046753622591495514\n",
      "   -0.3877 if cp>=-0.03710911050438881\n",
      "   -0.3985 if \n",
      "   -0.3985 if cp>=-0.12945516407489777\n",
      "   -0.4050 if cp>=-0.057790301740169525\n",
      "   -0.0288 if cp<=0.002532805188093336\n",
      "   -0.3697 if cp>=-0.010642851702868938\n",
      "   -0.0830 if cp>=0.04363064467906952\n",
      "Run episode 35 with rewards 8.0\n",
      "============ 36 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.3184 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.2305 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0673 if cv<=-0.6254599928855896\n",
      "   +0.3184 if cp>=-0.09483367949724197\n",
      "   +0.0673 if cv<=-0.6210723280906677\n",
      "   +0.3184 if cp>=-0.046753622591495514\n",
      "   +0.3184 if cp>=-0.03710911050438881\n",
      "   +0.3184 if cp>=-0.03826036676764488\n",
      "   +0.3184 if cp>=-0.057790301740169525\n",
      "   +0.3184 if cp>=-0.04137541353702545\n",
      "   +0.0673 if cp<=0.005921376449987295\n",
      "   +0.0392 if cp<=-0.0050665199756622275\n",
      "--------------\n",
      "   -0.3225 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0652 if cv<=-0.6254599928855896\n",
      "   -0.3225 if cp>=-0.09483367949724197\n",
      "   -0.2079 if cv>=-0.5116368293762207\n",
      "   -0.3225 if cp>=-0.046753622591495514\n",
      "   -0.3225 if cp>=-0.03710911050438881\n",
      "   -0.3225 if \n",
      "   -0.3225 if cp>=-0.12945516407489777\n",
      "   -0.3225 if cp>=-0.057790301740169525\n",
      "   -0.2855 if cp>=-0.010642851702868938\n",
      "   +0.0000 if cp>=0.04363064467906952\n",
      "   -0.0565 if cp>=0.020192807540297508\n",
      "Run episode 36 with rewards 9.0\n",
      "============ 37 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7685 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.7685 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.3429 if cv<=-0.6254599928855896\n",
      "   +0.5983 if cp>=-0.09483367949724197\n",
      "   +0.3429 if cv<=-0.6210723280906677\n",
      "   +0.1810 if cp>=-0.046753622591495514\n",
      "   +0.0000 if cp>=-0.03710911050438881\n",
      "   +0.0000 if cp>=-0.03826036676764488\n",
      "   +0.4256 if cp>=-0.057790301740169525\n",
      "   +0.0000 if cp>=-0.04137541353702545\n",
      "   +0.7685 if cp<=0.005921376449987295\n",
      "   +0.0489 if cp<=-0.1121879056096077\n",
      "--------------\n",
      "   -0.8468 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.4268 if cv<=-0.6254599928855896\n",
      "   -0.6348 if cp>=-0.09483367949724197\n",
      "   -0.2910 if cv>=-0.5116368293762207\n",
      "   -0.1753 if cp>=-0.046753622591495514\n",
      "   +0.0000 if cp>=-0.03710911050438881\n",
      "   -0.8468 if \n",
      "   -0.8611 if cp>=-0.12945516407489777\n",
      "   -0.4199 if cp>=-0.057790301740169525\n",
      "   +0.0000 if cp>=-0.010642851702868938\n",
      "   +0.0000 if cp>=0.020192807540297508\n",
      "   -0.0565 if cp<=-0.1121879056096077\n",
      "Run episode 37 with rewards 9.0\n",
      "============ 38 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.2925 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.2226 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0825 if cv<=-0.6254599928855896\n",
      "   +0.2976 if cp>=-0.09483367949724197\n",
      "   +0.0825 if cv<=-0.6210723280906677\n",
      "   +0.2465 if cp>=-0.046753622591495514\n",
      "   +0.2465 if cp>=-0.03826036676764488\n",
      "   +0.2726 if cp>=-0.057790301740169525\n",
      "   +0.2465 if cp>=-0.04137541353702545\n",
      "   +0.2925 if cp<=0.005921376449987295\n",
      "   +0.0000 if cp<=-0.1121879056096077\n",
      "   +0.0207 if cp<=-0.010468449071049683 & cp>=-0.03077740557491779\n",
      "--------------\n",
      "   -0.3296 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0777 if cv<=-0.6254599928855896\n",
      "   -0.3342 if cp>=-0.09483367949724197\n",
      "   -0.2110 if cv>=-0.5116368293762207\n",
      "   -0.2891 if cp>=-0.046753622591495514\n",
      "   -0.2891 if cp>=-0.03710911050438881\n",
      "   -0.3296 if \n",
      "   -0.3296 if cp>=-0.12945516407489777\n",
      "   -0.3116 if cp>=-0.057790301740169525\n",
      "   -0.2519 if cp>=-0.010642851702868938\n",
      "   -0.0000 if cp<=-0.1121879056096077\n",
      "   -0.0806 if cp<=-0.0007231626193970435 & cp>=-0.010468449071049683\n",
      "Run episode 38 with rewards 9.0\n",
      "============ 39 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7265 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.7265 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.5066 if cv<=-0.6254599928855896\n",
      "   +0.3720 if cp>=-0.09483367949724197\n",
      "   +0.5066 if cv<=-0.6210723280906677\n",
      "   +0.2520 if cp>=-0.046753622591495514\n",
      "   +0.2199 if cp>=-0.03826036676764488\n",
      "   +0.2520 if cp>=-0.057790301740169525\n",
      "   +0.2199 if cp>=-0.04137541353702545\n",
      "   +0.7265 if cp<=0.005921376449987295\n",
      "   +0.1622 if cp<=-0.010468449071049683 & cp>=-0.03077740557491779\n",
      "   +0.0590 if cp>=-0.018952660262584686\n",
      "--------------\n",
      "   -0.7836 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.5251 if cv<=-0.6254599928855896\n",
      "   -0.4255 if cp>=-0.09483367949724197\n",
      "   -0.2170 if cv>=-0.5116368293762207\n",
      "   -0.2938 if cp>=-0.046753622591495514\n",
      "   -0.2585 if cp>=-0.03710911050438881\n",
      "   -0.7836 if \n",
      "   -0.4769 if cp>=-0.12945516407489777\n",
      "   -0.2938 if cp>=-0.057790301740169525\n",
      "   +0.0000 if cp>=-0.010642851702868938\n",
      "   +0.0000 if cp<=-0.0007231626193970435 & cp>=-0.010468449071049683\n",
      "   -0.6059 if cp<=-0.022373953834176064\n",
      "Run episode 39 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 40 ===========\n",
      "10 actions [0, 0, 0, 0, 1, 0, 0, 0, 0, 0]\n",
      "   +0.3615 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.2607 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0714 if cv<=-0.6254599928855896\n",
      "   +0.3615 if cp>=-0.09483367949724197\n",
      "   +0.0714 if cv<=-0.6210723280906677\n",
      "   +0.3371 if cp>=-0.046753622591495514\n",
      "   +0.3371 if cp>=-0.03826036676764488\n",
      "   +0.3371 if cp>=-0.057790301740169525\n",
      "   +0.3371 if cp>=-0.04137541353702545\n",
      "   +0.0714 if cp<=0.005921376449987295\n",
      "   +0.0172 if cp<=-0.010468449071049683 & cp>=-0.03077740557491779\n",
      "   -0.0026 if pa>=0.19195154309272766\n",
      "--------------\n",
      "   -0.3655 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0395 if cv<=-0.6254599928855896\n",
      "   -0.3655 if cp>=-0.09483367949724197\n",
      "   -0.2658 if cv>=-0.5116368293762207\n",
      "   -0.3472 if cp>=-0.046753622591495514\n",
      "   -0.3472 if cp>=-0.03710911050438881\n",
      "   -0.3655 if \n",
      "   -0.3655 if cp>=-0.12945516407489777\n",
      "   -0.3472 if cp>=-0.057790301740169525\n",
      "   -0.3342 if cp>=-0.010642851702868938\n",
      "   -0.0241 if cp<=-0.022373953834176064\n",
      "   -0.0606 if cp>=0.020835377275943756\n",
      "Run episode 40 with rewards 10.0\n",
      "============ 41 ===========\n",
      "14 actions [0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 1]\n",
      "   +1.1688 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.5927 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -1.6768 if cv<=-0.6254599928855896\n",
      "   +1.2101 if cp>=-0.09483367949724197\n",
      "   -1.6768 if cv<=-0.6210723280906677\n",
      "   -0.1007 if cp>=-0.046753622591495514\n",
      "   -0.9326 if cp>=-0.03826036676764488\n",
      "   +0.5338 if cp>=-0.057790301740169525\n",
      "   -0.1007 if cp>=-0.04137541353702545\n",
      "   +0.3042 if cp<=0.005921376449987295\n",
      "   -2.1927 if cp<=-0.010468449071049683 & cp>=-0.03077740557491779\n",
      "   -0.9325 if cp>=-0.0326911672949791\n",
      "--------------\n",
      "   -0.7286 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +2.6816 if cv<=-0.6254599928855896\n",
      "   -0.7614 if cp>=-0.09483367949724197\n",
      "   -1.0091 if cv>=-0.5116368293762207\n",
      "   +0.8838 if cp>=-0.046753622591495514\n",
      "   +2.6119 if cp>=-0.03710911050438881\n",
      "   -0.7286 if \n",
      "   -0.7286 if cp>=-0.12945516407489777\n",
      "   -0.0809 if cp>=-0.057790301740169525\n",
      "   -1.6030 if cp>=-0.010642851702868938\n",
      "   -0.0000 if cp>=0.020835377275943756\n",
      "   +0.0231 if cp<=0.006297735311090947\n",
      "Run episode 41 with rewards 14.0\n",
      "============ 42 ===========\n",
      "10 actions [0, 0, 0, 0, 1, 0, 0, 0, 1, 1]\n",
      "   -0.4410 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.4429 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -1.2327 if cv<=-0.6254599928855896\n",
      "   +1.9579 if cp>=-0.09483367949724197\n",
      "   -1.2327 if cv<=-0.6210723280906677\n",
      "   -0.4556 if cp>=-0.03826036676764488\n",
      "   +1.3006 if cp>=-0.057790301740169525\n",
      "   -0.4327 if cp>=-0.04137541353702545\n",
      "   +0.6951 if cp<=0.005921376449987295\n",
      "   -2.2972 if cp<=-0.010468449071049683 & cp>=-0.03077740557491779\n",
      "   -0.4556 if cp>=-0.0326911672949791\n",
      "   -1.9558 if cv<=-0.5639529228210449 & cv>=-0.7202362537384033\n",
      "--------------\n",
      "   +0.7395 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +1.5520 if cv<=-0.6254599928855896\n",
      "   -0.9182 if cp>=-0.09483367949724197\n",
      "   -1.8925 if cv>=-0.5116368293762207\n",
      "   +1.0864 if cp>=-0.046753622591495514\n",
      "   +1.1637 if cp>=-0.03710911050438881\n",
      "   -0.8196 if \n",
      "   -0.8196 if cp>=-0.12945516407489777\n",
      "   -0.5904 if cp>=-0.057790301740169525\n",
      "   -1.2276 if cp>=-0.010642851702868938\n",
      "   -0.3743 if cp<=0.006297735311090947\n",
      "   +2.2047 if cp>=-0.03664170019328594 & cv<=-0.5639529228210449 & cv>=-0.7202362537384033\n",
      "Run episode 42 with rewards 10.0\n",
      "============ 43 ===========\n",
      "12 actions [0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]\n",
      "   +0.2629 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.1011 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.9519 if cv<=-0.6254599928855896\n",
      "   +1.6461 if cp>=-0.09483367949724197\n",
      "   -0.9519 if cv<=-0.6210723280906677\n",
      "   -0.8114 if cp>=-0.03826036676764488\n",
      "   -0.6414 if cp>=-0.057790301740169525\n",
      "   +0.2629 if cp<=0.005921376449987295\n",
      "   +1.0447 if cp<=-0.010468449071049683 & cp>=-0.03077740557491779\n",
      "   +1.0447 if cp>=-0.0326911672949791\n",
      "   -0.0000 if cv<=-0.5639529228210449 & cv>=-0.7202362537384033\n",
      "   +0.9043 if cp<=-0.05436729192733765\n",
      "--------------\n",
      "   -1.0728 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +3.1553 if cv<=-0.6254599928855896\n",
      "   -1.5391 if cp>=-0.09483367949724197\n",
      "   -1.8838 if cv>=-0.5116368293762207\n",
      "   +1.0088 if cp>=-0.046753622591495514\n",
      "   +1.0088 if cp>=-0.03710911050438881\n",
      "   -1.0728 if \n",
      "   -1.0728 if cp>=-0.12945516407489777\n",
      "   +1.0025 if cp>=-0.057790301740169525\n",
      "   -0.0000 if cp>=-0.010642851702868938\n",
      "   -0.0000 if cp>=-0.03664170019328594 & cv<=-0.5639529228210449 & cv>=-0.7202362537384033\n",
      "   +0.3863 if pav>=1.9479126930236816\n",
      "Run episode 43 with rewards 12.0\n",
      "============ 44 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.0711 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.6570 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.8739 if cv<=-0.6254599928855896\n",
      "   -0.0341 if cp>=-0.09483367949724197\n",
      "   -0.8739 if cv<=-0.6210723280906677\n",
      "   +1.1718 if cp>=-0.03826036676764488\n",
      "   -0.9617 if cp>=-0.057790301740169525\n",
      "   -0.8511 if cp<=0.005921376449987295\n",
      "   +2.2491 if cp<=-0.010468449071049683 & cp>=-0.03077740557491779\n",
      "   +1.1718 if cp>=-0.0326911672949791\n",
      "   +1.6187 if cp<=-0.05436729192733765\n",
      "   +1.7344 if cp<=-0.006529654166661181\n",
      "--------------\n",
      "   +0.0599 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +1.7577 if cv<=-0.6254599928855896\n",
      "   -0.1406 if cp>=-0.09483367949724197\n",
      "   -1.9659 if cv>=-0.5116368293762207\n",
      "   +1.3757 if cp>=-0.046753622591495514\n",
      "   -0.3728 if cp>=-0.03710911050438881\n",
      "   -1.3926 if \n",
      "   -1.3926 if cp>=-0.12945516407489777\n",
      "   +1.3757 if cp>=-0.057790301740169525\n",
      "   -1.1844 if cp>=-0.03664170019328594 & cv<=-0.5639529228210449 & cv>=-0.7202362537384033\n",
      "   +0.0202 if pav>=1.9479126930236816\n",
      "   -2.1859 if cp<=-0.006529654166661181 & cp>=-0.03750900328159332 & cv<=-0.6757340073585507\n",
      "Run episode 44 with rewards 9.0\n",
      "============ 45 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.6071 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.6071 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.3842 if cv<=-0.6254599928855896\n",
      "   +0.3842 if cv<=-0.6210723280906677\n",
      "   -0.0000 if cp>=-0.03826036676764488\n",
      "   +0.1669 if cp>=-0.057790301740169525\n",
      "   +0.6071 if cp<=0.005921376449987295\n",
      "   -0.0000 if cp<=-0.010468449071049683 & cp>=-0.03077740557491779\n",
      "   -0.0000 if cp>=-0.0326911672949791\n",
      "   +0.4403 if cp<=-0.05436729192733765\n",
      "   +0.6071 if cp<=-0.006529654166661181\n",
      "   +0.0607 if cp>=-0.04837080463767052\n",
      "--------------\n",
      "   -0.9017 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.3359 if cv<=-0.6254599928855896\n",
      "   -0.7290 if cp>=-0.09483367949724197\n",
      "   -0.5371 if cv>=-0.5116368293762207\n",
      "   -0.0000 if cp>=-0.046753622591495514\n",
      "   -0.0000 if cp>=-0.03710911050438881\n",
      "   -0.9017 if \n",
      "   -0.8199 if cp>=-0.12945516407489777\n",
      "   -0.5371 if cp>=-0.057790301740169525\n",
      "   -0.0000 if cp>=-0.03664170019328594 & cv<=-0.5639529228210449 & cv>=-0.7202362537384033\n",
      "   -0.0000 if cp<=-0.006529654166661181 & cp>=-0.03750900328159332 & cv<=-0.6757340073585507\n",
      "   +0.0136 if pa>=0.19996565580368042\n",
      "Run episode 45 with rewards 10.0\n",
      "============ 46 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.2093 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.4114 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.1743 if cv<=-0.6254599928855896\n",
      "   +0.1743 if cv<=-0.6210723280906677\n",
      "   +0.2370 if cp>=-0.03826036676764488\n",
      "   +0.2556 if cp>=-0.057790301740169525\n",
      "   +0.4114 if cp<=0.005921376449987295\n",
      "   +0.2020 if cp<=-0.010468449071049683 & cp>=-0.03077740557491779\n",
      "   +0.1558 if cp<=-0.05436729192733765\n",
      "   +0.4114 if cp<=-0.006529654166661181\n",
      "   +0.2556 if cp>=-0.04837080463767052\n",
      "   +0.2917 if cp>=-0.06968495920300484\n",
      "--------------\n",
      "   -0.1825 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.1266 if cv<=-0.6254599928855896\n",
      "   -0.5547 if cp>=-0.09483367949724197\n",
      "   -0.4184 if cv>=-0.5116368293762207\n",
      "   -0.4943 if cp>=-0.046753622591495514\n",
      "   -0.6009 if \n",
      "   -0.5835 if cp>=-0.12945516407489777\n",
      "   -0.4943 if cp>=-0.057790301740169525\n",
      "   -0.0558 if cp>=-0.03664170019328594 & cv<=-0.5639529228210449 & cv>=-0.7202362537384033\n",
      "   +0.0000 if cp<=-0.006529654166661181 & cp>=-0.03750900328159332 & cv<=-0.6757340073585507\n",
      "   +0.0000 if pa>=0.19996565580368042\n",
      "   -0.2823 if cp<=-0.02506732977926731\n",
      "Run episode 46 with rewards 9.0\n",
      "============ 47 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.3766 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.3766 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.1456 if cv<=-0.6254599928855896\n",
      "   +0.1456 if cv<=-0.6210723280906677\n",
      "   +0.2541 if cp>=-0.03826036676764488\n",
      "   +0.2764 if cp>=-0.057790301740169525\n",
      "   +0.3766 if cp<=0.005921376449987295\n",
      "   +0.1245 if cp<=-0.010468449071049683 & cp>=-0.03077740557491779\n",
      "   +0.3766 if cp<=-0.006529654166661181\n",
      "   +0.2764 if cp>=-0.04837080463767052\n",
      "   +0.3439 if cp>=-0.06968495920300484\n",
      "   +0.1225 if cp<=-0.042879112809896466\n",
      "--------------\n",
      "   -0.4778 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.1445 if cv<=-0.6254599928855896\n",
      "   -0.4871 if cp>=-0.09483367949724197\n",
      "   -0.2754 if cv>=-0.5116368293762207\n",
      "   -0.3890 if cp>=-0.046753622591495514\n",
      "   -0.4778 if \n",
      "   -0.4778 if cp>=-0.12945516407489777\n",
      "   -0.3890 if cp>=-0.057790301740169525\n",
      "   -0.0579 if cp>=-0.03664170019328594 & cv<=-0.5639529228210449 & cv>=-0.7202362537384033\n",
      "   +0.0000 if pa>=0.19996565580368042\n",
      "   -0.1445 if cp<=-0.02506732977926731\n",
      "   -0.2583 if cp<=-0.009596847556531427\n",
      "Run episode 47 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 48 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.4787 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.4787 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.2743 if cv<=-0.6254599928855896\n",
      "   +0.2743 if cv<=-0.6210723280906677\n",
      "   +0.1421 if cp>=-0.03826036676764488\n",
      "   +0.2512 if cp>=-0.057790301740169525\n",
      "   +0.4787 if cp<=0.005921376449987295\n",
      "   +0.1421 if cp<=-0.010468449071049683 & cp>=-0.03077740557491779\n",
      "   +0.4787 if cp<=-0.006529654166661181\n",
      "   +0.2044 if cp>=-0.04837080463767052\n",
      "   +0.3216 if cp>=-0.06968495920300484\n",
      "   +0.1571 if cp<=-0.07556589245796204\n",
      "--------------\n",
      "   -0.4920 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.2689 if cv<=-0.6254599928855896\n",
      "   -0.3984 if cp>=-0.09483367949724197\n",
      "   -0.1563 if cv>=-0.5116368293762207\n",
      "   -0.2231 if cp>=-0.046753622591495514\n",
      "   -0.4920 if \n",
      "   -0.4612 if cp>=-0.12945516407489777\n",
      "   -0.2693 if cp>=-0.057790301740169525\n",
      "   -0.0000 if cp>=-0.03664170019328594 & cv<=-0.5639529228210449 & cv>=-0.7202362537384033\n",
      "   -0.4920 if cp<=-0.02506732977926731\n",
      "   -0.4920 if cp<=-0.009596847556531427\n",
      "   +0.0127 if pa>=0.2021649330854416\n",
      "Run episode 48 with rewards 9.0\n",
      "============ 49 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.4833 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.4833 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.1173 if cv<=-0.6254599928855896\n",
      "   +0.1173 if cv<=-0.6210723280906677\n",
      "   +0.4376 if cp>=-0.057790301740169525\n",
      "   +0.4833 if cp<=0.005921376449987295\n",
      "   +0.0262 if cp<=-0.010468449071049683 & cp>=-0.03077740557491779\n",
      "   +0.1173 if cp<=-0.006529654166661181\n",
      "   +0.4376 if cp>=-0.04837080463767052\n",
      "   +0.4672 if cp>=-0.06968495920300484\n",
      "   +0.0161 if cp<=-0.07556589245796204\n",
      "   +0.0573 if cp<=-0.03578396514058113\n",
      "--------------\n",
      "   -0.4400 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.1415 if cv<=-0.6254599928855896\n",
      "   -0.4469 if cp>=-0.09483367949724197\n",
      "   -0.2985 if cv>=-0.5116368293762207\n",
      "   -0.3719 if cp>=-0.046753622591495514\n",
      "   -0.4400 if \n",
      "   -0.4400 if cp>=-0.12945516407489777\n",
      "   -0.3719 if cp>=-0.057790301740169525\n",
      "   -0.0905 if cp<=-0.02506732977926731\n",
      "   -0.1415 if cp<=-0.009596847556531427\n",
      "   +0.0000 if pa>=0.2021649330854416\n",
      "   -0.3246 if cp>=-0.012465757131576528\n",
      "Run episode 49 with rewards 10.0\n",
      "============ 50 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.5063 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.5063 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.1325 if cv<=-0.6254599928855896\n",
      "   +0.1325 if cv<=-0.6210723280906677\n",
      "   +0.4964 if cp>=-0.057790301740169525\n",
      "   +0.0867 if cp<=0.005921376449987295\n",
      "   +0.0273 if cp<=-0.010468449071049683 & cp>=-0.03077740557491779\n",
      "   +0.0533 if cp<=-0.006529654166661181\n",
      "   +0.4964 if cp>=-0.04837080463767052\n",
      "   +0.5361 if cp>=-0.06968495920300484\n",
      "   +0.0260 if cp<=-0.03578396514058113\n",
      "   +0.1325 if cp<=0.021001322194933895\n",
      "--------------\n",
      "   -0.4603 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.1173 if cv<=-0.6254599928855896\n",
      "   -0.4846 if cp>=-0.09483367949724197\n",
      "   -0.2589 if cv>=-0.5116368293762207\n",
      "   -0.4509 if cp>=-0.046753622591495514\n",
      "   -0.4603 if \n",
      "   -0.4603 if cp>=-0.12945516407489777\n",
      "   -0.4509 if cp>=-0.057790301740169525\n",
      "   -0.0225 if cp<=-0.02506732977926731\n",
      "   -0.0439 if cp<=-0.009596847556531427\n",
      "   -0.4164 if cp>=-0.012465757131576528\n",
      "   -0.0439 if cp<=-0.0063965361332520825\n",
      "Run episode 50 with rewards 8.0\n",
      "============ 51 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.4001 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.4001 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0705 if cv<=-0.6254599928855896\n",
      "   +0.0705 if cv<=-0.6210723280906677\n",
      "   +0.4060 if cp>=-0.057790301740169525\n",
      "   +0.0705 if cp<=0.005921376449987295\n",
      "   +0.0282 if cp<=-0.010468449071049683 & cp>=-0.03077740557491779\n",
      "   +0.0378 if cp<=-0.006529654166661181\n",
      "   +0.4060 if cp>=-0.04837080463767052\n",
      "   +0.4001 if cp>=-0.06968495920300484\n",
      "   +0.1311 if cp<=0.021001322194933895\n",
      "   +0.1215 if cp<=0.015123616531491288 & cp>=-0.027089172601699827\n",
      "--------------\n",
      "   -0.3870 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0673 if cv<=-0.6254599928855896\n",
      "   -0.3870 if cp>=-0.09483367949724197\n",
      "   -0.2535 if cv>=-0.5116368293762207\n",
      "   -0.3923 if cp>=-0.046753622591495514\n",
      "   -0.3870 if \n",
      "   -0.3870 if cp>=-0.12945516407489777\n",
      "   -0.3923 if cp>=-0.057790301740169525\n",
      "   -0.0345 if cp<=-0.009596847556531427\n",
      "   -0.3525 if cp>=-0.012465757131576528\n",
      "   -0.0345 if cp<=-0.0063965361332520825\n",
      "   -0.0922 if cp>=0.02678295224905014\n",
      "Run episode 51 with rewards 10.0\n",
      "============ 52 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.5522 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.4503 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.2716 if cv<=-0.6254599928855896\n",
      "   +0.2716 if cv<=-0.6210723280906677\n",
      "   +0.2806 if cp>=-0.057790301740169525\n",
      "   +0.5522 if cp<=0.005921376449987295\n",
      "   +0.5522 if cp<=-0.006529654166661181\n",
      "   +0.2112 if cp>=-0.04837080463767052\n",
      "   +0.3419 if cp>=-0.06968495920300484\n",
      "   +0.5522 if cp<=0.021001322194933895\n",
      "   +0.0000 if cp<=0.015123616531491288 & cp>=-0.027089172601699827\n",
      "   +0.3920 if cp<=-0.04665858522057533\n",
      "--------------\n",
      "   -0.7149 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.4212 if cv<=-0.6254599928855896\n",
      "   -0.4782 if cp>=-0.09483367949724197\n",
      "   -0.2048 if cv>=-0.5116368293762207\n",
      "   -0.1483 if cp>=-0.046753622591495514\n",
      "   -0.7149 if \n",
      "   -0.6723 if cp>=-0.12945516407489777\n",
      "   -0.2937 if cp>=-0.057790301740169525\n",
      "   -0.0000 if cp>=-0.012465757131576528\n",
      "   -0.7149 if cp<=-0.0063965361332520825\n",
      "   -0.0000 if cp>=0.02678295224905014\n",
      "   +0.0210 if pa>=0.2079688161611557\n",
      "Run episode 52 with rewards 9.0\n",
      "============ 53 ===========\n",
      "12 actions [1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.2906 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.2906 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0834 if cv<=-0.6254599928855896\n",
      "   +0.0834 if cv<=-0.6210723280906677\n",
      "   +0.2459 if cp>=-0.057790301740169525\n",
      "   +0.2906 if cp<=0.005921376449987295\n",
      "   +0.2906 if cp<=-0.006529654166661181\n",
      "   +0.2264 if cp>=-0.04837080463767052\n",
      "   +0.2459 if cp>=-0.06968495920300484\n",
      "   +0.2906 if cp<=0.021001322194933895\n",
      "   +0.0642 if cp<=-0.04665858522057533\n",
      "   +0.0834 if cp<=-0.032050771266221995\n",
      "--------------\n",
      "   -0.3359 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0922 if cv<=-0.6254599928855896\n",
      "   -0.3193 if cp>=-0.09483367949724197\n",
      "   -0.1920 if cv>=-0.5116368293762207\n",
      "   -0.2679 if cp>=-0.046753622591495514\n",
      "   -0.3359 if \n",
      "   -0.3359 if cp>=-0.12945516407489777\n",
      "   -0.2875 if cp>=-0.057790301740169525\n",
      "   +0.0000 if cp>=-0.012465757131576528\n",
      "   -0.3359 if cp<=-0.0063965361332520825\n",
      "   +0.0000 if pa>=0.2079688161611557\n",
      "   -0.1029 if cp<=-0.020029634982347486 & cp>=-0.032050771266221995\n",
      "Run episode 53 with rewards 12.0\n",
      "============ 54 ===========\n",
      "13 actions [0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0]\n",
      "   +1.0400 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -2.0149 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +1.0400 if cv<=-0.6254599928855896\n",
      "   +1.0400 if cv<=-0.6210723280906677\n",
      "   +0.2686 if cp>=-0.057790301740169525\n",
      "   +0.1416 if cp<=0.005921376449987295\n",
      "   +0.1416 if cp<=-0.006529654166661181\n",
      "   +0.2686 if cp>=-0.04837080463767052\n",
      "   +0.3253 if cp>=-0.06968495920300484\n",
      "   +0.3274 if cp<=0.021001322194933895\n",
      "   +0.0673 if cp<=-0.032050771266221995\n",
      "   +2.0443 if cp>=0.051106419414281845\n",
      "--------------\n",
      "   -1.0746 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -1.0746 if cv<=-0.6254599928855896\n",
      "   -0.0749 if cp>=-0.09483367949724197\n",
      "   +1.0131 if cv>=-0.5116368293762207\n",
      "   -0.0444 if cp>=-0.046753622591495514\n",
      "   -0.0615 if \n",
      "   -0.0615 if cp>=-0.12945516407489777\n",
      "   -0.0444 if cp>=-0.057790301740169525\n",
      "   -0.1330 if cp<=-0.0063965361332520825\n",
      "   +0.0000 if pa>=0.2079688161611557\n",
      "   +0.0000 if cp<=-0.020029634982347486 & cp>=-0.032050771266221995\n",
      "   -2.9876 if pa<=-0.03690292090177536\n",
      "Run episode 54 with rewards 13.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 55 ===========\n",
      "34 actions [0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   -0.7089 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.7089 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.1686 if cv<=-0.6254599928855896\n",
      "   -0.1686 if cv<=-0.6210723280906677\n",
      "   +1.1230 if cp>=-0.057790301740169525\n",
      "   -0.4767 if cp<=0.005921376449987295\n",
      "   -0.8674 if cp<=-0.006529654166661181\n",
      "   +1.1230 if cp>=-0.04837080463767052\n",
      "   -0.7144 if cp>=-0.06968495920300484\n",
      "   +1.7970 if cp<=0.021001322194933895\n",
      "   +0.0000 if cp>=0.051106419414281845\n",
      "   +2.3128 if cp>=0.041614193469285965\n",
      "--------------\n",
      "   +0.3263 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   -0.0730 if cv<=-0.6254599928855896\n",
      "   +0.3263 if cp>=-0.09483367949724197\n",
      "   +0.3993 if cv>=-0.5116368293762207\n",
      "   -1.1937 if cp>=-0.046753622591495514\n",
      "   +0.3263 if \n",
      "   +0.3263 if cp>=-0.12945516407489777\n",
      "   -1.1937 if cp>=-0.057790301740169525\n",
      "   +0.8270 if cp<=-0.0063965361332520825\n",
      "   -0.3713 if cp<=-0.020029634982347486 & cp>=-0.032050771266221995\n",
      "   -0.0000 if pa<=-0.03690292090177536\n",
      "   -2.2387 if cp>=0.041614193469285965\n",
      "Run episode 55 with rewards 34.0\n",
      "============ 56 ===========\n",
      "30 actions [0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.6049 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +2.3473 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -4.0128 if cv<=-0.6254599928855896\n",
      "   -4.0128 if cv<=-0.6210723280906677\n",
      "   +3.1006 if cp>=-0.057790301740169525\n",
      "   -0.6403 if cp<=0.005921376449987295\n",
      "   -1.0755 if cp<=-0.006529654166661181\n",
      "   +2.9480 if cp>=-0.04837080463767052\n",
      "   +2.9441 if cp>=-0.06968495920300484\n",
      "   -0.3637 if cp<=0.021001322194933895\n",
      "   +0.0003 if cp>=0.041614193469285965\n",
      "   -4.5891 if cp<=-0.00736388750374316\n",
      "--------------\n",
      "   -4.0057 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +4.0615 if cv<=-0.6254599928855896\n",
      "   +1.9255 if cp>=-0.09483367949724197\n",
      "   -2.1306 if cv>=-0.5116368293762207\n",
      "   -2.1815 if cp>=-0.046753622591495514\n",
      "   +1.9309 if \n",
      "   +1.9267 if cp>=-0.12945516407489777\n",
      "   -4.9230 if cp>=-0.057790301740169525\n",
      "   +3.3417 if cp<=-0.0063965361332520825\n",
      "   -3.3042 if cp<=-0.020029634982347486 & cp>=-0.032050771266221995\n",
      "   -0.0005 if cp>=0.041614193469285965\n",
      "   -4.9941 if cp>=-0.00736388750374316\n",
      "Run episode 56 with rewards 30.0\n",
      "============ 57 ===========\n",
      "53 actions [0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   +0.2346 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.6945 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -1.4341 if cv<=-0.6254599928855896\n",
      "   -1.4341 if cv<=-0.6210723280906677\n",
      "   +1.6122 if cp>=-0.057790301740169525\n",
      "   -0.9936 if cp<=0.005921376449987295\n",
      "   -0.9946 if cp<=-0.006529654166661181\n",
      "   +0.8471 if cp>=-0.04837080463767052\n",
      "   +1.6083 if cp>=-0.06968495920300484\n",
      "   -0.9936 if cp<=0.021001322194933895\n",
      "   -0.9946 if cp<=-0.00736388750374316\n",
      "   +3.1164 if cp<=-0.04411777853965758 & cv>=-0.5844623446464539 & pa<=0.11316266506910327\n",
      "--------------\n",
      "   -0.5215 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +1.3818 if cv<=-0.6254599928855896\n",
      "   -0.1477 if cp>=-0.09483367949724197\n",
      "   +1.4588 if cv>=-0.5116368293762207\n",
      "   -0.9878 if cp>=-0.046753622591495514\n",
      "   +0.4997 if \n",
      "   +0.4997 if cp>=-0.12945516407489777\n",
      "   -0.8951 if cp>=-0.057790301740169525\n",
      "   +0.6276 if cp<=-0.0063965361332520825\n",
      "   -1.7956 if cp<=-0.020029634982347486 & cp>=-0.032050771266221995\n",
      "   -0.1279 if cp>=-0.00736388750374316\n",
      "   +1.6915 if cv<=-0.5844623446464539\n",
      "Run episode 57 with rewards 53.0\n",
      "best\n",
      "============ 58 ===========\n",
      "39 actions [1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0]\n",
      "   -0.3830 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -4.6586 if cv<=-0.6254599928855896\n",
      "   -4.6586 if cv<=-0.6210723280906677\n",
      "   +4.7914 if cp>=-0.057790301740169525\n",
      "   +0.7160 if cp<=0.005921376449987295\n",
      "   -3.4158 if cp<=-0.006529654166661181\n",
      "   +1.4455 if cp>=-0.04837080463767052\n",
      "   +0.0637 if cp>=-0.06968495920300484\n",
      "   +1.4461 if cp<=0.021001322194933895\n",
      "   -3.4158 if cp<=-0.00736388750374316\n",
      "   +3.2474 if cp<=-0.04411777853965758 & cv>=-0.5844623446464539 & pa<=0.11316266506910327\n",
      "   -3.6944 if cp>=-0.03789158836007118 & cv>=-0.5892714262008667\n",
      "--------------\n",
      "   -2.5155 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +2.8683 if cv<=-0.6254599928855896\n",
      "   +2.2949 if cp>=-0.09483367949724197\n",
      "   +3.2724 if cv>=-0.5116368293762207\n",
      "   -5.3678 if cp>=-0.046753622591495514\n",
      "   +2.7446 if \n",
      "   +2.7446 if cp>=-0.12945516407489777\n",
      "   -4.6431 if cp>=-0.057790301740169525\n",
      "   +0.9196 if cp<=-0.0063965361332520825\n",
      "   +0.5866 if cp<=-0.020029634982347486 & cp>=-0.032050771266221995\n",
      "   +4.9368 if cv<=-0.5844623446464539\n",
      "   -3.9091 if cp<=-0.03789158836007118\n",
      "Run episode 58 with rewards 39.0\n",
      "============ 59 ===========\n",
      "11 actions [1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0]\n",
      "   -2.3362 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -1.2545 if cv<=-0.6254599928855896\n",
      "   -1.2545 if cv<=-0.6210723280906677\n",
      "   +3.6056 if cp>=-0.057790301740169525\n",
      "   +0.1224 if cp<=0.005921376449987295\n",
      "   -2.4559 if cp<=-0.006529654166661181\n",
      "   +0.0403 if cp>=-0.04837080463767052\n",
      "   +2.4480 if cp<=0.021001322194933895\n",
      "   -3.8101 if cp<=-0.00736388750374316\n",
      "   +2.6944 if cp<=-0.04411777853965758 & cv>=-0.5844623446464539 & pa<=0.11316266506910327\n",
      "   -1.4079 if cp>=-0.03789158836007118 & cv>=-0.5892714262008667\n",
      "   +4.5828 if cp<=0.028416517376899722 & cp>=0.01171111185103657 & cv<=0.03980387896299362 & cv>=-0.5352908611297608\n",
      "--------------\n",
      "   -0.7114 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +2.0597 if cv<=-0.6254599928855896\n",
      "   +0.4144 if cp>=-0.09483367949724197\n",
      "   +5.3519 if cv>=-0.5116368293762207\n",
      "   -2.1626 if cp>=-0.046753622591495514\n",
      "   +0.8776 if \n",
      "   +0.8776 if cp>=-0.12945516407489777\n",
      "   -2.6298 if cp>=-0.057790301740169525\n",
      "   +0.7903 if cp<=-0.0063965361332520825\n",
      "   +2.0597 if cv<=-0.5844623446464539\n",
      "   -1.2947 if cp<=-0.03789158836007118\n",
      "   -1.9157 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "Run episode 59 with rewards 11.0\n",
      "============ 60 ===========\n",
      "29 actions [1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1]\n",
      "   -1.7733 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cv<=-0.6254599928855896\n",
      "   +0.0000 if cv<=-0.6210723280906677\n",
      "   +3.6172 if cp>=-0.057790301740169525\n",
      "   -1.2970 if cp<=0.005921376449987295\n",
      "   -1.2970 if cp<=-0.006529654166661181\n",
      "   +1.2472 if cp<=0.021001322194933895\n",
      "   -1.2970 if cp<=-0.00736388750374316\n",
      "   -1.7733 if cp<=-0.04411777853965758 & cv>=-0.5844623446464539 & pa<=0.11316266506910327\n",
      "   -0.9218 if cp>=-0.03789158836007118 & cv>=-0.5892714262008667\n",
      "   +0.0000 if cp<=0.028416517376899722 & cp>=0.01171111185103657 & cv<=0.03980387896299362 & cv>=-0.5352908611297608\n",
      "   -2.9092 if pa>=-0.04247509688138962\n",
      "--------------\n",
      "   +0.0000 if cv<=0.213888081908226 & pa>=-0.029433537274599072\n",
      "   +0.0000 if cv<=-0.6254599928855896\n",
      "   +0.3097 if cv>=-0.5116368293762207\n",
      "   +0.3097 if cp>=-0.046753622591495514\n",
      "   +0.3097 if \n",
      "   +0.3097 if cp>=-0.12945516407489777\n",
      "   +0.3097 if cp>=-0.057790301740169525\n",
      "   +0.7288 if cp<=-0.0063965361332520825\n",
      "   +0.0000 if cv<=-0.5844623446464539\n",
      "   -1.4305 if cp<=-0.03789158836007118\n",
      "   -0.5071 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +2.4888 if pav>=0.018923847004771233\n",
      "Run episode 60 with rewards 29.0\n",
      "============ 61 ===========\n",
      "29 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0]\n",
      "   +0.0000 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   +0.0000 if cv<=-0.6210723280906677\n",
      "   +0.0851 if cp>=-0.057790301740169525\n",
      "   +2.1937 if cp<=0.005921376449987295\n",
      "   -0.5396 if cp<=-0.006529654166661181\n",
      "   -1.7897 if cp<=0.021001322194933895\n",
      "   -0.5396 if cp<=-0.00736388750374316\n",
      "   +0.0000 if cp<=-0.04411777853965758 & cv>=-0.5844623446464539 & pa<=0.11316266506910327\n",
      "   +0.0850 if cp>=-0.03789158836007118 & cv>=-0.5892714262008667\n",
      "   +3.0105 if cp<=0.028416517376899722 & cp>=0.01171111185103657 & cv<=0.03980387896299362 & cv>=-0.5352908611297608\n",
      "   -5.0579 if pa>=-0.04247509688138962\n",
      "   +3.4926 if cp>=-0.014962592348456382 & cv>=-0.31691043376922606 & pav<=0.004587148874998222\n",
      "--------------\n",
      "   -0.0000 if cv<=-0.6254599928855896\n",
      "   -0.3234 if cv>=-0.5116368293762207\n",
      "   -0.1095 if cp>=-0.046753622591495514\n",
      "   -0.1095 if \n",
      "   -0.1095 if cp>=-0.12945516407489777\n",
      "   -0.1095 if cp>=-0.057790301740169525\n",
      "   +1.6235 if cp<=-0.0063965361332520825\n",
      "   -0.0000 if cv<=-0.5844623446464539\n",
      "   -0.0000 if cp<=-0.03789158836007118\n",
      "   +0.3902 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +6.4816 if pav>=0.018923847004771233\n",
      "   +2.8376 if cp<=0.03927613794803621 & cp>=0.0025158711243420907\n",
      "Run episode 61 with rewards 29.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 62 ===========\n",
      "54 actions [1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0]\n",
      "   +0.0000 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -1.0742 if cp>=-0.057790301740169525\n",
      "   -3.2124 if cp<=0.005921376449987295\n",
      "   -0.0083 if cp<=-0.006529654166661181\n",
      "   -0.2761 if cp<=0.021001322194933895\n",
      "   -0.0083 if cp<=-0.00736388750374316\n",
      "   +0.0000 if cp<=-0.04411777853965758 & cv>=-0.5844623446464539 & pa<=0.11316266506910327\n",
      "   -1.0742 if cp>=-0.03789158836007118 & cv>=-0.5892714262008667\n",
      "   +1.2854 if cp<=0.028416517376899722 & cp>=0.01171111185103657 & cv<=0.03980387896299362 & cv>=-0.5352908611297608\n",
      "   -3.6301 if pa>=-0.04247509688138962\n",
      "   +5.9558 if cp>=-0.014962592348456382 & cv>=-0.31691043376922606 & pav<=0.004587148874998222\n",
      "   +2.5622 if cp>=0.0028268722817301802 & pa>=-0.15071093142032624\n",
      "--------------\n",
      "   +0.1188 if cv>=-0.5116368293762207\n",
      "   +0.1188 if cp>=-0.046753622591495514\n",
      "   +0.1188 if \n",
      "   +0.1188 if cp>=-0.12945516407489777\n",
      "   +0.1188 if cp>=-0.057790301740169525\n",
      "   +0.1858 if cp<=-0.0063965361332520825\n",
      "   +0.0000 if cv<=-0.5844623446464539\n",
      "   +0.0000 if cp<=-0.03789158836007118\n",
      "   +1.0934 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +3.4559 if pav>=0.018923847004771233\n",
      "   +1.0443 if cp<=0.03927613794803621 & cp>=0.0025158711243420907\n",
      "   -3.7278 if cv>=1.0074654817581177\n",
      "Run episode 62 with rewards 54.0\n",
      "best\n",
      "============ 63 ===========\n",
      "36 actions [1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1]\n",
      "   +0.7550 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.9856 if cp>=-0.057790301740169525\n",
      "   -1.8265 if cp<=0.005921376449987295\n",
      "   +0.1195 if cp<=-0.006529654166661181\n",
      "   -0.5493 if cp<=0.021001322194933895\n",
      "   +0.1195 if cp<=-0.00736388750374316\n",
      "   -0.9856 if cp>=-0.03789158836007118 & cv>=-0.5892714262008667\n",
      "   +0.3570 if cp<=0.028416517376899722 & cp>=0.01171111185103657 & cv<=0.03980387896299362 & cv>=-0.5352908611297608\n",
      "   -3.5798 if pa>=-0.04247509688138962\n",
      "   +7.0708 if cp>=-0.014962592348456382 & cv>=-0.31691043376922606 & pav<=0.004587148874998222\n",
      "   +0.7725 if cp>=0.0028268722817301802 & pa>=-0.15071093142032624\n",
      "   +3.9498 if pa>=0.04578816518187523\n",
      "--------------\n",
      "   -0.1013 if cv>=-0.5116368293762207\n",
      "   -0.1013 if cp>=-0.046753622591495514\n",
      "   -0.1013 if \n",
      "   -0.1013 if cp>=-0.12945516407489777\n",
      "   -0.1013 if cp>=-0.057790301740169525\n",
      "   -0.5961 if cp<=-0.0063965361332520825\n",
      "   +0.0000 if cp<=-0.03789158836007118\n",
      "   +2.4856 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +5.5790 if pav>=0.018923847004771233\n",
      "   +1.3524 if cp<=0.03927613794803621 & cp>=0.0025158711243420907\n",
      "   +0.0000 if cv>=1.0074654817581177\n",
      "   -4.0709 if pa>=0.04578816518187523\n",
      "Run episode 63 with rewards 36.0\n",
      "============ 64 ===========\n",
      "51 actions [1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1]\n",
      "   -0.1054 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -1.2720 if cp>=-0.057790301740169525\n",
      "   +1.0884 if cp<=0.005921376449987295\n",
      "   -1.2720 if cp<=0.021001322194933895\n",
      "   -5.0440 if cp<=-0.00736388750374316\n",
      "   -1.2720 if cp>=-0.03789158836007118 & cv>=-0.5892714262008667\n",
      "   +0.0000 if cp<=0.028416517376899722 & cp>=0.01171111185103657 & cv<=0.03980387896299362 & cv>=-0.5352908611297608\n",
      "   +0.0000 if pa>=-0.04247509688138962\n",
      "   +7.8693 if cp>=-0.014962592348456382 & cv>=-0.31691043376922606 & pav<=0.004587148874998222\n",
      "   +0.5019 if cp>=0.0028268722817301802 & pa>=-0.15071093142032624\n",
      "   +0.0000 if pa>=0.04578816518187523\n",
      "   +1.2879 if cv<=0.21199920773506165\n",
      "--------------\n",
      "   -0.2288 if cv>=-0.5116368293762207\n",
      "   -0.2288 if cp>=-0.046753622591495514\n",
      "   -0.2288 if \n",
      "   -0.2288 if cp>=-0.12945516407489777\n",
      "   -0.2288 if cp>=-0.057790301740169525\n",
      "   +0.8275 if cp<=-0.0063965361332520825\n",
      "   +0.0406 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +2.6423 if pav>=0.018923847004771233\n",
      "   +1.3478 if cp<=0.03927613794803621 & cp>=0.0025158711243420907\n",
      "   +0.0000 if cv>=1.0074654817581177\n",
      "   +0.0000 if pa>=0.04578816518187523\n",
      "   +6.2027 if cp<=-0.010974494740366936 & pav>=-0.5162443518638611\n",
      "Run episode 64 with rewards 51.0\n",
      "============ 65 ===========\n",
      "32 actions [1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0]\n",
      "   -4.6161 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -1.2871 if cp>=-0.057790301740169525\n",
      "   -0.3838 if cp<=0.005921376449987295\n",
      "   +1.0266 if cp<=0.021001322194933895\n",
      "   -4.1491 if cp<=-0.00736388750374316\n",
      "   -1.2871 if cp>=-0.03789158836007118 & cv>=-0.5892714262008667\n",
      "   +0.7486 if pa>=-0.04247509688138962\n",
      "   +6.3296 if cp>=-0.014962592348456382 & cv>=-0.31691043376922606 & pav<=0.004587148874998222\n",
      "   +0.4854 if cp>=0.0028268722817301802 & pa>=-0.15071093142032624\n",
      "   +0.0000 if pa>=0.04578816518187523\n",
      "   +0.5995 if cv<=0.21199920773506165\n",
      "   +3.0035 if pa<=-0.0520213283598423\n",
      "--------------\n",
      "   -1.1466 if cv>=-0.5116368293762207\n",
      "   -1.1451 if cp>=-0.046753622591495514\n",
      "   -1.1451 if \n",
      "   -1.1451 if cp>=-0.12945516407489777\n",
      "   -1.1451 if cp>=-0.057790301740169525\n",
      "   +1.2487 if cp<=-0.0063965361332520825\n",
      "   +3.4068 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +2.8133 if pav>=0.018923847004771233\n",
      "   +3.3527 if cp<=0.03927613794803621 & cp>=0.0025158711243420907\n",
      "   +0.0000 if pa>=0.04578816518187523\n",
      "   +0.1212 if cp<=-0.010974494740366936 & pav>=-0.5162443518638611\n",
      "   +3.5952 if cv<=0.21164408326148987 & pav>=-0.5399397015571594\n",
      "Run episode 65 with rewards 32.0\n",
      "============ 66 ===========\n",
      "100 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1]\n",
      "   -4.5500 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.0246 if cp>=-0.057790301740169525\n",
      "   -1.2227 if cp<=0.005921376449987295\n",
      "   -0.0246 if cp<=0.021001322194933895\n",
      "   -5.6381 if cp<=-0.00736388750374316\n",
      "   -0.0246 if cp>=-0.03789158836007118 & cv>=-0.5892714262008667\n",
      "   +2.0448 if pa>=-0.04247509688138962\n",
      "   +5.6981 if cp>=-0.014962592348456382 & cv>=-0.31691043376922606 & pav<=0.004587148874998222\n",
      "   +1.0360 if cp>=0.0028268722817301802 & pa>=-0.15071093142032624\n",
      "   -0.2490 if cv<=0.21199920773506165\n",
      "   +6.4787 if pa<=-0.0520213283598423\n",
      "   -1.7718 if pa<=-0.07811971008777618\n",
      "--------------\n",
      "   -1.1400 if cv>=-0.5116368293762207\n",
      "   -1.1400 if cp>=-0.046753622591495514\n",
      "   -1.1400 if \n",
      "   -1.1400 if cp>=-0.12945516407489777\n",
      "   -1.1400 if cp>=-0.057790301740169525\n",
      "   +1.3999 if cp<=-0.0063965361332520825\n",
      "   +3.2908 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +2.8084 if pav>=0.018923847004771233\n",
      "   -0.6359 if cp<=0.03927613794803621 & cp>=0.0025158711243420907\n",
      "   +1.3541 if cp<=-0.010974494740366936 & pav>=-0.5162443518638611\n",
      "   +2.5586 if cv<=0.21164408326148987 & pav>=-0.5399397015571594\n",
      "   +3.3615 if cp>=0.0007647808524779981 & cv<=0.010018973611295223 & pa>=-0.05219616815447807\n",
      "Run episode 66 with rewards 100.0\n",
      "best\n",
      "============ 67 ===========\n",
      "36 actions [1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0]\n",
      "   -4.1678 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -1.6973 if cp<=0.005921376449987295\n",
      "   -3.7965 if cp<=0.021001322194933895\n",
      "   -4.5263 if cp<=-0.00736388750374316\n",
      "   -0.7530 if cp>=-0.03789158836007118 & cv>=-0.5892714262008667\n",
      "   +3.9604 if pa>=-0.04247509688138962\n",
      "   +7.2191 if cp>=-0.014962592348456382 & cv>=-0.31691043376922606 & pav<=0.004587148874998222\n",
      "   -0.1356 if cp>=0.0028268722817301802 & pa>=-0.15071093142032624\n",
      "   -0.8178 if cv<=0.21199920773506165\n",
      "  +10.7359 if pa<=-0.0520213283598423\n",
      "   -1.3670 if pa<=-0.07811971008777618\n",
      "   +2.0360 if cv<=-0.015671711415052414 & pa>=-0.06053330302238464\n",
      "--------------\n",
      "   -1.1632 if cv>=-0.5116368293762207\n",
      "   +0.2910 if cp>=-0.046753622591495514\n",
      "   -2.3374 if \n",
      "   -2.3374 if cp>=-0.12945516407489777\n",
      "   +0.8684 if cp>=-0.057790301740169525\n",
      "   -0.2436 if cp<=-0.0063965361332520825\n",
      "   +4.1288 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +2.2287 if pav>=0.018923847004771233\n",
      "   +2.5044 if cp<=-0.010974494740366936 & pav>=-0.5162443518638611\n",
      "   +0.4107 if cv<=0.21164408326148987 & pav>=-0.5399397015571594\n",
      "   +2.8638 if cp>=0.0007647808524779981 & cv<=0.010018973611295223 & pa>=-0.05219616815447807\n",
      "   +4.2846 if cp<=0.02107748314738274 & cv<=0.17556737661361693 & pa<=-0.020740539953112598 & pav<=-0.00137262009084223\n",
      "Run episode 67 with rewards 36.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 68 ===========\n",
      "26 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0]\n",
      "   -0.3312 if cv<=0.019291881844401358 & pa>=-0.06770601868629456 & pav>=-0.29077954292297364\n",
      "   -0.5714 if cp<=0.005921376449987295\n",
      "   -0.5714 if cp<=0.021001322194933895\n",
      "   -2.2120 if cp<=-0.00736388750374316\n",
      "   -0.5714 if cp>=-0.03789158836007118 & cv>=-0.5892714262008667\n",
      "   +1.1244 if pa>=-0.04247509688138962\n",
      "   +5.8481 if cp>=-0.014962592348456382 & cv>=-0.31691043376922606 & pav<=0.004587148874998222\n",
      "   -3.2355 if cv<=0.21199920773506165\n",
      "   +5.9835 if pa<=-0.0520213283598423\n",
      "   -1.6109 if pa<=-0.07811971008777618\n",
      "   -3.0027 if cv<=-0.015671711415052414 & pa>=-0.06053330302238464\n",
      "   -5.2835 if cp>=0.005538606084883213\n",
      "--------------\n",
      "   -2.8325 if cv>=-0.5116368293762207\n",
      "   -1.1931 if cp>=-0.046753622591495514\n",
      "   -1.1931 if \n",
      "   -1.1931 if cp>=-0.12945516407489777\n",
      "   -1.1931 if cp>=-0.057790301740169525\n",
      "   +5.0617 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +3.2597 if pav>=0.018923847004771233\n",
      "   +2.6704 if cp<=-0.010974494740366936 & pav>=-0.5162443518638611\n",
      "   +2.1184 if cv<=0.21164408326148987 & pav>=-0.5399397015571594\n",
      "   -0.0000 if cp>=0.0007647808524779981 & cv<=0.010018973611295223 & pa>=-0.05219616815447807\n",
      "   +6.3993 if cp<=0.02107748314738274 & cv<=0.17556737661361693 & pa<=-0.020740539953112598 & pav<=-0.00137262009084223\n",
      "   +4.3456 if cp>=0.005538606084883213\n",
      "Run episode 68 with rewards 26.0\n",
      "============ 69 ===========\n",
      "40 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0]\n",
      "   -0.8293 if cp<=0.005921376449987295\n",
      "   -0.8293 if cp<=0.021001322194933895\n",
      "   -2.8875 if cp<=-0.00736388750374316\n",
      "   -0.4876 if cp>=-0.03789158836007118 & cv>=-0.5892714262008667\n",
      "   -0.3047 if pa>=-0.04247509688138962\n",
      "   +2.7176 if cp>=-0.014962592348456382 & cv>=-0.31691043376922606 & pav<=0.004587148874998222\n",
      "   -1.3185 if cv<=0.21199920773506165\n",
      "   +4.7957 if pa<=-0.0520213283598423\n",
      "   +0.0126 if pa<=-0.07811971008777618\n",
      "   -0.0000 if cv<=-0.015671711415052414 & pa>=-0.06053330302238464\n",
      "   -0.0000 if cp>=0.005538606084883213\n",
      "   -3.3672 if pav>=0.6522895097732544\n",
      "--------------\n",
      "   -4.5741 if cv>=-0.5116368293762207\n",
      "   -0.0183 if cp>=-0.046753622591495514\n",
      "   -0.0183 if \n",
      "   -0.0183 if cp>=-0.12945516407489777\n",
      "   -0.0183 if cp>=-0.057790301740169525\n",
      "   +3.2640 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +3.0950 if pav>=0.018923847004771233\n",
      "   +4.1861 if cp<=-0.010974494740366936 & pav>=-0.5162443518638611\n",
      "   -1.8566 if cv<=0.21164408326148987 & pav>=-0.5399397015571594\n",
      "   +4.9510 if cp<=0.02107748314738274 & cv<=0.17556737661361693 & pa<=-0.020740539953112598 & pav<=-0.00137262009084223\n",
      "   +0.0000 if cp>=0.005538606084883213\n",
      "   +0.5591 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "Run episode 69 with rewards 40.0\n",
      "============ 70 ===========\n",
      "40 actions [1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1]\n",
      "   -1.4724 if cp<=0.005921376449987295\n",
      "   -0.8728 if cp<=0.021001322194933895\n",
      "   -6.5781 if cp<=-0.00736388750374316\n",
      "   +0.3891 if cp>=-0.03789158836007118 & cv>=-0.5892714262008667\n",
      "   -1.2521 if pa>=-0.04247509688138962\n",
      "   +2.6471 if cp>=-0.014962592348456382 & cv>=-0.31691043376922606 & pav<=0.004587148874998222\n",
      "   -0.9888 if cv<=0.21199920773506165\n",
      "   +4.6848 if pa<=-0.0520213283598423\n",
      "   +1.4560 if pa<=-0.07811971008777618\n",
      "   -1.6428 if cp>=0.005538606084883213\n",
      "   -3.4519 if pav>=0.6522895097732544\n",
      "   +2.8353 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "--------------\n",
      "   -6.5001 if cv>=-0.5116368293762207\n",
      "   +0.7591 if cp>=-0.046753622591495514\n",
      "   +0.7591 if \n",
      "   +0.7591 if cp>=-0.12945516407489777\n",
      "   +0.7591 if cp>=-0.057790301740169525\n",
      "   +4.2982 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +4.0433 if pav>=0.018923847004771233\n",
      "   +0.7651 if cp<=-0.010974494740366936 & pav>=-0.5162443518638611\n",
      "   -0.2407 if cv<=0.21164408326148987 & pav>=-0.5399397015571594\n",
      "   +5.2126 if cp<=0.02107748314738274 & cv<=0.17556737661361693 & pa<=-0.020740539953112598 & pav<=-0.00137262009084223\n",
      "   -1.0119 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   -3.1691 if cp>=-0.012034687772393221 & pa>=-0.06478999555110931\n",
      "Run episode 70 with rewards 40.0\n",
      "============ 71 ===========\n",
      "34 actions [1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0]\n",
      "   -0.6938 if cp<=0.005921376449987295\n",
      "   +2.3721 if cp<=0.021001322194933895\n",
      "   -3.6835 if cp<=-0.00736388750374316\n",
      "   -0.8352 if pa>=-0.04247509688138962\n",
      "   +1.7719 if cp>=-0.014962592348456382 & cv>=-0.31691043376922606 & pav<=0.004587148874998222\n",
      "   -6.4235 if cv<=0.21199920773506165\n",
      "   +6.8267 if pa<=-0.0520213283598423\n",
      "   -0.8160 if pa<=-0.07811971008777618\n",
      "   -1.1521 if cp>=0.005538606084883213\n",
      "   -0.0284 if pav>=0.6522895097732544\n",
      "   +1.2371 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +5.0523 if cp>=0.023265797272324563\n",
      "--------------\n",
      "   -4.9390 if cv>=-0.5116368293762207\n",
      "   +0.3227 if cp>=-0.046753622591495514\n",
      "   +0.3227 if \n",
      "   +0.3227 if cp>=-0.12945516407489777\n",
      "   +0.3227 if cp>=-0.057790301740169525\n",
      "   +2.4892 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.5770 if pav>=0.018923847004771233\n",
      "   -1.5159 if cp<=-0.010974494740366936 & pav>=-0.5162443518638611\n",
      "   +4.0795 if cp<=0.02107748314738274 & cv<=0.17556737661361693 & pa<=-0.020740539953112598 & pav<=-0.00137262009084223\n",
      "   +2.0173 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   -1.1150 if cp>=-0.012034687772393221 & pa>=-0.06478999555110931\n",
      "   -4.0438 if cp>=0.00699273506179452 & cv>=0.0333540216088295 & pa>=-0.04337278977036475\n",
      "Run episode 71 with rewards 34.0\n",
      "============ 72 ===========\n",
      "28 actions [1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 1]\n",
      "   -3.7981 if cp<=0.005921376449987295\n",
      "   -2.0324 if cp<=0.021001322194933895\n",
      "   +0.9201 if cp<=-0.00736388750374316\n",
      "   -1.1789 if pa>=-0.04247509688138962\n",
      "   +4.4179 if cp>=-0.014962592348456382 & cv>=-0.31691043376922606 & pav<=0.004587148874998222\n",
      "   -1.8825 if cv<=0.21199920773506165\n",
      "   +3.4863 if pa<=-0.0520213283598423\n",
      "   +1.3022 if pa<=-0.07811971008777618\n",
      "   +1.7657 if cp>=0.005538606084883213\n",
      "   +3.0457 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +0.0000 if cp>=0.023265797272324563\n",
      "   +3.8992 if cp>=-0.00258796624839305 & cv>=-0.011440593097358936 & pa<=-0.09719790220260618\n",
      "--------------\n",
      "   -5.7880 if cv>=-0.5116368293762207\n",
      "   +0.7943 if \n",
      "   +0.7943 if cp>=-0.12945516407489777\n",
      "   +0.7943 if cp>=-0.057790301740169525\n",
      "   +2.5448 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.6102 if pav>=0.018923847004771233\n",
      "   +0.3885 if cp<=-0.010974494740366936 & pav>=-0.5162443518638611\n",
      "   +4.2079 if cp<=0.02107748314738274 & cv<=0.17556737661361693 & pa<=-0.020740539953112598 & pav<=-0.00137262009084223\n",
      "   +0.6566 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +1.2490 if cp>=-0.012034687772393221 & pa>=-0.06478999555110931\n",
      "   -0.0000 if cp>=0.00699273506179452 & cv>=0.0333540216088295 & pa>=-0.04337278977036475\n",
      "   +1.1393 if cv<=0.19986332654953007\n",
      "Run episode 72 with rewards 28.0\n",
      "============ 73 ===========\n",
      "54 actions [1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0]\n",
      "   -2.9989 if cp<=0.005921376449987295\n",
      "   +0.5279 if cp<=0.021001322194933895\n",
      "   -0.6540 if cp<=-0.00736388750374316\n",
      "   -2.1081 if pa>=-0.04247509688138962\n",
      "   +0.0565 if cp>=-0.014962592348456382 & cv>=-0.31691043376922606 & pav<=0.004587148874998222\n",
      "   -0.4220 if cv<=0.21199920773506165\n",
      "   +2.6360 if pa<=-0.0520213283598423\n",
      "   +0.2208 if pa<=-0.07811971008777618\n",
      "   +3.5268 if cp>=0.005538606084883213\n",
      "   +2.9472 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   -1.1109 if cp>=-0.00258796624839305 & cv>=-0.011440593097358936 & pa<=-0.09719790220260618\n",
      "   -1.0249 if cv<=-0.4091957449913025\n",
      "--------------\n",
      "   -4.3655 if cv>=-0.5116368293762207\n",
      "   +0.4542 if \n",
      "   +0.4542 if cp>=-0.12945516407489777\n",
      "   +0.5065 if cp>=-0.057790301740169525\n",
      "   +1.0796 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.0804 if pav>=0.018923847004771233\n",
      "   +1.9062 if cp<=-0.010974494740366936 & pav>=-0.5162443518638611\n",
      "   +7.7097 if cp<=0.02107748314738274 & cv<=0.17556737661361693 & pa<=-0.020740539953112598 & pav<=-0.00137262009084223\n",
      "   +2.0866 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +0.0000 if cp>=-0.012034687772393221 & pa>=-0.06478999555110931\n",
      "   +0.3719 if cv<=0.19986332654953007\n",
      "   -3.3184 if cv<=0.15928918421268465\n",
      "Run episode 73 with rewards 54.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 74 ===========\n",
      "35 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0]\n",
      "   -6.8743 if cp<=0.005921376449987295\n",
      "   +1.4348 if cp<=0.021001322194933895\n",
      "   +0.4122 if cp<=-0.00736388750374316\n",
      "   -3.2435 if pa>=-0.04247509688138962\n",
      "   -3.7812 if cv<=0.21199920773506165\n",
      "   +0.1308 if pa<=-0.0520213283598423\n",
      "   -0.0000 if pa<=-0.07811971008777618\n",
      "   +3.9620 if cp>=0.005538606084883213\n",
      "   +5.0638 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   -0.0000 if cp>=-0.00258796624839305 & cv>=-0.011440593097358936 & pa<=-0.09719790220260618\n",
      "   -0.0506 if cv<=-0.4091957449913025\n",
      "   +4.5666 if cv<=0.5291530013084412\n",
      "--------------\n",
      "   -1.1294 if cv>=-0.5116368293762207\n",
      "   -0.4472 if \n",
      "   -0.4472 if cp>=-0.12945516407489777\n",
      "   -1.0256 if cp>=-0.057790301740169525\n",
      "   -1.1294 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.4843 if pav>=0.018923847004771233\n",
      "   +3.5458 if cp<=-0.010974494740366936 & pav>=-0.5162443518638611\n",
      "   +0.0000 if cp<=0.02107748314738274 & cv<=0.17556737661361693 & pa<=-0.020740539953112598 & pav<=-0.00137262009084223\n",
      "   +0.6357 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +2.4609 if cv<=0.19986332654953007\n",
      "   -1.6727 if cv<=0.15928918421268465\n",
      "   +5.5011 if cp<=0.01430786084383727 & cv>=0.5291530013084412 & pa<=0.053262326121330264\n",
      "Run episode 74 with rewards 35.0\n",
      "============ 75 ===========\n",
      "43 actions [1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0]\n",
      "   -0.9985 if cp<=0.005921376449987295\n",
      "   -0.2381 if cp<=0.021001322194933895\n",
      "   -0.9985 if cp<=-0.00736388750374316\n",
      "   -4.6049 if pa>=-0.04247509688138962\n",
      "   -3.0905 if cv<=0.21199920773506165\n",
      "   -1.2528 if pa<=-0.0520213283598423\n",
      "   +5.8893 if cp>=0.005538606084883213\n",
      "   +5.4646 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +1.8398 if cp>=-0.00258796624839305 & cv>=-0.011440593097358936 & pa<=-0.09719790220260618\n",
      "   +1.5783 if cv<=-0.4091957449913025\n",
      "   +0.5139 if cv<=0.5291530013084412\n",
      "   +3.7646 if cp<=-0.03723467960953712 & pav<=-0.7084547281265259\n",
      "--------------\n",
      "   -1.2481 if cv>=-0.5116368293762207\n",
      "   -1.5248 if \n",
      "   -1.5248 if cp>=-0.12945516407489777\n",
      "   +1.9970 if cp>=-0.057790301740169525\n",
      "   -1.9073 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.3716 if pav>=0.018923847004771233\n",
      "   +0.7939 if cp<=-0.010974494740366936 & pav>=-0.5162443518638611\n",
      "   -0.9105 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +2.2865 if cv<=0.19986332654953007\n",
      "   -0.2546 if cv<=0.15928918421268465\n",
      "   +1.2980 if cp<=0.01430786084383727 & cv>=0.5291530013084412 & pa<=0.053262326121330264\n",
      "   +2.4041 if pa>=-0.044184552133083345\n",
      "Run episode 75 with rewards 43.0\n",
      "============ 76 ===========\n",
      "20 actions [1, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0]\n",
      "   -0.6770 if cp<=0.005921376449987295\n",
      "   -4.2729 if cp<=-0.00736388750374316\n",
      "   -3.1964 if pa>=-0.04247509688138962\n",
      "   -7.5392 if cv<=0.21199920773506165\n",
      "   +0.9522 if pa<=-0.0520213283598423\n",
      "   +2.5817 if cp>=0.005538606084883213\n",
      "   +5.9414 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +2.3615 if cp>=-0.00258796624839305 & cv>=-0.011440593097358936 & pa<=-0.09719790220260618\n",
      "   -0.0706 if cv<=-0.4091957449913025\n",
      "   +1.9048 if cv<=0.5291530013084412\n",
      "   -0.0001 if cp<=-0.03723467960953712 & pav<=-0.7084547281265259\n",
      "   +4.8138 if cp>=0.006805960088968284\n",
      "--------------\n",
      "   -3.0028 if cv>=-0.5116368293762207\n",
      "   +0.0824 if \n",
      "   +0.0824 if cp>=-0.12945516407489777\n",
      "   +0.0825 if cp>=-0.057790301740169525\n",
      "   -0.3321 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.3034 if pav>=0.018923847004771233\n",
      "   +0.0265 if cp<=-0.010974494740366936 & pav>=-0.5162443518638611\n",
      "   +0.9098 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +3.1530 if cv<=0.19986332654953007\n",
      "   +0.0003 if cp<=0.01430786084383727 & cv>=0.5291530013084412 & pa<=0.053262326121330264\n",
      "   -0.9935 if pa>=-0.044184552133083345\n",
      "   -2.1747 if pa<=-0.039318481087684626\n",
      "Run episode 76 with rewards 20.0\n",
      "============ 77 ===========\n",
      "28 actions [1, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0]\n",
      "   -1.4773 if cp<=0.005921376449987295\n",
      "   -1.7087 if cp<=-0.00736388750374316\n",
      "   -2.4193 if pa>=-0.04247509688138962\n",
      "   -1.4266 if cv<=0.21199920773506165\n",
      "   +0.8786 if pa<=-0.0520213283598423\n",
      "   +2.1567 if cp>=0.005538606084883213\n",
      "   +2.6978 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +3.0510 if cp>=-0.00258796624839305 & cv>=-0.011440593097358936 & pa<=-0.09719790220260618\n",
      "   -0.4701 if cv<=-0.4091957449913025\n",
      "   -1.5408 if cv<=0.5291530013084412\n",
      "   +2.1567 if cp>=0.006805960088968284\n",
      "   -0.1142 if pa<=-0.10114003270864486\n",
      "--------------\n",
      "   -0.2333 if cv>=-0.5116368293762207\n",
      "   -0.2333 if \n",
      "   -0.2333 if cp>=-0.12945516407489777\n",
      "   -0.2333 if cp>=-0.057790301740169525\n",
      "   -0.9860 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.2189 if pav>=0.018923847004771233\n",
      "   +0.0114 if cp<=-0.010974494740366936 & pav>=-0.5162443518638611\n",
      "   +0.8529 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +0.8538 if cv<=0.19986332654953007\n",
      "   -0.9860 if pa>=-0.044184552133083345\n",
      "   -2.0570 if pa<=-0.039318481087684626\n",
      "   -2.8097 if cv>=0.5389953255653381\n",
      "Run episode 77 with rewards 28.0\n",
      "============ 78 ===========\n",
      "37 actions [0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1]\n",
      "   -0.9080 if cp<=0.005921376449987295\n",
      "   -2.5976 if cp<=-0.00736388750374316\n",
      "   -1.8443 if pa>=-0.04247509688138962\n",
      "   -2.4006 if cv<=0.21199920773506165\n",
      "   +0.4364 if pa<=-0.0520213283598423\n",
      "   +2.5481 if cp>=0.005538606084883213\n",
      "   +3.1145 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +5.3236 if cp>=-0.00258796624839305 & cv>=-0.011440593097358936 & pa<=-0.09719790220260618\n",
      "   -1.9827 if cv<=-0.4091957449913025\n",
      "   -0.5056 if cv<=0.5291530013084412\n",
      "   +4.5308 if cp>=0.006805960088968284\n",
      "   -1.9834 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "--------------\n",
      "   -3.1334 if cv>=-0.5116368293762207\n",
      "   -0.2580 if \n",
      "   -0.2580 if cp>=-0.12945516407489777\n",
      "   -0.2580 if cp>=-0.057790301740169525\n",
      "   -0.5732 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.8139 if pav>=0.018923847004771233\n",
      "   +2.5702 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +2.9877 if cv<=0.19986332654953007\n",
      "   +0.5554 if pa>=-0.044184552133083345\n",
      "   -0.8134 if pa<=-0.039318481087684626\n",
      "   -2.3624 if cv>=0.5389953255653381\n",
      "   -2.5227 if cp>=-0.006322119757533074\n",
      "Run episode 78 with rewards 37.0\n",
      "============ 79 ===========\n",
      "49 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -1.8110 if cp<=0.005921376449987295\n",
      "   -1.8077 if cp<=-0.00736388750374316\n",
      "   -1.1943 if pa>=-0.04247509688138962\n",
      "   -1.3117 if cv<=0.21199920773506165\n",
      "   +0.6167 if cp>=0.005538606084883213\n",
      "   +0.2285 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   -0.0001 if cp>=-0.00258796624839305 & cv>=-0.011440593097358936 & pa<=-0.09719790220260618\n",
      "   -0.5070 if cv<=-0.4091957449913025\n",
      "   -1.3492 if cv<=0.5291530013084412\n",
      "   +3.6830 if cp>=0.006805960088968284\n",
      "   -1.3492 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +2.8403 if cp>=0.015797895938158037\n",
      "--------------\n",
      "   -0.7236 if cv>=-0.5116368293762207\n",
      "   -0.6192 if cp>=-0.12945516407489777\n",
      "   -0.6192 if cp>=-0.057790301740169525\n",
      "   -0.7236 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +1.6807 if pav>=0.018923847004771233\n",
      "   +1.2938 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +1.2938 if cv<=0.19986332654953007\n",
      "   -0.6192 if pa>=-0.044184552133083345\n",
      "   +0.0000 if pa<=-0.039318481087684626\n",
      "   -0.3126 if cv>=0.5389953255653381\n",
      "   -1.3363 if cp>=-0.006322119757533074\n",
      "   +3.9169 if cp<=0.015797895938158037 & pav>=0.6212986826896668\n",
      "Run episode 79 with rewards 49.0\n",
      "============ 80 ===========\n",
      "27 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   -3.3166 if cp<=0.005921376449987295\n",
      "   -3.1429 if cp<=-0.00736388750374316\n",
      "   -5.2683 if pa>=-0.04247509688138962\n",
      "   -1.2768 if cv<=0.21199920773506165\n",
      "   +3.3868 if cp>=0.005538606084883213\n",
      "   +2.2282 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   -1.9465 if cv<=-0.4091957449913025\n",
      "   +0.2987 if cv<=0.5291530013084412\n",
      "   +3.3868 if cp>=0.006805960088968284\n",
      "   -1.1713 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +1.2095 if cp>=0.015797895938158037\n",
      "   +4.8703 if cp<=0.02599950209259991 & cp>=-0.006280170753598207 & cv>=-0.38428284525871276 & pa>=-0.04452063962817192\n",
      "--------------\n",
      "   -1.7518 if cv>=-0.5116368293762207\n",
      "   +1.8063 if cp>=-0.12945516407489777\n",
      "   +1.8063 if cp>=-0.057790301740169525\n",
      "   -2.7092 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.5874 if pav>=0.018923847004771233\n",
      "   +1.5216 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +1.5876 if cv<=0.19986332654953007\n",
      "   +3.3348 if pa>=-0.044184552133083345\n",
      "   +0.5196 if cv>=0.5389953255653381\n",
      "   -6.8996 if cp>=-0.006322119757533074\n",
      "   +2.1101 if cp<=0.015797895938158037 & pav>=0.6212986826896668\n",
      "   -2.6829 if pav<=0.4272501707077029\n",
      "Run episode 80 with rewards 27.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 81 ===========\n",
      "30 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -2.3470 if cp<=0.005921376449987295\n",
      "   -2.7454 if cp<=-0.00736388750374316\n",
      "   -0.8359 if pa>=-0.04247509688138962\n",
      "   +0.1020 if cv<=0.21199920773506165\n",
      "   +0.1926 if cp>=0.005538606084883213\n",
      "   +0.0026 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +0.1513 if cv<=-0.4091957449913025\n",
      "   +1.8372 if cp>=0.006805960088968284\n",
      "   +0.1908 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +1.8372 if cp>=0.015797895938158037\n",
      "   -0.0000 if cp<=0.02599950209259991 & cp>=-0.006280170753598207 & cv>=-0.38428284525871276 & pa>=-0.04452063962817192\n",
      "   -1.2777 if cp<=0.01249780692160131 & cp>=-0.0318358477205038 & pa<=-0.04384375959634781\n",
      "--------------\n",
      "   -0.6336 if cv>=-0.5116368293762207\n",
      "   +0.0096 if cp>=-0.12945516407489777\n",
      "   +0.0096 if cp>=-0.057790301740169525\n",
      "   -1.0444 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.5694 if pav>=0.018923847004771233\n",
      "   +0.5416 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +0.5473 if cv<=0.19986332654953007\n",
      "   +0.1220 if pa>=-0.044184552133083345\n",
      "   -1.8053 if cp>=-0.006322119757533074\n",
      "   +2.2501 if cp<=0.015797895938158037 & pav>=0.6212986826896668\n",
      "   -0.6336 if pav<=0.4272501707077029\n",
      "   -0.6537 if cv>=0.6281527519226074\n",
      "Run episode 81 with rewards 30.0\n",
      "============ 82 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   -3.3283 if cp<=0.005921376449987295\n",
      "   -1.8446 if cp<=-0.00736388750374316\n",
      "   -2.0617 if pa>=-0.04247509688138962\n",
      "   -0.5790 if cv<=0.21199920773506165\n",
      "   +0.7605 if cp>=0.005538606084883213\n",
      "   -0.7650 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   -0.7612 if cv<=-0.4091957449913025\n",
      "   +0.7605 if cp>=0.006805960088968284\n",
      "   -0.3061 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +3.7909 if cp>=0.015797895938158037\n",
      "   +0.1112 if cp<=0.01249780692160131 & cp>=-0.0318358477205038 & pa<=-0.04384375959634781\n",
      "   -1.1421 if cv>=0.41481969952583314\n",
      "--------------\n",
      "   -0.5397 if cv>=-0.5116368293762207\n",
      "   +0.3669 if cp>=-0.057790301740169525\n",
      "   -0.2720 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.5500 if pav>=0.018923847004771233\n",
      "   +0.2137 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +0.4528 if cv<=0.19986332654953007\n",
      "   +1.7849 if pa>=-0.044184552133083345\n",
      "   -1.7049 if cp>=-0.006322119757533074\n",
      "   +2.6403 if cp<=0.015797895938158037 & pav>=0.6212986826896668\n",
      "   -0.5397 if pav<=0.4272501707077029\n",
      "   +0.0277 if cv>=0.6281527519226074\n",
      "   +2.6170 if pav>=1.358390212059021\n",
      "Run episode 82 with rewards 11.0\n",
      "============ 83 ===========\n",
      "52 actions [0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -2.0863 if cp<=0.005921376449987295\n",
      "   -1.0769 if cp<=-0.00736388750374316\n",
      "   -0.5209 if pa>=-0.04247509688138962\n",
      "   -0.2571 if cv<=0.21199920773506165\n",
      "   +1.2131 if cp>=0.005538606084883213\n",
      "   -0.5384 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +0.0000 if cv<=-0.4091957449913025\n",
      "   +1.2131 if cp>=0.006805960088968284\n",
      "   +0.0122 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +0.6143 if cp>=0.015797895938158037\n",
      "   -0.4958 if cv>=0.41481969952583314\n",
      "   -0.4958 if cv>=0.5608624219894409\n",
      "--------------\n",
      "   -0.4220 if cv>=-0.5116368293762207\n",
      "   -0.4220 if cp>=-0.057790301740169525\n",
      "   +0.1572 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.0000 if pav>=0.018923847004771233\n",
      "   -0.0104 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +0.0560 if cv<=0.19986332654953007\n",
      "   +0.0911 if pa>=-0.044184552133083345\n",
      "   -0.9913 if cp>=-0.006322119757533074\n",
      "   -0.0000 if cp<=0.015797895938158037 & pav>=0.6212986826896668\n",
      "   -0.4220 if pav<=0.4272501707077029\n",
      "   -0.0000 if pav>=1.358390212059021\n",
      "   -0.8895 if cv>=0.9526481032371521\n",
      "Run episode 83 with rewards 52.0\n",
      "============ 84 ===========\n",
      "51 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -3.9506 if cp<=0.005921376449987295\n",
      "   -2.4426 if cp<=-0.00736388750374316\n",
      "   -1.1471 if pa>=-0.04247509688138962\n",
      "   +2.1015 if cv<=0.21199920773506165\n",
      "   +2.9881 if cp>=0.005538606084883213\n",
      "   -1.9871 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +1.4809 if cp>=0.006805960088968284\n",
      "   +4.9225 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +1.4800 if cp>=0.015797895938158037\n",
      "   +0.3787 if cv>=0.41481969952583314\n",
      "   +0.3264 if cv>=0.5608624219894409\n",
      "   -3.9359 if cp<=-0.010239078290760508 & cv<=-0.15709589719772304 & pav<=0.38936426043510497\n",
      "--------------\n",
      "   +0.1658 if cv>=-0.5116368293762207\n",
      "   -0.8886 if cp>=-0.057790301740169525\n",
      "   +0.4146 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.5468 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +0.0923 if cv<=0.19986332654953007\n",
      "   +1.5904 if pa>=-0.044184552133083345\n",
      "   -3.4599 if cp>=-0.006322119757533074\n",
      "   +0.8861 if cp<=0.015797895938158037 & pav>=0.6212986826896668\n",
      "   +0.0815 if pav<=0.4272501707077029\n",
      "   +0.3174 if pav>=1.358390212059021\n",
      "   -1.7709 if cv>=0.9526481032371521\n",
      "   -6.7704 if cp<=-0.010239078290760508 & cv<=0.339819622039795 & cv>=-0.15709589719772304 & pa<=0.0489315912127495\n",
      "Run episode 84 with rewards 51.0\n",
      "============ 85 ===========\n",
      "31 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -3.0021 if cp<=0.005921376449987295\n",
      "   -2.9405 if cp<=-0.00736388750374316\n",
      "   -0.9818 if pa>=-0.04247509688138962\n",
      "   +1.0168 if cv<=0.21199920773506165\n",
      "   +1.6495 if cp>=0.005538606084883213\n",
      "   -2.3097 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +1.6495 if cp>=0.006805960088968284\n",
      "   +1.4921 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +1.6316 if cp>=0.015797895938158037\n",
      "   -2.3604 if cv>=0.41481969952583314\n",
      "   -0.1022 if cp<=-0.010239078290760508 & cv<=-0.15709589719772304 & pav<=0.38936426043510497\n",
      "   +1.5876 if cp>=-0.0008000442758202436\n",
      "--------------\n",
      "   +0.4667 if cv>=-0.5116368293762207\n",
      "   +0.8611 if cp>=-0.057790301740169525\n",
      "   +0.5719 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.4054 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +0.5866 if cv<=0.19986332654953007\n",
      "   +1.0943 if pa>=-0.044184552133083345\n",
      "   -2.6129 if cp>=-0.006322119757533074\n",
      "   +0.4934 if cp<=0.015797895938158037 & pav>=0.6212986826896668\n",
      "   +1.1048 if pav>=1.358390212059021\n",
      "   +0.4730 if cv>=0.9526481032371521\n",
      "   +0.0000 if cp<=-0.010239078290760508 & cv<=0.339819622039795 & cv>=-0.15709589719772304 & pa<=0.0489315912127495\n",
      "   -2.6128 if cp>=-0.0008000442758202436\n",
      "Run episode 85 with rewards 31.0\n",
      "============ 86 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   -2.1896 if cp<=0.005921376449987295\n",
      "   -1.5228 if cp<=-0.00736388750374316\n",
      "   -0.6037 if pa>=-0.04247509688138962\n",
      "   +0.7554 if cv<=0.21199920773506165\n",
      "   +1.5859 if cp>=0.005538606084883213\n",
      "   -1.2514 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +1.5859 if cp>=0.006805960088968284\n",
      "   +1.8095 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +1.5548 if cp>=0.015797895938158037\n",
      "   -1.2728 if cv>=0.41481969952583314\n",
      "   +0.9191 if cp>=-0.0008000442758202436\n",
      "   +1.0994 if cp<=0.00142290152143687 & cv<=-0.5963911414146423\n",
      "--------------\n",
      "   +0.1421 if cv>=-0.5116368293762207\n",
      "   -0.4129 if cp>=-0.057790301740169525\n",
      "   +0.1421 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.5804 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +0.1840 if cv<=0.19986332654953007\n",
      "   -0.0239 if pa>=-0.044184552133083345\n",
      "   -1.6136 if cp>=-0.006322119757533074\n",
      "   -0.0682 if cp<=0.015797895938158037 & pav>=0.6212986826896668\n",
      "   +0.7797 if pav>=1.358390212059021\n",
      "   -0.1417 if cv>=0.9526481032371521\n",
      "   -1.6136 if cp>=-0.0008000442758202436\n",
      "   +0.2337 if cp<=0.00142290152143687\n",
      "Run episode 86 with rewards 10.0\n",
      "============ 87 ===========\n",
      "42 actions [1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -2.4485 if cp<=0.005921376449987295\n",
      "   -1.1990 if cp<=-0.00736388750374316\n",
      "   -0.3904 if cv<=0.21199920773506165\n",
      "   +0.5888 if cp>=0.005538606084883213\n",
      "   -0.8559 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +0.5888 if cp>=0.006805960088968284\n",
      "   +0.0043 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +0.3625 if cp>=0.015797895938158037\n",
      "   -0.8602 if cv>=0.41481969952583314\n",
      "   +0.5888 if cp>=-0.0008000442758202436\n",
      "   +0.0000 if cp<=0.00142290152143687 & cv<=-0.5963911414146423\n",
      "   +0.3663 if cv>=0.8077487111091614\n",
      "--------------\n",
      "   -0.0604 if cv>=-0.5116368293762207\n",
      "   -0.0604 if cp>=-0.057790301740169525\n",
      "   +0.4525 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.0007 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +0.2830 if cv<=0.19986332654953007\n",
      "   -0.5365 if cp>=-0.006322119757533074\n",
      "   +0.0000 if cp<=0.015797895938158037 & pav>=0.6212986826896668\n",
      "   +0.0000 if pav>=1.358390212059021\n",
      "   -0.4463 if cv>=0.9526481032371521\n",
      "   -0.6891 if cp>=-0.0008000442758202436\n",
      "   +0.6287 if cp<=0.00142290152143687\n",
      "   +0.4517 if cv<=0.4205584764480591\n",
      "Run episode 87 with rewards 42.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 88 ===========\n",
      "26 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   -1.3243 if cp<=0.005921376449987295\n",
      "   -0.6104 if cp<=-0.00736388750374316\n",
      "   +1.4849 if cv<=0.21199920773506165\n",
      "   +2.2844 if cp>=0.005538606084883213\n",
      "   -4.8151 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +2.2844 if cp>=0.006805960088968284\n",
      "   -2.4414 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +0.2795 if cp>=0.015797895938158037\n",
      "   +4.6665 if cv>=0.41481969952583314\n",
      "   +2.2844 if cp>=-0.0008000442758202436\n",
      "   -2.1970 if cv>=0.8077487111091614\n",
      "   -3.0690 if cp<=0.06545908823609355\n",
      "--------------\n",
      "   -0.6644 if cv>=-0.5116368293762207\n",
      "   +1.9495 if cp>=-0.057790301740169525\n",
      "   -2.7613 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -4.3962 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   -2.2221 if cv<=0.19986332654953007\n",
      "   +0.0891 if cp>=-0.006322119757533074\n",
      "   -0.7419 if pav>=1.358390212059021\n",
      "   +2.2732 if cv>=0.9526481032371521\n",
      "   -4.0342 if cp>=-0.0008000442758202436\n",
      "   +0.4002 if cp<=0.00142290152143687\n",
      "   +5.7958 if cv<=0.4205584764480591\n",
      "   -4.7435 if cv<=0.4960196733474741 & cv>=-0.0034226754214614612 & pa<=-0.10581586211919783\n",
      "Run episode 88 with rewards 26.0\n",
      "============ 89 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   -1.0212 if cp<=0.005921376449987295\n",
      "   -0.2773 if cp<=-0.00736388750374316\n",
      "   -1.6873 if cv<=0.21199920773506165\n",
      "   +1.2455 if cp>=0.005538606084883213\n",
      "   -3.9669 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +0.6927 if cp>=0.006805960088968284\n",
      "   +0.0744 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +1.6937 if cv>=0.41481969952583314\n",
      "   +1.8729 if cp>=-0.0008000442758202436\n",
      "   +0.0000 if cv>=0.8077487111091614\n",
      "   +0.2242 if cp<=0.06545908823609355\n",
      "   +0.2243 if \n",
      "--------------\n",
      "   -0.5896 if cv>=-0.5116368293762207\n",
      "   -1.9394 if cp>=-0.057790301740169525\n",
      "   -0.5896 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.6930 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +0.6832 if cv<=0.19986332654953007\n",
      "   -0.9196 if pav>=1.358390212059021\n",
      "   +0.0000 if cv>=0.9526481032371521\n",
      "   -2.8631 if cp>=-0.0008000442758202436\n",
      "   +0.9237 if cp<=0.00142290152143687\n",
      "   +2.3386 if cv<=0.4205584764480591\n",
      "   +0.0000 if cv<=0.4960196733474741 & cv>=-0.0034226754214614612 & pa<=-0.10581586211919783\n",
      "   -0.2302 if cp>=-0.010219207033514977\n",
      "Run episode 89 with rewards 9.0\n",
      "============ 90 ===========\n",
      "41 actions [0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -0.5536 if cp<=0.005921376449987295\n",
      "   -0.9866 if cp<=-0.00736388750374316\n",
      "   -0.1884 if cv<=0.21199920773506165\n",
      "   +0.3651 if cp>=0.005538606084883213\n",
      "   +0.0000 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +0.3651 if cp>=0.006805960088968284\n",
      "   -0.0200 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +0.0000 if cv>=0.41481969952583314\n",
      "   +0.7981 if cp>=-0.0008000442758202436\n",
      "   -0.1884 if cp<=0.06545908823609355\n",
      "   -0.1884 if \n",
      "   -0.8181 if pav>=1.5941218137741089\n",
      "--------------\n",
      "   -0.1450 if cv>=-0.5116368293762207\n",
      "   -0.1443 if cp>=-0.057790301740169525\n",
      "   -0.1450 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.5748 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   -0.1082 if cv<=0.19986332654953007\n",
      "   +0.4694 if pav>=1.358390212059021\n",
      "   -1.0442 if cp>=-0.0008000442758202436\n",
      "   +0.9360 if cp<=0.00142290152143687\n",
      "   -0.1082 if cv<=0.4205584764480591\n",
      "   -0.0000 if cv<=0.4960196733474741 & cv>=-0.0034226754214614612 & pa<=-0.10581586211919783\n",
      "   -1.0442 if cp>=-0.010219207033514977\n",
      "   -0.0150 if cp<=0.026359975337982178 & cv>=-0.4420544028282164\n",
      "Run episode 90 with rewards 41.0\n",
      "============ 91 ===========\n",
      "25 actions [1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   -2.1850 if cp<=0.005921376449987295\n",
      "   +3.0482 if cp<=-0.00736388750374316\n",
      "   -0.3296 if cv<=0.21199920773506165\n",
      "   +0.4245 if cp>=0.005538606084883213\n",
      "   +1.1734 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +0.4245 if cp>=0.006805960088968284\n",
      "   +4.4078 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +6.8661 if cp>=-0.0008000442758202436\n",
      "   -1.7604 if cp<=0.06545908823609355\n",
      "   -1.7604 if \n",
      "   +0.0000 if pav>=1.5941218137741089\n",
      "   -1.4725 if pa>=-0.1113012358546257\n",
      "--------------\n",
      "   -2.0163 if cv>=-0.5116368293762207\n",
      "   +0.0354 if cp>=-0.057790301740169525\n",
      "   -1.3689 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -6.1991 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +0.1477 if cv<=0.19986332654953007\n",
      "   +0.4845 if pav>=1.358390212059021\n",
      "   -3.7846 if cp>=-0.0008000442758202436\n",
      "   +3.8159 if cp<=0.00142290152143687\n",
      "   +2.7849 if cv<=0.4205584764480591\n",
      "   +1.3316 if cp>=-0.010219207033514977\n",
      "   -1.4307 if cp<=0.026359975337982178 & cv>=-0.4420544028282164\n",
      "   +3.5312 if cp<=-0.004414650611579399 & cv>=0.24100883305072787 & pa<=0.020645761862397194\n",
      "Run episode 91 with rewards 25.0\n",
      "============ 92 ===========\n",
      "28 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0]\n",
      "   -2.4591 if cp<=0.005921376449987295\n",
      "   +4.8613 if cp<=-0.00736388750374316\n",
      "   +1.4492 if cv<=0.21199920773506165\n",
      "   +0.4771 if cp>=0.005538606084883213\n",
      "   +0.3919 if cp>=-0.029031646996736528 & pav<=-0.4726494014263153\n",
      "   +0.4771 if cp>=0.006805960088968284\n",
      "   +4.0813 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +0.5143 if cp>=-0.0008000442758202436\n",
      "   -1.9933 if cp<=0.06545908823609355\n",
      "   -1.9820 if \n",
      "   -2.0339 if pa>=-0.1113012358546257\n",
      "   +3.1755 if cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "--------------\n",
      "   +0.3315 if cv>=-0.5116368293762207\n",
      "   +0.4785 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -2.9196 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   -0.4521 if cv<=0.19986332654953007\n",
      "   +0.0000 if pav>=1.358390212059021\n",
      "   -0.1682 if cp>=-0.0008000442758202436\n",
      "   +0.3264 if cp<=0.00142290152143687\n",
      "   -0.3106 if cv<=0.4205584764480591\n",
      "   -0.9227 if cp>=-0.010219207033514977\n",
      "   +0.4785 if cp<=0.026359975337982178 & cv>=-0.4420544028282164\n",
      "   +0.4603 if cp<=-0.004414650611579399 & cv>=0.24100883305072787 & pa<=0.020645761862397194\n",
      "   -3.0960 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "Run episode 92 with rewards 28.0\n",
      "============ 93 ===========\n",
      "37 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.2253 if cp<=0.005921376449987295\n",
      "   -0.2661 if cp<=-0.00736388750374316\n",
      "   +0.3823 if cv<=0.21199920773506165\n",
      "   +0.8247 if cp>=0.005538606084883213\n",
      "   +0.7327 if cp>=0.006805960088968284\n",
      "   +3.6074 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +0.8247 if cp>=-0.0008000442758202436\n",
      "   -2.6158 if cp<=0.06545908823609355\n",
      "   -0.4005 if \n",
      "   -0.7922 if pa>=-0.1113012358546257\n",
      "   +0.4657 if cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   +2.6201 if cv>=1.3324260473251344 & pa>=0.0028448623605072656\n",
      "--------------\n",
      "   +0.5886 if cv>=-0.5116368293762207\n",
      "   +1.7908 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -2.8723 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +0.4738 if cv<=0.19986332654953007\n",
      "   -0.7683 if cp>=-0.0008000442758202436\n",
      "   +2.8301 if cp<=0.00142290152143687\n",
      "   +0.5322 if cv<=0.4205584764480591\n",
      "   -1.7251 if cp>=-0.010219207033514977\n",
      "   -1.2644 if cp<=0.026359975337982178 & cv>=-0.4420544028282164\n",
      "   +0.0000 if cp<=-0.004414650611579399 & cv>=0.24100883305072787 & pa<=0.020645761862397194\n",
      "   +0.0000 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   -1.5145 if cp<=0.046974910050630606\n",
      "Run episode 93 with rewards 37.0\n",
      "============ 94 ===========\n",
      "32 actions [0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   -1.5843 if cp<=0.005921376449987295\n",
      "   -0.0137 if cv<=0.21199920773506165\n",
      "   +1.2281 if cp>=0.005538606084883213\n",
      "   +1.2281 if cp>=0.006805960088968284\n",
      "   +0.6760 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +1.8139 if cp>=-0.0008000442758202436\n",
      "   -0.6778 if cp<=0.06545908823609355\n",
      "   -0.3563 if \n",
      "   -0.6868 if pa>=-0.1113012358546257\n",
      "   +1.1435 if cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   -0.0000 if cv>=1.3324260473251344 & pa>=0.0028448623605072656\n",
      "   -0.5945 if pa>=-0.1415664494037628\n",
      "--------------\n",
      "   -0.8991 if cv>=-0.5116368293762207\n",
      "   +0.5395 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.4535 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +0.1453 if cv<=0.19986332654953007\n",
      "   -2.7454 if cp>=-0.0008000442758202436\n",
      "   +1.6895 if cp<=0.00142290152143687\n",
      "   +0.2063 if cv<=0.4205584764480591\n",
      "   -1.9709 if cp>=-0.010219207033514977\n",
      "   +0.5553 if cp<=0.026359975337982178 & cv>=-0.4420544028282164\n",
      "   -0.8397 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   -0.2179 if cp<=0.046974910050630606\n",
      "   -0.0518 if cp>=0.060936757922172555 & cv>=0.35164651870727537\n",
      "Run episode 94 with rewards 32.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 95 ===========\n",
      "23 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.1004 if cp<=0.005921376449987295\n",
      "   +0.0302 if cv<=0.21199920773506165\n",
      "   +0.2224 if cp>=0.005538606084883213\n",
      "   +0.2224 if cp>=0.006805960088968284\n",
      "   +0.5415 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +4.6078 if cp>=-0.0008000442758202436\n",
      "   -0.8780 if cp<=0.06545908823609355\n",
      "   -0.8780 if \n",
      "   -0.8782 if pa>=-0.1113012358546257\n",
      "   +0.2883 if cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   -0.8782 if pa>=-0.1415664494037628\n",
      "   -0.1805 if cp<=-0.015375298634171485 & cv>=0.2741463959217074 & pa>=-0.03439104482531547\n",
      "--------------\n",
      "   -0.2031 if cv>=-0.5116368293762207\n",
      "   -0.1690 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.7307 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   +0.0097 if cv<=0.19986332654953007\n",
      "   -5.2409 if cp>=-0.0008000442758202436\n",
      "   +1.1514 if cp<=0.00142290152143687\n",
      "   +0.2177 if cv<=0.4205584764480591\n",
      "   -1.2202 if cp>=-0.010219207033514977\n",
      "   -0.1466 if cp<=0.026359975337982178 & cv>=-0.4420544028282164\n",
      "   -0.4107 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   +0.6595 if cp<=0.046974910050630606\n",
      "   +0.6598 if \n",
      "Run episode 95 with rewards 23.0\n",
      "============ 96 ===========\n",
      "29 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -0.8794 if cp<=0.005921376449987295\n",
      "   +0.4486 if cp>=0.005538606084883213\n",
      "   +0.4486 if cp>=0.006805960088968284\n",
      "   -0.0382 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +0.9261 if cp>=-0.0008000442758202436\n",
      "   -0.4309 if cp<=0.06545908823609355\n",
      "   -0.4309 if \n",
      "   -0.3927 if pa>=-0.1113012358546257\n",
      "   +0.6900 if cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   -0.6501 if pa>=-0.1415664494037628\n",
      "   +0.0000 if cp<=-0.015375298634171485 & cv>=0.2741463959217074 & pa>=-0.03439104482531547\n",
      "   -1.3569 if cp<=-0.0013342186342924687\n",
      "--------------\n",
      "   -0.4074 if cv>=-0.5116368293762207\n",
      "   +0.2973 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.0471 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   -1.5886 if cp>=-0.0008000442758202436\n",
      "   +1.5481 if cp<=0.00142290152143687\n",
      "   +0.3608 if cv<=0.4205584764480591\n",
      "   -0.8016 if cp>=-0.010219207033514977\n",
      "   +0.1396 if cp<=0.026359975337982178 & cv>=-0.4420544028282164\n",
      "   -0.8644 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   -0.0405 if cp<=0.046974910050630606\n",
      "   -0.0405 if \n",
      "   -0.5568 if cv>=0.4822332143783572 & pav<=-1.0210192918777465\n",
      "Run episode 96 with rewards 29.0\n",
      "============ 97 ===========\n",
      "28 actions [0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0]\n",
      "   -0.9866 if cp<=0.005921376449987295\n",
      "   +0.4552 if cp>=0.005538606084883213\n",
      "   +0.4552 if cp>=0.006805960088968284\n",
      "   -0.0998 if cp>=-0.016432926431298255 & pav>=-0.5658186197280883\n",
      "   +2.8111 if cp>=-0.0008000442758202436\n",
      "   -0.5315 if cp<=0.06545908823609355\n",
      "   -0.5315 if \n",
      "   -0.5341 if pa>=-0.1113012358546257\n",
      "   +1.3612 if cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   -0.5312 if pa>=-0.1415664494037628\n",
      "   -1.3317 if cp<=-0.0013342186342924687\n",
      "   -6.0619 if cp>=0.02888802401721478 & cv<=-0.36624195575714114\n",
      "--------------\n",
      "   +4.5187 if cv>=-0.5116368293762207\n",
      "   -0.6616 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.1889 if cp>=-0.018017824739217755 & cv<=0.2471112161874771\n",
      "   -3.0206 if cp>=-0.0008000442758202436\n",
      "   +1.2624 if cp<=0.00142290152143687\n",
      "   +0.6572 if cv<=0.4205584764480591\n",
      "   -1.3673 if cp>=-0.010219207033514977\n",
      "   +0.7933 if cp<=0.026359975337982178 & cv>=-0.4420544028282164\n",
      "   -0.8988 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   +0.4463 if cp<=0.046974910050630606\n",
      "   -0.4335 if cv>=0.4822332143783572 & pav<=-1.0210192918777465\n",
      "   -5.2478 if cv>=-0.36624195575714114\n",
      "Run episode 97 with rewards 28.0\n",
      "============ 98 ===========\n",
      "46 actions [0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0]\n",
      "   -0.4483 if cp<=0.005921376449987295\n",
      "   +0.0728 if cp>=0.005538606084883213\n",
      "   +0.0728 if cp>=0.006805960088968284\n",
      "   +2.4040 if cp>=-0.0008000442758202436\n",
      "   -0.3755 if cp<=0.06545908823609355\n",
      "   -0.3755 if \n",
      "   -0.3755 if pa>=-0.1113012358546257\n",
      "   +0.3459 if cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   -0.3755 if pa>=-0.1415664494037628\n",
      "   -2.7795 if cp<=-0.0013342186342924687\n",
      "   -0.4953 if cp>=0.02888802401721478 & cv<=-0.36624195575714114\n",
      "   -3.0416 if cp>=0.004652777779847387 & cv<=-0.20420368313789367\n",
      "--------------\n",
      "   +1.4823 if cv>=-0.5116368293762207\n",
      "   +1.4823 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -3.0970 if cp>=-0.0008000442758202436\n",
      "   -1.2315 if cp<=0.00142290152143687\n",
      "   +0.2886 if cv<=0.4205584764480591\n",
      "   +0.5363 if cp>=-0.010219207033514977\n",
      "   +1.6866 if cp<=0.026359975337982178 & cv>=-0.4420544028282164\n",
      "   -0.3857 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   +1.5209 if cp<=0.046974910050630606\n",
      "   +0.0000 if cv>=0.4822332143783572 & pav<=-1.0210192918777465\n",
      "   -5.3425 if cv>=-0.36624195575714114\n",
      "   -0.9396 if pa<=0.05584583953022957\n",
      "Run episode 98 with rewards 46.0\n",
      "============ 99 ===========\n",
      "33 actions [0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1]\n",
      "   -0.7931 if cp<=0.005921376449987295\n",
      "   -0.8714 if cp>=0.006805960088968284\n",
      "   +2.5309 if cp>=-0.0008000442758202436\n",
      "   -1.1770 if cp<=0.06545908823609355\n",
      "   -1.1770 if \n",
      "   +0.7320 if pa>=-0.1113012358546257\n",
      "   +0.3654 if cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   -1.6321 if pa>=-0.1415664494037628\n",
      "   -3.7079 if cp<=-0.0013342186342924687\n",
      "   -0.7282 if cp>=0.02888802401721478 & cv<=-0.36624195575714114\n",
      "   -1.0167 if cp>=0.004652777779847387 & cv<=-0.20420368313789367\n",
      "   +4.7736 if pav<=0.24514786899089813\n",
      "--------------\n",
      "   -1.1195 if cv>=-0.5116368293762207\n",
      "   +2.5913 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -3.2762 if cp>=-0.0008000442758202436\n",
      "   +1.9753 if cp<=0.00142290152143687\n",
      "   +0.6532 if cv<=0.4205584764480591\n",
      "   +5.9950 if cp>=-0.010219207033514977\n",
      "   +0.0116 if cp<=0.026359975337982178 & cv>=-0.4420544028282164\n",
      "   -0.2543 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   -1.1191 if cp<=0.046974910050630606\n",
      "   -8.4890 if cv>=-0.36624195575714114\n",
      "   -1.1191 if pa<=0.05584583953022957\n",
      "   +6.5549 if cp<=-0.012825311161577702\n",
      "Run episode 99 with rewards 33.0\n",
      "============ 100 ===========\n",
      "29 actions [0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1]\n",
      "   -1.5306 if cp<=0.005921376449987295\n",
      "   +0.4096 if cp>=0.006805960088968284\n",
      "   +2.2540 if cp>=-0.0008000442758202436\n",
      "   -0.6914 if cp<=0.06545908823609355\n",
      "   -0.6914 if \n",
      "   -0.6914 if pa>=-0.1113012358546257\n",
      "   -0.6914 if pa>=-0.1415664494037628\n",
      "   -2.9454 if cp<=-0.0013342186342924687\n",
      "   +0.0000 if cp>=0.02888802401721478 & cv<=-0.36624195575714114\n",
      "   -1.2841 if cp>=0.004652777779847387 & cv<=-0.20420368313789367\n",
      "   -0.1018 if pav<=0.24514786899089813\n",
      "   +3.5068 if cp<=0.009017197974026211 & cv<=0.1987526923418045 & cv>=0.0026460231281817057 & pa<=0.10626617670059205\n",
      "--------------\n",
      "   -0.6439 if cv>=-0.5116368293762207\n",
      "   -0.6439 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -2.1058 if cp>=-0.0008000442758202436\n",
      "   +4.1217 if cp<=0.00142290152143687\n",
      "   -0.6153 if cv<=0.4205584764480591\n",
      "   +3.2773 if cp>=-0.010219207033514977\n",
      "   -0.0521 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   -0.6439 if cp<=0.046974910050630606\n",
      "   -4.3065 if cv>=-0.36624195575714114\n",
      "   +0.7119 if pa<=0.05584583953022957\n",
      "   -0.0000 if cp<=-0.012825311161577702\n",
      "   +2.9742 if cp>=0.0020913713611662404 & cv<=-0.21635273694992066\n",
      "Run episode 100 with rewards 29.0\n",
      "============ 101 ===========\n",
      "39 actions [0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.6372 if cp<=0.005921376449987295\n",
      "   +1.5635 if cp>=0.006805960088968284\n",
      "   +1.0401 if cp>=-0.0008000442758202436\n",
      "   -1.0737 if cp<=0.06545908823609355\n",
      "   -1.0737 if \n",
      "   -1.0737 if pa>=-0.1113012358546257\n",
      "   -1.0737 if pa>=-0.1415664494037628\n",
      "   -2.1138 if cp<=-0.0013342186342924687\n",
      "   -1.0434 if cp>=0.004652777779847387 & cv<=-0.20420368313789367\n",
      "   +2.7075 if pav<=0.24514786899089813\n",
      "   -0.0647 if cp<=0.009017197974026211 & cv<=0.1987526923418045 & cv>=0.0026460231281817057 & pa<=0.10626617670059205\n",
      "   +1.5123 if cp>=0.013521378301084042\n",
      "--------------\n",
      "   +0.6012 if cv>=-0.5116368293762207\n",
      "   +0.6012 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.8593 if cp>=-0.0008000442758202436\n",
      "   +2.4604 if cp<=0.00142290152143687\n",
      "   +1.3214 if cv<=0.4205584764480591\n",
      "   +0.5777 if cp>=-0.010219207033514977\n",
      "   -2.5812 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   +0.6012 if cp<=0.046974910050630606\n",
      "   -4.1034 if cv>=-0.36624195575714114\n",
      "   -1.5946 if pa<=0.05584583953022957\n",
      "   +1.9450 if cp>=0.0020913713611662404 & cv<=-0.21635273694992066\n",
      "   -2.4790 if cp>=0.029025012627244006 & pa>=0.10984141528606417\n",
      "Run episode 101 with rewards 39.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 102 ===========\n",
      "35 actions [1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   -3.2878 if cp<=0.005921376449987295\n",
      "   +1.9850 if cp>=0.006805960088968284\n",
      "   +3.4714 if cp>=-0.0008000442758202436\n",
      "   -1.0465 if cp<=0.06545908823609355\n",
      "   -1.0465 if \n",
      "   -2.6928 if pa>=-0.1113012358546257\n",
      "   -2.7033 if pa>=-0.1415664494037628\n",
      "   -0.8095 if cp<=-0.0013342186342924687\n",
      "   -2.0259 if cp>=0.004652777779847387 & cv<=-0.20420368313789367\n",
      "   +1.2249 if pav<=0.24514786899089813\n",
      "   +2.1701 if cp>=0.013521378301084042\n",
      "   +4.3910 if cp<=0.02437907457351685 & cv>=-0.19414334297180175 & pa>=-0.0698458194732666\n",
      "--------------\n",
      "   +2.9256 if cv>=-0.5116368293762207\n",
      "   +0.9445 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -4.0176 if cp>=-0.0008000442758202436\n",
      "   +0.1621 if cp<=0.00142290152143687\n",
      "   +0.4326 if cv<=0.4205584764480591\n",
      "   -4.9950 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   +0.3993 if cp<=0.046974910050630606\n",
      "   -1.6175 if cv>=-0.36624195575714114\n",
      "   +0.3993 if pa<=0.05584583953022957\n",
      "   +1.9951 if cp>=0.0020913713611662404 & cv<=-0.21635273694992066\n",
      "   +0.0000 if cp>=0.029025012627244006 & pa>=0.10984141528606417\n",
      "   -3.6965 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "Run episode 102 with rewards 35.0\n",
      "============ 103 ===========\n",
      "27 actions [1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0]\n",
      "   -0.0638 if cp<=0.005921376449987295\n",
      "   +0.9184 if cp>=0.006805960088968284\n",
      "   +1.9960 if cp>=-0.0008000442758202436\n",
      "   -3.3363 if cp<=0.06545908823609355\n",
      "   +0.8546 if \n",
      "   -3.5419 if pa>=-0.1113012358546257\n",
      "   +0.3558 if pa>=-0.1415664494037628\n",
      "   -2.9959 if cp>=0.004652777779847387 & cv<=-0.20420368313789367\n",
      "   -0.0878 if pav<=0.24514786899089813\n",
      "   +1.0066 if cp>=0.013521378301084042\n",
      "   +2.3839 if cp<=0.02437907457351685 & cv>=-0.19414334297180175 & pa>=-0.0698458194732666\n",
      "   -0.4869 if cv<=0.6087097883224487 & cv>=-0.13812730610370635 & pa<=-0.05074187293648713 & pav<=-0.18669375479221337\n",
      "--------------\n",
      "   -0.5596 if cv>=-0.5116368293762207\n",
      "   +2.0142 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -2.8823 if cp>=-0.0008000442758202436\n",
      "   +0.6989 if cp<=0.00142290152143687\n",
      "   -0.1084 if cv<=0.4205584764480591\n",
      "   -2.4434 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   +2.4199 if cp<=0.046974910050630606\n",
      "   -0.5596 if cv>=-0.36624195575714114\n",
      "   -2.5090 if pa<=0.05584583953022957\n",
      "   +4.6419 if cp>=0.0020913713611662404 & cv<=-0.21635273694992066\n",
      "   -1.2585 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "   +2.1158 if pav>=1.1385263204574585\n",
      "Run episode 103 with rewards 27.0\n",
      "============ 104 ===========\n",
      "40 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1]\n",
      "   +0.0970 if cp>=0.006805960088968284\n",
      "   +0.0970 if cp>=-0.0008000442758202436\n",
      "   -2.2506 if cp<=0.06545908823609355\n",
      "   +0.0970 if \n",
      "   +0.0970 if pa>=-0.1113012358546257\n",
      "   +0.0970 if pa>=-0.1415664494037628\n",
      "   -3.1503 if cp>=0.004652777779847387 & cv<=-0.20420368313789367\n",
      "   -1.5885 if pav<=0.24514786899089813\n",
      "   +0.0970 if cp>=0.013521378301084042\n",
      "   -0.0000 if cp<=0.02437907457351685 & cv>=-0.19414334297180175 & pa>=-0.0698458194732666\n",
      "   -0.0000 if cv<=0.6087097883224487 & cv>=-0.13812730610370635 & pa<=-0.05074187293648713 & pav<=-0.18669375479221337\n",
      "   +2.4414 if cv>=0.2345998078584671\n",
      "--------------\n",
      "   -0.6287 if cv>=-0.5116368293762207\n",
      "   -0.6287 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.6287 if cp>=-0.0008000442758202436\n",
      "   +0.0000 if cp<=0.00142290152143687\n",
      "   +0.0000 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   +4.1595 if cp<=0.046974910050630606\n",
      "   -0.6287 if cv>=-0.36624195575714114\n",
      "   -1.6340 if pa<=0.05584583953022957\n",
      "   +4.7690 if cp>=0.0020913713611662404 & cv<=-0.21635273694992066\n",
      "   +0.0000 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "   +0.0000 if pav>=1.1385263204574585\n",
      "   -4.6306 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "Run episode 104 with rewards 40.0\n",
      "============ 105 ===========\n",
      "50 actions [1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0]\n",
      "   +3.8163 if cp>=0.006805960088968284\n",
      "   -1.1966 if cp>=-0.0008000442758202436\n",
      "   -1.6713 if cp<=0.06545908823609355\n",
      "   -1.6712 if \n",
      "   -0.8867 if pa>=-0.1113012358546257\n",
      "   -1.4589 if pa>=-0.1415664494037628\n",
      "   -2.3887 if cp>=0.004652777779847387 & cv<=-0.20420368313789367\n",
      "   -1.6713 if pav<=0.24514786899089813\n",
      "   -0.3932 if cp>=0.013521378301084042\n",
      "   +1.5696 if cp<=0.02437907457351685 & cv>=-0.19414334297180175 & pa>=-0.0698458194732666\n",
      "   -0.0000 if cv>=0.2345998078584671\n",
      "   +2.6392 if pav<=-0.17386061251163476\n",
      "--------------\n",
      "   +0.2348 if cv>=-0.5116368293762207\n",
      "   +2.1722 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.3073 if cp>=-0.0008000442758202436\n",
      "   +2.6319 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   +0.2348 if cp<=0.046974910050630606\n",
      "   -1.9229 if cv>=-0.36624195575714114\n",
      "   +0.2348 if pa<=0.05584583953022957\n",
      "   +0.0143 if cp>=0.0020913713611662404 & cv<=-0.21635273694992066\n",
      "   +2.2180 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "   +0.0000 if pav>=1.1385263204574585\n",
      "   -7.8352 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "   +3.7024 if cp<=0.03003971502184868 & cv<=-0.017293096706271167 & pa<=-0.029247607663273792\n",
      "Run episode 105 with rewards 50.0\n",
      "============ 106 ===========\n",
      "27 actions [1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1]\n",
      "   +2.6386 if cp>=0.006805960088968284\n",
      "   -2.0971 if cp>=-0.0008000442758202436\n",
      "   -2.0021 if cp<=0.06545908823609355\n",
      "   -2.0021 if \n",
      "   -1.4641 if pa>=-0.1113012358546257\n",
      "   -3.8328 if pa>=-0.1415664494037628\n",
      "   +0.8369 if cp>=0.004652777779847387 & cv<=-0.20420368313789367\n",
      "   -2.0021 if pav<=0.24514786899089813\n",
      "   +4.2240 if cp>=0.013521378301084042\n",
      "   -0.3704 if cp<=0.02437907457351685 & cv>=-0.19414334297180175 & pa>=-0.0698458194732666\n",
      "   +5.4444 if pav<=-0.17386061251163476\n",
      "   -5.2403 if cp<=0.020965076982975013 & cv<=-0.024234870076179492 & cv<=-0.03616342917084694 & pav>=-0.28452752232551576\n",
      "--------------\n",
      "   +0.0109 if cv>=-0.5116368293762207\n",
      "   +3.3764 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.2595 if cp>=-0.0008000442758202436\n",
      "   +7.1957 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   -1.9482 if cp<=0.046974910050630606\n",
      "   -2.3067 if cv>=-0.36624195575714114\n",
      "   +0.1667 if pa<=0.05584583953022957\n",
      "   +1.2428 if cp>=0.0020913713611662404 & cv<=-0.21635273694992066\n",
      "   +1.5026 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "   -6.4658 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "   +5.8245 if cp<=0.03003971502184868 & cv<=-0.017293096706271167 & pa<=-0.029247607663273792\n",
      "   -4.0656 if cv>=0.5486418604850769\n",
      "Run episode 106 with rewards 27.0\n",
      "============ 107 ===========\n",
      "60 actions [0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   -0.0000 if cp>=0.006805960088968284\n",
      "   -0.0000 if cp>=-0.0008000442758202436\n",
      "   -0.8348 if cp<=0.06545908823609355\n",
      "   -0.8348 if \n",
      "   -3.1351 if pa>=-0.1113012358546257\n",
      "   -1.6010 if pa>=-0.1415664494037628\n",
      "   -0.0000 if cp>=0.004652777779847387 & cv<=-0.20420368313789367\n",
      "   -0.8348 if pav<=0.24514786899089813\n",
      "   -0.0000 if cp>=0.013521378301084042\n",
      "   +0.2558 if pav<=-0.17386061251163476\n",
      "   -4.0626 if cp<=0.020965076982975013 & cv<=-0.024234870076179492 & cv<=-0.03616342917084694 & pav>=-0.28452752232551576\n",
      "   +2.9899 if pa>=-0.031737010926008224\n",
      "--------------\n",
      "   +2.4346 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.0000 if cp>=-0.0008000442758202436\n",
      "   +0.0000 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   -2.3418 if cp<=0.046974910050630606\n",
      "   -2.3829 if cv>=-0.36624195575714114\n",
      "   -2.3418 if pa<=0.05584583953022957\n",
      "   +0.0000 if cp>=0.0020913713611662404 & cv<=-0.21635273694992066\n",
      "   +0.0000 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "   -2.3420 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "   +3.5341 if cp<=0.03003971502184868 & cv<=-0.017293096706271167 & pa<=-0.029247607663273792\n",
      "   +0.0000 if cv>=0.5486418604850769\n",
      "   +0.6140 if cp>=-0.043199308961629865\n",
      "Run episode 107 with rewards 60.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 108 ===========\n",
      "39 actions [1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -0.2287 if cp>=0.006805960088968284\n",
      "   -2.6445 if cp>=-0.0008000442758202436\n",
      "   +2.7930 if cp<=0.06545908823609355\n",
      "   -2.6444 if \n",
      "   -3.2405 if pa>=-0.1113012358546257\n",
      "   -2.6666 if pa>=-0.1415664494037628\n",
      "   +1.7351 if pav<=0.24514786899089813\n",
      "   -3.0301 if cp>=0.013521378301084042\n",
      "   +2.3971 if pav<=-0.17386061251163476\n",
      "   -6.0463 if cp<=0.020965076982975013 & cv<=-0.024234870076179492 & cv<=-0.03616342917084694 & pav>=-0.28452752232551576\n",
      "   +4.3592 if pa>=-0.031737010926008224\n",
      "   +2.8309 if pa<=0.013001559115946295\n",
      "--------------\n",
      "   +0.8051 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.6124 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   -5.7652 if cp<=0.046974910050630606\n",
      "   -3.0289 if cv>=-0.36624195575714114\n",
      "   +1.3279 if pa<=0.05584583953022957\n",
      "   +2.3599 if cp>=0.0020913713611662404 & cv<=-0.21635273694992066\n",
      "   +3.0822 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "   -6.5103 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "   +0.0000 if cp<=0.03003971502184868 & cv<=-0.017293096706271167 & pa<=-0.029247607663273792\n",
      "   -0.1820 if cv>=0.5486418604850769\n",
      "   +1.3279 if cp>=-0.043199308961629865\n",
      "   +3.6490 if pa>=0.013001559115946295\n",
      "Run episode 108 with rewards 39.0\n",
      "============ 109 ===========\n",
      "19 actions [1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -1.7643 if cp>=-0.0008000442758202436\n",
      "   -1.3888 if cp<=0.06545908823609355\n",
      "   -1.7643 if \n",
      "   -0.3736 if pa>=-0.1113012358546257\n",
      "   -0.6535 if pa>=-0.1415664494037628\n",
      "   -1.7643 if pav<=0.24514786899089813\n",
      "   -1.7643 if cp>=0.013521378301084042\n",
      "   +2.1376 if pav<=-0.17386061251163476\n",
      "   +0.0000 if cp<=0.020965076982975013 & cv<=-0.024234870076179492 & cv<=-0.03616342917084694 & pav>=-0.28452752232551576\n",
      "   +2.1751 if pa>=-0.031737010926008224\n",
      "   -0.3754 if pa<=0.013001559115946295\n",
      "   +3.3090 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "--------------\n",
      "   -1.2200 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.0000 if cp<=0.02022861540317543 & cp>=-0.004644392151385544 & cv>=-0.013342144712805749\n",
      "   -2.5801 if cp<=0.046974910050630606\n",
      "   +0.1795 if cv>=-0.36624195575714114\n",
      "   +0.1795 if pa<=0.05584583953022957\n",
      "   -0.0000 if cp>=0.0020913713611662404 & cv<=-0.21635273694992066\n",
      "   +1.4018 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "   -5.7469 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "   +1.4018 if cv>=0.5486418604850769\n",
      "   +0.1795 if cp>=-0.043199308961629865\n",
      "   +2.4751 if pa>=0.013001559115946295\n",
      "   +5.5407 if cp>=0.13406274616718292\n",
      "Run episode 109 with rewards 19.0\n",
      "============ 110 ===========\n",
      "22 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0]\n",
      "   -1.0571 if cp>=-0.0008000442758202436\n",
      "   -2.0379 if cp<=0.06545908823609355\n",
      "   -1.0571 if \n",
      "   -1.4529 if pa>=-0.1113012358546257\n",
      "   -2.0379 if pa>=-0.1415664494037628\n",
      "   -1.0571 if pav<=0.24514786899089813\n",
      "   -1.0571 if cp>=0.013521378301084042\n",
      "   +0.7295 if pav<=-0.17386061251163476\n",
      "   +1.4492 if pa>=-0.031737010926008224\n",
      "   -1.0571 if pa<=0.013001559115946295\n",
      "   +2.2953 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "   +2.6916 if cp>=0.02707395702600479\n",
      "--------------\n",
      "   -3.7957 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.1362 if cp<=0.046974910050630606\n",
      "   +0.0740 if cv>=-0.36624195575714114\n",
      "   +0.0740 if pa<=0.05584583953022957\n",
      "   +1.1480 if cp>=0.0020913713611662404 & cv<=-0.21635273694992066\n",
      "   -0.3832 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "   -1.8678 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "   +2.8656 if cv>=0.5486418604850769\n",
      "   +0.0740 if cp>=-0.043199308961629865\n",
      "   +0.0000 if pa>=0.013001559115946295\n",
      "   +0.0000 if cp>=0.13406274616718292\n",
      "   -3.8807 if cp>=0.02840052954852581\n",
      "Run episode 110 with rewards 22.0\n",
      "============ 111 ===========\n",
      "21 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.4530 if cp>=-0.0008000442758202436\n",
      "   -1.8302 if cp<=0.06545908823609355\n",
      "   -1.8714 if \n",
      "   -1.4609 if pa>=-0.1113012358546257\n",
      "   -2.4663 if pa>=-0.1415664494037628\n",
      "   -1.8714 if pav<=0.24514786899089813\n",
      "   -0.4243 if cp>=0.013521378301084042\n",
      "   +4.1077 if pa>=-0.031737010926008224\n",
      "   -1.8714 if pa<=0.013001559115946295\n",
      "   +5.1489 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "   -0.4105 if cp>=0.02707395702600479\n",
      "   +1.5420 if cp>=-0.023856081068515778 & cv>=0.17508700788021087\n",
      "--------------\n",
      "   -2.7598 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.3594 if cp<=0.046974910050630606\n",
      "   -0.1635 if cv>=-0.36624195575714114\n",
      "   -0.1635 if pa<=0.05584583953022957\n",
      "   +0.0000 if cp>=0.0020913713611662404 & cv<=-0.21635273694992066\n",
      "   +1.3675 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "   -4.3177 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "   -1.5163 if cv>=0.5486418604850769\n",
      "   -0.1635 if cp>=-0.043199308961629865\n",
      "   +0.0000 if cp>=0.13406274616718292\n",
      "   +0.8567 if cp>=0.02840052954852581\n",
      "   +1.3015 if cv>=0.1731320708990097\n",
      "Run episode 111 with rewards 21.0\n",
      "============ 112 ===========\n",
      "31 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0]\n",
      "   -1.4526 if cp>=-0.0008000442758202436\n",
      "   -0.7254 if cp<=0.06545908823609355\n",
      "   -1.4526 if \n",
      "   -1.2421 if pa>=-0.1113012358546257\n",
      "   -1.4042 if pa>=-0.1415664494037628\n",
      "   -1.4526 if pav<=0.24514786899089813\n",
      "   -1.4526 if cp>=0.013521378301084042\n",
      "   +3.2033 if pa>=-0.031737010926008224\n",
      "   -1.4526 if pa<=0.013001559115946295\n",
      "   +1.0401 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "   +2.3407 if cp>=-0.023856081068515778 & cv>=0.17508700788021087\n",
      "   +4.5836 if cp<=0.031221849843859673 & cv>=-0.02113974839448929\n",
      "--------------\n",
      "   -0.7861 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.0055 if cp<=0.046974910050630606\n",
      "   -0.4810 if cv>=-0.36624195575714114\n",
      "   -0.4810 if pa<=0.05584583953022957\n",
      "   +0.0000 if cp>=0.0020913713611662404 & cv<=-0.21635273694992066\n",
      "   +0.9704 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "   -1.7210 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "   +0.3841 if cv>=0.5486418604850769\n",
      "   -0.4810 if cp>=-0.043199308961629865\n",
      "   +3.6720 if cp>=0.02840052954852581\n",
      "   -1.7210 if cv>=0.1731320708990097\n",
      "   -2.8384 if cp<=0.031221849843859673 & cp>=0.031221849843859673\n",
      "Run episode 112 with rewards 31.0\n",
      "============ 113 ===========\n",
      "154 actions [1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1]\n",
      "   -0.1396 if cp>=-0.0008000442758202436\n",
      "   -0.5813 if \n",
      "   -0.5813 if pa>=-0.1113012358546257\n",
      "   -0.5813 if pa>=-0.1415664494037628\n",
      "   +2.6694 if pav<=0.24514786899089813\n",
      "   -5.6690 if cp>=0.013521378301084042\n",
      "   -0.5813 if pa>=-0.031737010926008224\n",
      "   +0.8965 if pa<=0.013001559115946295\n",
      "   +2.6695 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "   +1.9856 if cp>=-0.023856081068515778 & cv>=0.17508700788021087\n",
      "   +2.6694 if cp<=0.031221849843859673 & cv>=-0.02113974839448929\n",
      "   -5.9977 if cp<=0.014768391847610479 & cv>=0.034477151930332184 & pa<=0.0010241540148854256\n",
      "--------------\n",
      "   -3.0277 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.2694 if cp<=0.046974910050630606\n",
      "   -1.3009 if cv>=-0.36624195575714114\n",
      "   -2.9242 if pa<=0.05584583953022957\n",
      "   -0.0000 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "   -1.7375 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "   -0.0000 if cv>=0.5486418604850769\n",
      "   +2.7745 if cp>=-0.043199308961629865\n",
      "   -0.0000 if cp>=0.02840052954852581\n",
      "   -1.7375 if cv>=0.1731320708990097\n",
      "   -0.0000 if cp<=0.031221849843859673 & cp>=0.031221849843859673\n",
      "   +4.6440 if cp<=0.014768391847610479 & pa<=0.0010241540148854256\n",
      "Run episode 113 with rewards 154.0\n",
      "best\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 114 ===========\n",
      "137 actions [0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -1.7292 if \n",
      "   -1.7292 if pa>=-0.1113012358546257\n",
      "   -1.7292 if pa>=-0.1415664494037628\n",
      "   +3.3652 if pav<=0.24514786899089813\n",
      "   -1.7283 if cp>=0.013521378301084042\n",
      "   -1.9209 if pa>=-0.031737010926008224\n",
      "   +2.1600 if pa<=0.013001559115946295\n",
      "   +3.6574 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "   +2.0803 if cp>=-0.023856081068515778 & cv>=0.17508700788021087\n",
      "   +0.0005 if cp<=0.031221849843859673 & cv>=-0.02113974839448929\n",
      "   +0.0011 if cp<=0.014768391847610479 & cv>=0.034477151930332184 & pa<=0.0010241540148854256\n",
      "   -3.6580 if pa>=0.11002523452043533\n",
      "--------------\n",
      "   -0.6033 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.4853 if cp<=0.046974910050630606\n",
      "   -0.6033 if cv>=-0.36624195575714114\n",
      "   -2.8557 if pa<=0.05584583953022957\n",
      "   -3.2223 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "   -1.1871 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "   -0.6033 if cp>=-0.043199308961629865\n",
      "   -0.6033 if cp>=0.02840052954852581\n",
      "   -0.8848 if cv>=0.1731320708990097\n",
      "   -0.0000 if cp<=0.031221849843859673 & cp>=0.031221849843859673\n",
      "   -0.0001 if cp<=0.014768391847610479 & pa<=0.0010241540148854256\n",
      "   +5.4931 if cp<=0.06365713030099869 & cv<=0.15943694710731507 & pa<=0.054199893772602085 & pa>=0.028904534131288528 & pav<=0.3249213457107545\n",
      "Run episode 114 with rewards 137.0\n",
      "============ 115 ===========\n",
      "128 actions [1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.2742 if \n",
      "   -0.2742 if pa>=-0.1113012358546257\n",
      "   -0.2742 if pa>=-0.1415664494037628\n",
      "   +3.1958 if pav<=0.24514786899089813\n",
      "   -6.6785 if cp>=0.013521378301084042\n",
      "   -6.2445 if pa>=-0.031737010926008224\n",
      "   +6.6537 if pa<=0.013001559115946295\n",
      "   +6.8431 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "   +6.9585 if cp>=-0.023856081068515778 & cv>=0.17508700788021087\n",
      "   +0.0004 if cp<=0.014768391847610479 & cv>=0.034477151930332184 & pa<=0.0010241540148854256\n",
      "   -7.9605 if pa>=0.11002523452043533\n",
      "   +1.2517 if pa<=0.10190294831991195 & pav<=-0.2970845580101013\n",
      "--------------\n",
      "   -2.7330 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.5214 if cp<=0.046974910050630606\n",
      "   +1.9827 if cv>=-0.36624195575714114\n",
      "   -2.9322 if pa<=0.05584583953022957\n",
      "   -2.2981 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "   -0.4844 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "   -0.2580 if cp>=-0.043199308961629865\n",
      "   -1.6934 if cp>=0.02840052954852581\n",
      "   -0.1290 if cv>=0.1731320708990097\n",
      "   -2.1984 if cp<=0.014768391847610479 & pa<=0.0010241540148854256\n",
      "   +0.0033 if cp<=0.06365713030099869 & cv<=0.15943694710731507 & pa<=0.054199893772602085 & pa>=0.028904534131288528 & pav<=0.3249213457107545\n",
      "   -3.4388 if cp<=0.6955190300941468 & cp>=-0.02656570859253403 & cv>=0.708544147014618 & pav<=-0.2970845580101013\n",
      "Run episode 115 with rewards 128.0\n",
      "============ 116 ===========\n",
      "142 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1]\n",
      "   -2.1238 if \n",
      "   -2.1238 if pa>=-0.1113012358546257\n",
      "   -2.1238 if pa>=-0.1415664494037628\n",
      "   +3.7426 if pav<=0.24514786899089813\n",
      "   -6.5623 if cp>=0.013521378301084042\n",
      "   -2.1246 if pa>=-0.031737010926008224\n",
      "   -0.0009 if pa<=0.013001559115946295\n",
      "   +6.6720 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "   +7.7470 if cp>=-0.023856081068515778 & cv>=0.17508700788021087\n",
      "   -8.5794 if pa>=0.11002523452043533\n",
      "   +1.8893 if pa<=0.10190294831991195 & pav<=-0.2970845580101013\n",
      "   -0.9512 if pa>=0.07562298923730851 & pav<=-0.02331792078912255\n",
      "--------------\n",
      "   -0.9436 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +2.4184 if cp<=0.046974910050630606\n",
      "   -0.9436 if cv>=-0.36624195575714114\n",
      "   -3.1384 if pa<=0.05584583953022957\n",
      "   +0.0000 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "   -0.7815 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "   -0.9436 if cp>=-0.043199308961629865\n",
      "   +1.0185 if cp>=0.02840052954852581\n",
      "   -0.5677 if cv>=0.1731320708990097\n",
      "   +0.0000 if cp<=0.014768391847610479 & pa<=0.0010241540148854256\n",
      "   -3.0299 if cp<=0.6955190300941468 & cp>=-0.02656570859253403 & cv>=0.708544147014618 & pav<=-0.2970845580101013\n",
      "   -0.9558 if cv<=0.9026257634162903\n",
      "Run episode 116 with rewards 142.0\n",
      "============ 117 ===========\n",
      "31 actions [0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0]\n",
      "   -1.9779 if \n",
      "   -1.9779 if pa>=-0.1113012358546257\n",
      "   -1.9779 if pa>=-0.1415664494037628\n",
      "   +4.5337 if pav<=0.24514786899089813\n",
      "   +1.4515 if cp>=0.013521378301084042\n",
      "   -1.9777 if pa>=-0.031737010926008224\n",
      "   +7.4403 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "   -1.2040 if cp>=-0.023856081068515778 & cv>=0.17508700788021087\n",
      "   -8.2685 if pa>=0.11002523452043533\n",
      "   +3.6791 if pa<=0.10190294831991195 & pav<=-0.2970845580101013\n",
      "   -3.7564 if pa>=0.07562298923730851 & pav<=-0.02331792078912255\n",
      "  +10.2259 if pa>=0.12361104041337967\n",
      "--------------\n",
      "   -1.9574 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +4.3290 if cp<=0.046974910050630606\n",
      "   -1.9574 if cv>=-0.36624195575714114\n",
      "   -3.5482 if pa<=0.05584583953022957\n",
      "   +0.0000 if cp>=0.002580943983048201 & cv>=-0.3794747233390808 & pa<=-0.02767487913370132\n",
      "   -2.5201 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "   -1.9574 if cp>=-0.043199308961629865\n",
      "   +0.0569 if cp>=0.02840052954852581\n",
      "   +3.3259 if cv>=0.1731320708990097\n",
      "   -4.3638 if cp<=0.6955190300941468 & cp>=-0.02656570859253403 & cv>=0.708544147014618 & pav<=-0.2970845580101013\n",
      "   -0.7060 if cv<=0.9026257634162903\n",
      "   -4.7344 if pa>=0.12361104041337967\n",
      "Run episode 117 with rewards 31.0\n",
      "============ 118 ===========\n",
      "27 actions [0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1]\n",
      "   -1.6528 if \n",
      "   -1.6528 if pa>=-0.1113012358546257\n",
      "   -1.6528 if pa>=-0.1415664494037628\n",
      "   +4.1663 if pav<=0.24514786899089813\n",
      "   -2.3827 if cp>=0.013521378301084042\n",
      "   -1.6528 if pa>=-0.031737010926008224\n",
      "   +2.9495 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "   +0.1610 if pa>=0.11002523452043533\n",
      "   +0.0000 if pa<=0.10190294831991195 & pav<=-0.2970845580101013\n",
      "   +0.0000 if pa>=0.07562298923730851 & pav<=-0.02331792078912255\n",
      "   -0.9701 if pa>=0.12361104041337967\n",
      "   +3.5623 if pav<=0.07440806925296783\n",
      "--------------\n",
      "   -0.3913 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.3913 if cp<=0.046974910050630606\n",
      "   -2.0291 if cv>=-0.36624195575714114\n",
      "   -2.5999 if pa<=0.05584583953022957\n",
      "   +0.0000 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "   -0.3913 if cp>=-0.043199308961629865\n",
      "   +0.0000 if cp>=0.02840052954852581\n",
      "   +0.0000 if cv>=0.1731320708990097\n",
      "   +0.0000 if cp<=0.6955190300941468 & cp>=-0.02656570859253403 & cv>=0.708544147014618 & pav<=-0.2970845580101013\n",
      "   -0.3913 if cv<=0.9026257634162903\n",
      "   -1.6418 if pa>=0.12361104041337967\n",
      "   -3.0242 if pav<=0.07440806925296783\n",
      "Run episode 118 with rewards 27.0\n",
      "============ 119 ===========\n",
      "30 actions [0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1]\n",
      "   -1.7532 if \n",
      "   -1.7532 if pa>=-0.1113012358546257\n",
      "   -1.7532 if pa>=-0.1415664494037628\n",
      "   +4.2834 if pav<=0.24514786899089813\n",
      "   +0.0000 if cp>=0.013521378301084042\n",
      "   -1.7532 if pa>=-0.031737010926008224\n",
      "   +2.6437 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "   -0.5556 if pa>=0.11002523452043533\n",
      "   +0.0740 if pa>=0.07562298923730851 & pav<=-0.02331792078912255\n",
      "   -0.2346 if pa>=0.12361104041337967\n",
      "   +0.4419 if pav<=0.07440806925296783\n",
      "   +1.1058 if cp>=-0.052640303224325176 & cv<=-0.18536521494388578\n",
      "--------------\n",
      "   -0.5934 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.5934 if cp<=0.046974910050630606\n",
      "   -1.1140 if cv>=-0.36624195575714114\n",
      "   -3.5461 if pa<=0.05584583953022957\n",
      "   +0.0000 if pa<=0.06253425180912017 & pav<=-0.050671379268169385\n",
      "   +0.0000 if cp>=-0.043199308961629865\n",
      "   -0.0020 if cv>=0.1731320708990097\n",
      "   +0.0000 if cp<=0.6955190300941468 & cp>=-0.02656570859253403 & cv>=0.708544147014618 & pav<=-0.2970845580101013\n",
      "   -0.5934 if cv<=0.9026257634162903\n",
      "   -0.3657 if pa>=0.12361104041337967\n",
      "   -0.1704 if pav<=0.07440806925296783\n",
      "   -2.4012 if cp>=-0.06257951632142067 & pa>=0.15101547241210939\n",
      "Run episode 119 with rewards 30.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 120 ===========\n",
      "22 actions [0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0]\n",
      "   -1.6749 if \n",
      "   -1.6749 if pa>=-0.1113012358546257\n",
      "   -1.6749 if pa>=-0.1415664494037628\n",
      "   +4.2257 if pav<=0.24514786899089813\n",
      "   -1.6749 if pa>=-0.031737010926008224\n",
      "   +3.2855 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "   +0.8404 if pa>=0.11002523452043533\n",
      "   +0.7593 if pa>=0.07562298923730851 & pav<=-0.02331792078912255\n",
      "   -1.4577 if pa>=0.12361104041337967\n",
      "   -2.4738 if pav<=0.07440806925296783\n",
      "   +0.0748 if cp>=-0.052640303224325176 & cv<=-0.18536521494388578\n",
      "   +2.9512 if pav<=0.06422646939754487\n",
      "--------------\n",
      "   -0.4069 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.4069 if cp<=0.046974910050630606\n",
      "   -1.4118 if cv>=-0.36624195575714114\n",
      "   -4.7463 if pa<=0.05584583953022957\n",
      "   -0.4069 if cp>=-0.043199308961629865\n",
      "   -2.5337 if cv>=0.1731320708990097\n",
      "   +0.0000 if cp<=0.6955190300941468 & cp>=-0.02656570859253403 & cv>=0.708544147014618 & pav<=-0.2970845580101013\n",
      "   -0.4069 if cv<=0.9026257634162903\n",
      "   -0.9189 if pa>=0.12361104041337967\n",
      "   +1.7840 if pav<=0.07440806925296783\n",
      "   -5.5488 if cp>=-0.06257951632142067 & pa>=0.15101547241210939\n",
      "   +3.9304 if cp>=0.006674146093428137 & pav>=0.21495876908302308\n",
      "Run episode 120 with rewards 22.0\n",
      "============ 121 ===========\n",
      "20 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -1.4548 if \n",
      "   -1.4548 if pa>=-0.1113012358546257\n",
      "   -1.4548 if pa>=-0.1415664494037628\n",
      "   +3.8889 if pav<=0.24514786899089813\n",
      "   -1.4548 if pa>=-0.031737010926008224\n",
      "   +3.9212 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "   -1.6766 if pa>=0.11002523452043533\n",
      "   +0.0000 if pa>=0.07562298923730851 & pav<=-0.02331792078912255\n",
      "   -3.0082 if pa>=0.12361104041337967\n",
      "   +0.8821 if pav<=0.07440806925296783\n",
      "   +0.8821 if pav<=0.06422646939754487\n",
      "   +1.6273 if cp>=-0.008956185542047024\n",
      "--------------\n",
      "   -1.0677 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.6000 if cp<=0.046974910050630606\n",
      "   -1.0677 if cv>=-0.36624195575714114\n",
      "   -5.6469 if pa<=0.05584583953022957\n",
      "   -0.6770 if cp>=-0.043199308961629865\n",
      "   -1.1481 if cv>=0.1731320708990097\n",
      "   -0.6000 if cv<=0.9026257634162903\n",
      "   -0.7169 if pa>=0.12361104041337967\n",
      "   -0.1731 if pav<=0.07440806925296783\n",
      "   -1.4502 if cp>=-0.06257951632142067 & pa>=0.15101547241210939\n",
      "   +0.0000 if cp>=0.006674146093428137 & pav>=0.21495876908302308\n",
      "   +1.0168 if pa>=0.08121557831764221\n",
      "Run episode 121 with rewards 20.0\n",
      "============ 122 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   -0.9276 if \n",
      "   -0.9276 if pa>=-0.1113012358546257\n",
      "   -0.9276 if pa>=-0.1415664494037628\n",
      "   +1.5398 if pav<=0.24514786899089813\n",
      "   -0.9276 if pa>=-0.031737010926008224\n",
      "   +0.4066 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "   -1.6113 if pa>=0.11002523452043533\n",
      "   -1.6113 if pa>=0.12361104041337967\n",
      "   +2.2418 if pav<=0.07440806925296783\n",
      "   +2.2418 if pav<=0.06422646939754487\n",
      "   +0.0000 if cp>=-0.008956185542047024\n",
      "   +1.1125 if pa>=0.1873852103948593 & pav>=0.12721259295940401\n",
      "--------------\n",
      "   -0.9163 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.5386 if cp<=0.046974910050630606\n",
      "   +0.0043 if cv>=-0.36624195575714114\n",
      "   -5.8366 if pa<=0.05584583953022957\n",
      "   +0.0000 if cp>=-0.043199308961629865\n",
      "   -1.8186 if cv>=0.1731320708990097\n",
      "   -1.5386 if cv<=0.9026257634162903\n",
      "   +0.9975 if pa>=0.12361104041337967\n",
      "   -2.1209 if pav<=0.07440806925296783\n",
      "   +0.0000 if cp>=-0.06257951632142067 & pa>=0.15101547241210939\n",
      "   +1.5653 if pa>=0.08121557831764221\n",
      "   -0.0800 if cp<=-0.06698787063360213 & cp>=-0.1326202094554901\n",
      "Run episode 122 with rewards 11.0\n",
      "============ 123 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0]\n",
      "   -0.4101 if \n",
      "   -0.4101 if pa>=-0.1113012358546257\n",
      "   -0.4101 if pa>=-0.1415664494037628\n",
      "   +0.0011 if pav<=0.24514786899089813\n",
      "   -0.4101 if pa>=-0.031737010926008224\n",
      "   +0.0011 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "   -1.6690 if pa>=0.11002523452043533\n",
      "   -0.3849 if pa>=0.12361104041337967\n",
      "   +0.0011 if pav<=0.07440806925296783\n",
      "   +0.0011 if pav<=0.06422646939754487\n",
      "   -0.0116 if pa>=0.1873852103948593 & pav>=0.12721259295940401\n",
      "   -1.6307 if pav>=1.7874646186828613\n",
      "--------------\n",
      "   -0.6755 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -2.2787 if cp<=0.046974910050630606\n",
      "   -0.6782 if cv>=-0.36624195575714114\n",
      "   -2.1813 if pa<=0.05584583953022957\n",
      "   -0.0000 if cv>=0.1731320708990097\n",
      "   -2.2787 if cv<=0.9026257634162903\n",
      "   +0.0549 if pa>=0.12361104041337967\n",
      "   -0.0007 if pav<=0.07440806925296783\n",
      "   -0.0000 if cp>=-0.06257951632142067 & pa>=0.15101547241210939\n",
      "   +2.7402 if pa>=0.08121557831764221\n",
      "   +0.3626 if cp<=-0.06698787063360213 & cp>=-0.1326202094554901\n",
      "   -0.5933 if cv<=-0.7526628375053406\n",
      "Run episode 123 with rewards 11.0\n",
      "============ 124 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   -0.6004 if \n",
      "   -0.6004 if pa>=-0.1113012358546257\n",
      "   -0.6004 if pa>=-0.1415664494037628\n",
      "   +0.0907 if pav<=0.24514786899089813\n",
      "   -0.6004 if pa>=-0.031737010926008224\n",
      "   -0.0000 if cp<=0.08820451200008393 & cv>=0.025386495515704155\n",
      "   -1.1576 if pa>=0.11002523452043533\n",
      "   -1.1576 if pa>=0.12361104041337967\n",
      "   +0.0907 if pav<=0.06422646939754487\n",
      "   +0.0041 if pa>=0.1873852103948593 & pav>=0.12721259295940401\n",
      "   -1.1017 if pav>=1.7874646186828613\n",
      "   -1.1017 if pav>=1.8022464513778687\n",
      "--------------\n",
      "   -0.8246 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.6032 if cp<=0.046974910050630606\n",
      "   -0.4706 if cv>=-0.36624195575714114\n",
      "   -1.8903 if pa<=0.05584583953022957\n",
      "   +0.0000 if cv>=0.1731320708990097\n",
      "   -1.6032 if cv<=0.9026257634162903\n",
      "   +0.6847 if pa>=0.12361104041337967\n",
      "   -0.2215 if pav<=0.07440806925296783\n",
      "   +2.1591 if pa>=0.08121557831764221\n",
      "   +0.2793 if cp<=-0.06698787063360213 & cp>=-0.1326202094554901\n",
      "   -0.1796 if cv<=-0.7526628375053406\n",
      "   -0.1796 if cv<=-0.8291042447090149\n",
      "Run episode 124 with rewards 11.0\n",
      "============ 125 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   -0.2415 if \n",
      "   -0.2415 if pa>=-0.1113012358546257\n",
      "   -0.2415 if pa>=-0.1415664494037628\n",
      "   +0.0765 if pav<=0.24514786899089813\n",
      "   -0.5587 if pa>=-0.031737010926008224\n",
      "   -0.5834 if pa>=0.11002523452043533\n",
      "   -0.1739 if pa>=0.12361104041337967\n",
      "   +0.0765 if pav<=0.06422646939754487\n",
      "   +0.0000 if pa>=0.1873852103948593 & pav>=0.12721259295940401\n",
      "   -1.5830 if pav>=1.7874646186828613\n",
      "   -1.1735 if pav>=1.8022464513778687\n",
      "   -1.1735 if pav>=2.0584452152252197\n",
      "--------------\n",
      "   -0.6085 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.4971 if cp<=0.046974910050630606\n",
      "   -0.3576 if cv>=-0.36624195575714114\n",
      "   -2.8138 if pa<=0.05584583953022957\n",
      "   -1.4971 if cv<=0.9026257634162903\n",
      "   +0.0268 if pa>=0.12361104041337967\n",
      "   -0.1582 if pav<=0.07440806925296783\n",
      "   +0.2984 if pa>=0.08121557831764221\n",
      "   +0.2984 if cp<=-0.06698787063360213 & cp>=-0.1326202094554901\n",
      "   -0.1824 if cv<=-0.7526628375053406\n",
      "   +0.3861 if cv<=-0.8291042447090149\n",
      "   +0.2984 if cp<=-0.08656515926122665\n",
      "Run episode 125 with rewards 10.0\n",
      "============ 126 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.0745 if \n",
      "   +1.0745 if pa>=-0.1113012358546257\n",
      "   +1.0745 if pa>=-0.1415664494037628\n",
      "   +0.0429 if pav<=0.24514786899089813\n",
      "   +1.2577 if pa>=-0.031737010926008224\n",
      "   +1.3092 if pa>=0.11002523452043533\n",
      "   +1.0728 if pa>=0.12361104041337967\n",
      "   +0.0429 if pav<=0.06422646939754487\n",
      "   +1.8852 if pav>=1.7874646186828613\n",
      "   +1.6488 if pav>=1.8022464513778687\n",
      "   +1.6500 if pav>=2.0584452152252197\n",
      "   +0.9925 if cp>=0.04377755522727966\n",
      "--------------\n",
      "   -0.3443 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -2.8087 if cp<=0.046974910050630606\n",
      "   -0.2183 if cv>=-0.36624195575714114\n",
      "   -0.5059 if pa<=0.05584583953022957\n",
      "   -2.8087 if cv<=0.9026257634162903\n",
      "   -0.1017 if pav<=0.07440806925296783\n",
      "   -2.3018 if pa>=0.08121557831764221\n",
      "   -2.5352 if cp<=-0.06698787063360213 & cp>=-0.1326202094554901\n",
      "   -2.3156 if cv<=-0.7526628375053406\n",
      "   -2.3037 if cv<=-0.8291042447090149\n",
      "   -2.5352 if cp<=-0.08656515926122665\n",
      "   -2.5352 if pa>=0.18822601437568665\n",
      "Run episode 126 with rewards 10.0\n",
      "============ 127 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 1, 0]\n",
      "   +0.1097 if \n",
      "   +0.1097 if pa>=-0.1113012358546257\n",
      "   +0.1097 if pa>=-0.1415664494037628\n",
      "   +0.0435 if pa>=-0.031737010926008224\n",
      "   -0.0000 if pa>=0.11002523452043533\n",
      "   -0.0000 if pa>=0.12361104041337967\n",
      "   +0.0227 if pav<=0.06422646939754487\n",
      "   +0.0000 if pav>=1.7874646186828613\n",
      "   +0.0000 if pav>=1.8022464513778687\n",
      "   +0.0000 if pav>=2.0584452152252197\n",
      "   +0.0000 if cp>=0.04377755522727966\n",
      "   +0.0227 if cv>=0.048942700028419495\n",
      "--------------\n",
      "   -0.3647 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.4583 if cp<=0.046974910050630606\n",
      "   -0.3271 if cv>=-0.36624195575714114\n",
      "   -0.4582 if pa<=0.05584583953022957\n",
      "   -0.4583 if cv<=0.9026257634162903\n",
      "   -0.0001 if pa>=0.08121557831764221\n",
      "   -0.0001 if cp<=-0.06698787063360213 & cp>=-0.1326202094554901\n",
      "   -0.0501 if cv<=-0.7526628375053406\n",
      "   -0.0501 if cv<=-0.8291042447090149\n",
      "   +0.0000 if cp<=-0.08656515926122665\n",
      "   -0.0000 if pa>=0.18822601437568665\n",
      "   -0.2141 if cp>=0.005134062003344298\n",
      "Run episode 127 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 128 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 1, 0]\n",
      "   +0.5218 if \n",
      "   +0.5218 if pa>=-0.1113012358546257\n",
      "   +0.5218 if pa>=-0.1415664494037628\n",
      "   +0.5218 if pa>=-0.031737010926008224\n",
      "   -1.8292 if pa>=0.11002523452043533\n",
      "   -1.8292 if pa>=0.12361104041337967\n",
      "   +0.2552 if pav<=0.06422646939754487\n",
      "   -0.6239 if pav>=1.7874646186828613\n",
      "   -0.6239 if pav>=1.8022464513778687\n",
      "   +0.0000 if pav>=2.0584452152252197\n",
      "   +0.0000 if cv>=0.048942700028419495\n",
      "   -1.2053 if cp<=-0.04840499237179756\n",
      "--------------\n",
      "   -0.5534 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.0256 if cp<=0.046974910050630606\n",
      "   -0.3532 if cv>=-0.36624195575714114\n",
      "   -0.5534 if pa<=0.05584583953022957\n",
      "   -1.0256 if cv<=0.9026257634162903\n",
      "   +0.9984 if pa>=0.08121557831764221\n",
      "   +0.6220 if cp<=-0.06698787063360213 & cp>=-0.1326202094554901\n",
      "   +0.0080 if cv<=-0.7526628375053406\n",
      "   +0.0080 if cv<=-0.8291042447090149\n",
      "   -0.0000 if cp<=-0.08656515926122665\n",
      "   -1.0336 if cp>=0.005134062003344298\n",
      "   +0.9984 if cp<=-0.014795880392193792\n",
      "Run episode 128 with rewards 9.0\n",
      "============ 129 ===========\n",
      "35 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +0.2457 if \n",
      "   +0.2457 if pa>=-0.1113012358546257\n",
      "   +0.2457 if pa>=-0.1415664494037628\n",
      "   +0.2457 if pa>=-0.031737010926008224\n",
      "   -1.4479 if pa>=0.11002523452043533\n",
      "   -1.4479 if pa>=0.12361104041337967\n",
      "   +0.0872 if pav<=0.06422646939754487\n",
      "   -0.3288 if pav>=1.7874646186828613\n",
      "   -0.3288 if pav>=1.8022464513778687\n",
      "   +0.0000 if cv>=0.048942700028419495\n",
      "   -1.1191 if cp<=-0.04840499237179756\n",
      "   +0.0872 if cv>=0.03199116140604019\n",
      "--------------\n",
      "   -0.3412 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.2915 if cp<=0.046974910050630606\n",
      "   -0.3412 if cv>=-0.36624195575714114\n",
      "   -0.3412 if pa<=0.05584583953022957\n",
      "   -0.2915 if cv<=0.9026257634162903\n",
      "   +0.4666 if pa>=0.08121557831764221\n",
      "   +1.0599 if cp<=-0.06698787063360213 & cp>=-0.1326202094554901\n",
      "   +0.4666 if cv<=-0.7526628375053406\n",
      "   -0.5934 if cv<=-0.8291042447090149\n",
      "   -0.7580 if cp>=0.005134062003344298\n",
      "   +1.2003 if cp<=-0.014795880392193792\n",
      "   -0.7580 if cp>=-0.00536457411944866\n",
      "Run episode 129 with rewards 35.0\n",
      "============ 130 ===========\n",
      "42 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.6636 if \n",
      "   +0.6636 if pa>=-0.1113012358546257\n",
      "   +0.6636 if pa>=-0.1415664494037628\n",
      "   +0.6636 if pa>=-0.031737010926008224\n",
      "   -2.4815 if pa>=0.11002523452043533\n",
      "   -2.2390 if pa>=0.12361104041337967\n",
      "   -1.4991 if pav<=0.06422646939754487\n",
      "   +0.8871 if pav>=1.7874646186828613\n",
      "   +0.8871 if pav>=1.8022464513778687\n",
      "   -1.7278 if cp<=-0.04840499237179756\n",
      "   -1.7142 if cv>=0.03199116140604019\n",
      "   -4.4167 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "--------------\n",
      "   +0.8862 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.9927 if cv>=-0.36624195575714114\n",
      "   +4.4228 if pa<=0.05584583953022957\n",
      "   -2.1200 if cv<=0.9026257634162903\n",
      "   +0.6721 if pa>=0.08121557831764221\n",
      "   +0.1367 if cp<=-0.06698787063360213 & cp>=-0.1326202094554901\n",
      "   -0.1034 if cv<=-0.7526628375053406\n",
      "   +1.2302 if cv<=-0.8291042447090149\n",
      "   -1.8004 if cp>=0.005134062003344298\n",
      "   +4.7641 if cp<=-0.014795880392193792\n",
      "   -2.1271 if cp>=-0.00536457411944866\n",
      "   -4.7830 if pa<=0.04895737618207932\n",
      "Run episode 130 with rewards 42.0\n",
      "============ 131 ===========\n",
      "31 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]\n",
      "   +0.1497 if \n",
      "   +0.1497 if pa>=-0.1113012358546257\n",
      "   +0.1497 if pa>=-0.1415664494037628\n",
      "   +0.1153 if pa>=0.11002523452043533\n",
      "   +0.8498 if pa>=0.12361104041337967\n",
      "   -0.5221 if pav<=0.06422646939754487\n",
      "   +2.6953 if pav>=1.7874646186828613\n",
      "   +2.6953 if pav>=1.8022464513778687\n",
      "   -2.4367 if cp<=-0.04840499237179756\n",
      "   +0.4063 if cv>=0.03199116140604019\n",
      "   +0.5349 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   +2.8849 if cp>=-0.0196363005787134 & cv>=0.7546098351478577 & pav<=-0.7724302887916563\n",
      "--------------\n",
      "   +0.3909 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.3648 if cv>=-0.36624195575714114\n",
      "   +0.3833 if pa<=0.05584583953022957\n",
      "   -0.4322 if cv<=0.9026257634162903\n",
      "   -1.0827 if pa>=0.08121557831764221\n",
      "   +0.1462 if cp<=-0.06698787063360213 & cp>=-0.1326202094554901\n",
      "   -1.1854 if cv<=-0.8291042447090149\n",
      "   -3.1366 if cp>=0.005134062003344298\n",
      "   +4.7012 if cp<=-0.014795880392193792\n",
      "   -5.4356 if cp>=-0.00536457411944866\n",
      "   -0.0234 if pa<=0.04895737618207932\n",
      "   -2.7095 if pav>=2.39192271232605\n",
      "Run episode 131 with rewards 31.0\n",
      "============ 132 ===========\n",
      "34 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   -0.6808 if \n",
      "   -0.6810 if pa>=-0.1113012358546257\n",
      "   -0.6808 if pa>=-0.1415664494037628\n",
      "   -0.0000 if pa>=0.12361104041337967\n",
      "   -0.2983 if pav<=0.06422646939754487\n",
      "   -0.0000 if pav>=1.7874646186828613\n",
      "   -0.0000 if pav>=1.8022464513778687\n",
      "   -0.1806 if cp<=-0.04840499237179756\n",
      "   -0.2679 if cv>=0.03199116140604019\n",
      "   -0.1060 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   +2.5095 if cp>=-0.0196363005787134 & cv>=0.7546098351478577 & pav<=-0.7724302887916563\n",
      "   +2.0468 if pa<=-0.05086350068449974\n",
      "--------------\n",
      "   +1.2815 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.2104 if cv>=-0.36624195575714114\n",
      "   -0.0284 if pa<=0.05584583953022957\n",
      "   +0.3172 if cv<=0.9026257634162903\n",
      "   -0.0000 if pa>=0.08121557831764221\n",
      "   +0.0881 if cp<=-0.06698787063360213 & cp>=-0.1326202094554901\n",
      "   -0.0212 if cv<=-0.8291042447090149\n",
      "   -1.6089 if cp>=0.005134062003344298\n",
      "   +2.4896 if cp<=-0.014795880392193792\n",
      "   -4.6001 if cp>=-0.00536457411944866\n",
      "   -0.0000 if pav>=2.39192271232605\n",
      "   +1.9729 if pa>=-0.05086350068449974\n",
      "Run episode 132 with rewards 34.0\n",
      "============ 133 ===========\n",
      "20 actions [1, 1, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0]\n",
      "   +0.3983 if \n",
      "   +0.3987 if pa>=-0.1113012358546257\n",
      "   +0.3987 if pa>=-0.1415664494037628\n",
      "   -0.0137 if pav<=0.06422646939754487\n",
      "   +0.0000 if pav>=1.7874646186828613\n",
      "   +0.0000 if pav>=1.8022464513778687\n",
      "   -0.5032 if cp<=-0.04840499237179756\n",
      "   -0.0137 if cv>=0.03199116140604019\n",
      "   +0.4779 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   +0.7820 if cp>=-0.0196363005787134 & cv>=0.7546098351478577 & pav<=-0.7724302887916563\n",
      "   +0.4997 if pa<=-0.05086350068449974\n",
      "   -2.0661 if cp<=-0.004302615113556371\n",
      "--------------\n",
      "   +1.0072 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.4152 if cv>=-0.36624195575714114\n",
      "   -0.6188 if pa<=0.05584583953022957\n",
      "   -1.3664 if cv<=0.9026257634162903\n",
      "   +0.4020 if cp<=-0.06698787063360213 & cp>=-0.1326202094554901\n",
      "   -0.6724 if cv<=-0.8291042447090149\n",
      "   -1.6639 if cp>=0.005134062003344298\n",
      "   +1.7950 if cp<=-0.014795880392193792\n",
      "   -3.6395 if cp>=-0.00536457411944866\n",
      "   -0.0000 if pav>=2.39192271232605\n",
      "   +0.8476 if pa>=-0.05086350068449974\n",
      "   +2.2778 if cp<=-0.004302615113556371 & pa>=-0.03350066244602203\n",
      "Run episode 133 with rewards 20.0\n",
      "============ 134 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1]\n",
      "   +0.5437 if \n",
      "   +0.3261 if pa>=-0.1113012358546257\n",
      "   +0.5434 if pa>=-0.1415664494037628\n",
      "   -1.3451 if pav<=0.06422646939754487\n",
      "   +0.0000 if pav>=1.8022464513778687\n",
      "   +0.0000 if cp<=-0.04840499237179756\n",
      "   +3.2718 if cv>=0.03199116140604019\n",
      "   +0.0000 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   +0.2173 if cp>=-0.0196363005787134 & cv>=0.7546098351478577 & pav<=-0.7724302887916563\n",
      "   -0.8562 if pa<=-0.05086350068449974\n",
      "   +0.5434 if cp<=-0.004302615113556371\n",
      "   -2.4328 if cp<=-0.007858607079833744 & cv<=0.5525187253952026\n",
      "--------------\n",
      "   -0.2909 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.0671 if cv>=-0.36624195575714114\n",
      "   -1.3959 if pa<=0.05584583953022957\n",
      "   -0.9869 if cv<=0.9026257634162903\n",
      "   +0.0000 if cp<=-0.06698787063360213 & cp>=-0.1326202094554901\n",
      "   +0.0000 if cv<=-0.8291042447090149\n",
      "   -0.0173 if cp>=0.005134062003344298\n",
      "   +5.1170 if cp<=-0.014795880392193792\n",
      "   -0.0173 if cp>=-0.00536457411944866\n",
      "   -0.9284 if pa>=-0.05086350068449974\n",
      "   +0.0000 if cp<=-0.004302615113556371 & pa>=-0.03350066244602203\n",
      "   +5.1539 if cp<=-0.007858607079833744 & cp>=-0.011335084959864615 & cv<=-0.037819355726242065 & cv<=0.15588094890117646\n",
      "Run episode 134 with rewards 11.0\n",
      "============ 135 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1]\n",
      "   +0.4325 if \n",
      "   +0.4325 if pa>=-0.1113012358546257\n",
      "   +0.4325 if pa>=-0.1415664494037628\n",
      "   +0.0693 if pav<=0.06422646939754487\n",
      "   -0.1941 if cp<=-0.04840499237179756\n",
      "   +0.0693 if cv>=0.03199116140604019\n",
      "   -0.0883 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   +0.0000 if cp>=-0.0196363005787134 & cv>=0.7546098351478577 & pav<=-0.7724302887916563\n",
      "   +0.0000 if pa<=-0.05086350068449974\n",
      "   -0.7514 if cp<=-0.004302615113556371\n",
      "   -0.7514 if cp<=-0.007858607079833744 & cv<=0.5525187253952026\n",
      "   +0.0669 if cp>=0.03448614105582237\n",
      "--------------\n",
      "   -0.3154 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.3154 if cv>=-0.36624195575714114\n",
      "   -0.6967 if pa<=0.05584583953022957\n",
      "   -0.2552 if cv<=0.9026257634162903\n",
      "   +0.1070 if cv<=-0.8291042447090149\n",
      "   -0.6967 if cp>=0.005134062003344298\n",
      "   +1.0532 if cp<=-0.014795880392193792\n",
      "   -1.3084 if cp>=-0.00536457411944866\n",
      "   -0.2552 if pa>=-0.05086350068449974\n",
      "   +1.0532 if cp<=-0.004302615113556371 & pa>=-0.03350066244602203\n",
      "   +0.0000 if cp<=-0.007858607079833744 & cp>=-0.011335084959864615 & cv<=-0.037819355726242065 & cv<=0.15588094890117646\n",
      "   +1.0532 if cp<=-0.01935424655675888\n",
      "Run episode 135 with rewards 11.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 136 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 1, 1, 0, 1, 0]\n",
      "   +0.6815 if \n",
      "   +0.6815 if pa>=-0.1113012358546257\n",
      "   +0.6815 if pa>=-0.1415664494037628\n",
      "   +0.0674 if pav<=0.06422646939754487\n",
      "   +1.5716 if cp<=-0.04840499237179756\n",
      "   +0.0000 if cv>=0.03199116140604019\n",
      "   -1.4197 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   +0.0000 if pa<=-0.05086350068449974\n",
      "   -0.0773 if cp<=-0.004302615113556371\n",
      "   -0.0773 if cp<=-0.007858607079833744 & cv<=0.5525187253952026\n",
      "   +0.2106 if cp>=0.03448614105582237\n",
      "   -1.6488 if cp>=-0.05900755897164345 & cv<=-1.0134258270263672\n",
      "--------------\n",
      "   -0.2618 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.1728 if cv>=-0.36624195575714114\n",
      "   -0.9121 if pa<=0.05584583953022957\n",
      "   -0.6467 if cv<=0.9026257634162903\n",
      "   +1.8109 if cv<=-0.8291042447090149\n",
      "   -0.9121 if cp>=0.005134062003344298\n",
      "   -0.3893 if cp<=-0.014795880392193792\n",
      "   -0.9121 if cp>=-0.00536457411944866\n",
      "   -0.6467 if pa>=-0.05086350068449974\n",
      "   +0.2655 if cp<=-0.004302615113556371 & pa>=-0.03350066244602203\n",
      "   -0.3893 if cp<=-0.01935424655675888\n",
      "   +1.6618 if cp>=-0.05900755897164345 & cv<=-1.0134258270263672\n",
      "Run episode 136 with rewards 10.0\n",
      "============ 137 ===========\n",
      "74 actions [1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0]\n",
      "   +0.3558 if \n",
      "   +0.3558 if pa>=-0.1113012358546257\n",
      "   +0.3558 if pa>=-0.1415664494037628\n",
      "   +0.1038 if pav<=0.06422646939754487\n",
      "   +0.4609 if cp<=-0.04840499237179756\n",
      "   +0.0000 if cv>=0.03199116140604019\n",
      "   -1.5000 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   -0.7855 if cp<=-0.004302615113556371\n",
      "   -0.7855 if cp<=-0.007858607079833744 & cv<=0.5525187253952026\n",
      "   +0.0000 if cp>=0.03448614105582237\n",
      "   -0.2249 if cp>=-0.05900755897164345 & cv<=-1.0134258270263672\n",
      "   -0.4061 if cp<=-0.06027389168739319\n",
      "--------------\n",
      "   -0.4127 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.4127 if pa<=0.05584583953022957\n",
      "   -0.3034 if cv<=0.9026257634162903\n",
      "   +1.3971 if cv<=-0.8291042447090149\n",
      "   -0.6556 if cp>=0.005134062003344298\n",
      "   +0.7229 if cp<=-0.014795880392193792\n",
      "   -1.0263 if cp>=-0.00536457411944866\n",
      "   -0.3034 if pa>=-0.05086350068449974\n",
      "   +0.7229 if cp<=-0.004302615113556371 & pa>=-0.03350066244602203\n",
      "   +0.7229 if cp<=-0.01935424655675888\n",
      "   +0.1524 if cp>=-0.05900755897164345 & cv<=-1.0134258270263672\n",
      "   -0.1362 if cp>=0.023108752444386482\n",
      "Run episode 137 with rewards 74.0\n",
      "============ 138 ===========\n",
      "51 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1]\n",
      "   +0.0787 if \n",
      "   +0.0787 if pa>=-0.1113012358546257\n",
      "   +0.0787 if pa>=-0.1415664494037628\n",
      "   -0.2400 if pav<=0.06422646939754487\n",
      "   +1.2028 if cp<=-0.04840499237179756\n",
      "   -0.4667 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   +2.7513 if cp<=-0.004302615113556371\n",
      "   -5.2211 if cp<=-0.007858607079833744 & cv<=0.5525187253952026\n",
      "   +1.9256 if cp>=0.03448614105582237\n",
      "   -0.4278 if cp>=-0.05900755897164345 & cv<=-1.0134258270263672\n",
      "   -2.3693 if cp<=-0.06027389168739319\n",
      "   -1.0214 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "--------------\n",
      "   +1.9084 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.3808 if pa<=0.05584583953022957\n",
      "   -5.9914 if cv<=0.9026257634162903\n",
      "   +3.8557 if cv<=-0.8291042447090149\n",
      "   +3.6910 if cp>=0.005134062003344298\n",
      "   +9.1871 if cp<=-0.014795880392193792\n",
      "   -1.1054 if cp>=-0.00536457411944866\n",
      "   +3.6698 if pa>=-0.05086350068449974\n",
      "   -4.9214 if cp<=-0.004302615113556371 & pa>=-0.03350066244602203\n",
      "   -4.1425 if cp<=-0.01935424655675888\n",
      "   +0.0830 if cp>=-0.05900755897164345 & cv<=-1.0134258270263672\n",
      "   +4.8622 if cp<=-0.004911469854414456 & cv<=0.4224217414855957\n",
      "Run episode 138 with rewards 51.0\n",
      "============ 139 ===========\n",
      "23 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1]\n",
      "   -1.0091 if pa>=-0.1113012358546257\n",
      "   +0.7297 if pa>=-0.1415664494037628\n",
      "   -2.6103 if pav<=0.06422646939754487\n",
      "   +0.1865 if cp<=-0.04840499237179756\n",
      "   +1.5139 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   +2.8795 if cp<=-0.004302615113556371\n",
      "   -4.5532 if cp<=-0.007858607079833744 & cv<=0.5525187253952026\n",
      "   +1.4550 if cp>=0.03448614105582237\n",
      "   +1.5656 if cp>=-0.05900755897164345 & cv<=-1.0134258270263672\n",
      "   -0.6896 if cp<=-0.06027389168739319\n",
      "   +0.8729 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   +3.7474 if cp<=-0.1234923005104065 & cv>=0.550218939781189\n",
      "--------------\n",
      "   +2.1066 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -3.6031 if pa<=0.05584583953022957\n",
      "   -9.0111 if cv<=0.9026257634162903\n",
      "   -1.1924 if cv<=-0.8291042447090149\n",
      "   +5.5472 if cp>=0.005134062003344298\n",
      "   +2.0662 if cp<=-0.014795880392193792\n",
      "   -0.7470 if cp>=-0.00536457411944866\n",
      "   +4.6490 if pa>=-0.05086350068449974\n",
      "   -3.2479 if cp<=-0.004302615113556371 & pa>=-0.03350066244602203\n",
      "   +2.0662 if cp<=-0.01935424655675888\n",
      "   +4.9688 if cp<=-0.004911469854414456 & cv<=0.4224217414855957\n",
      "   +4.9260 if cp>=-0.1234923005104065 & cv<=0.7454566359519958\n",
      "Run episode 139 with rewards 23.0\n",
      "============ 140 ===========\n",
      "23 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1]\n",
      "   -0.1361 if pa>=-0.1113012358546257\n",
      "   +0.8638 if pa>=-0.1415664494037628\n",
      "   -1.1699 if pav<=0.06422646939754487\n",
      "   +1.6410 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   -0.2247 if cp<=-0.004302615113556371\n",
      "   -0.2247 if cp<=-0.007858607079833744 & cv<=0.5525187253952026\n",
      "   +2.2390 if cp>=0.03448614105582237\n",
      "   +0.4778 if cp>=-0.05900755897164345 & cv<=-1.0134258270263672\n",
      "   +1.1632 if cp<=-0.06027389168739319\n",
      "   -0.1766 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   +0.0000 if cp<=-0.1234923005104065 & cv>=0.550218939781189\n",
      "   -2.2165 if cv<=-1.3182264566421509\n",
      "--------------\n",
      "   +2.4875 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.7495 if pa<=0.05584583953022957\n",
      "   -3.3262 if cv<=0.9026257634162903\n",
      "   -1.3546 if cv<=-0.8291042447090149\n",
      "   -2.1252 if cp>=0.005134062003344298\n",
      "   +1.2773 if cp<=-0.014795880392193792\n",
      "   +3.3669 if pa>=-0.05086350068449974\n",
      "   -1.2010 if cp<=-0.004302615113556371 & pa>=-0.03350066244602203\n",
      "   +1.2773 if cp<=-0.01935424655675888\n",
      "   -1.2010 if cp<=-0.004911469854414456 & cv<=0.4224217414855957\n",
      "   +1.9020 if cp>=-0.1234923005104065 & cv<=0.7454566359519958\n",
      "   +1.9648 if cv<=-1.3182264566421509\n",
      "Run episode 140 with rewards 23.0\n",
      "============ 141 ===========\n",
      "19 actions [1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0]\n",
      "   -0.1754 if pa>=-0.1113012358546257\n",
      "   +0.7655 if pa>=-0.1415664494037628\n",
      "   -1.3633 if pav<=0.06422646939754487\n",
      "   +1.6183 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   -1.7480 if cp<=-0.004302615113556371\n",
      "   +0.0976 if cp<=-0.007858607079833744 & cv<=0.5525187253952026\n",
      "   +1.1307 if cp>=0.03448614105582237\n",
      "   +0.1626 if cp>=-0.05900755897164345 & cv<=-1.0134258270263672\n",
      "   +1.4557 if cp<=-0.06027389168739319\n",
      "   +0.8902 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   -2.1628 if cv<=-1.3182264566421509\n",
      "   -0.8918 if cp<=0.010286404751241218 & pa<=-0.029085673391818983 & pa>=-0.06972404122352599\n",
      "--------------\n",
      "   +1.3373 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.8414 if cv<=0.9026257634162903\n",
      "   -1.2191 if cv<=-0.8291042447090149\n",
      "   -2.5320 if cp>=0.005134062003344298\n",
      "   -0.3193 if cp<=-0.014795880392193792\n",
      "   +2.3295 if pa>=-0.05086350068449974\n",
      "   +0.2403 if cp<=-0.004302615113556371 & pa>=-0.03350066244602203\n",
      "   -0.3193 if cp<=-0.01935424655675888\n",
      "   +0.1906 if cp<=-0.004911469854414456 & cv<=0.4224217414855957\n",
      "   +0.6869 if cp>=-0.1234923005104065 & cv<=0.7454566359519958\n",
      "   +2.4302 if cv<=-1.3182264566421509\n",
      "   -2.2710 if cp>=0.010286404751241218\n",
      "Run episode 141 with rewards 19.0\n",
      "============ 142 ===========\n",
      "30 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.5430 if pa>=-0.1113012358546257\n",
      "   +0.5430 if pa>=-0.1415664494037628\n",
      "   -0.0641 if pav<=0.06422646939754487\n",
      "   +0.3565 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   -0.0449 if cp<=-0.004302615113556371\n",
      "   +1.6236 if cp>=0.03448614105582237\n",
      "   +2.5048 if cp>=-0.05900755897164345 & cv<=-1.0134258270263672\n",
      "   -2.2211 if cp<=-0.06027389168739319\n",
      "   +0.1397 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   +2.4565 if cv<=-1.3182264566421509\n",
      "   -0.0000 if cp<=0.010286404751241218 & pa<=-0.029085673391818983 & pa>=-0.06972404122352599\n",
      "   -2.9607 if cp<=0.007474425993859768\n",
      "--------------\n",
      "   +1.4338 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.1238 if cv<=0.9026257634162903\n",
      "   -1.3283 if cv<=-0.8291042447090149\n",
      "   -1.1403 if cp>=0.005134062003344298\n",
      "   +2.2390 if cp<=-0.014795880392193792\n",
      "   +0.6853 if pa>=-0.05086350068449974\n",
      "   -0.2371 if cp<=-0.004302615113556371 & pa>=-0.03350066244602203\n",
      "   +2.2390 if cp<=-0.01935424655675888\n",
      "   +1.7617 if cp>=-0.1234923005104065 & cv<=0.7454566359519958\n",
      "   -2.6458 if cv<=-1.3182264566421509\n",
      "   -3.8079 if cp>=0.010286404751241218\n",
      "   -1.8918 if cp>=0.034288951754570016\n",
      "Run episode 142 with rewards 30.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 143 ===========\n",
      "18 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.4960 if pa>=-0.1113012358546257\n",
      "   +1.4960 if pa>=-0.1415664494037628\n",
      "   -0.4841 if pav<=0.06422646939754487\n",
      "   +4.3859 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   -0.0688 if cp<=-0.004302615113556371\n",
      "   +0.3379 if cp>=0.03448614105582237\n",
      "   +4.3857 if cp>=-0.05900755897164345 & cv<=-1.0134258270263672\n",
      "   -0.0001 if cp<=-0.06027389168739319\n",
      "   -0.8377 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   +4.3857 if cv<=-1.3182264566421509\n",
      "   -4.0515 if cp<=0.007474425993859768\n",
      "   +0.2439 if pa<=-0.040273288637399665\n",
      "--------------\n",
      "   +1.9263 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -4.3842 if cv<=-0.8291042447090149\n",
      "   -2.1199 if cp>=0.005134062003344298\n",
      "   -0.6249 if cp<=-0.014795880392193792\n",
      "   +1.5050 if pa>=-0.05086350068449974\n",
      "   +0.7763 if cp<=-0.004302615113556371 & pa>=-0.03350066244602203\n",
      "   -0.6249 if cp<=-0.01935424655675888\n",
      "   -0.0745 if cp>=-0.1234923005104065 & cv<=0.7454566359519958\n",
      "   -4.3880 if cv<=-1.3182264566421509\n",
      "   -4.3368 if cp>=0.010286404751241218\n",
      "   -0.2806 if cp>=0.034288951754570016\n",
      "   -2.3976 if pa>=0.1696242392063141\n",
      "Run episode 143 with rewards 18.0\n",
      "============ 144 ===========\n",
      "11 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0262 if pa>=-0.1113012358546257\n",
      "   +0.0262 if pa>=-0.1415664494037628\n",
      "   -0.7925 if pav<=0.06422646939754487\n",
      "   +0.6365 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   +0.6142 if cp<=-0.004302615113556371\n",
      "   +0.3038 if cp>=0.03448614105582237\n",
      "   +0.6137 if cp>=-0.05900755897164345 & cv<=-1.0134258270263672\n",
      "   -0.7797 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   +0.0020 if cv<=-1.3182264566421509\n",
      "   -1.3839 if cp<=0.007474425993859768\n",
      "   -0.5880 if pa<=-0.040273288637399665\n",
      "   +0.0423 if cp>=0.04377919062972069\n",
      "--------------\n",
      "   +1.9661 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.9353 if cv<=-0.8291042447090149\n",
      "   -0.5187 if cp>=0.005134062003344298\n",
      "   +1.0393 if cp<=-0.014795880392193792\n",
      "   +1.6724 if pa>=-0.05086350068449974\n",
      "   +1.0393 if cp<=-0.004302615113556371 & pa>=-0.03350066244602203\n",
      "   +1.0393 if cp<=-0.01935424655675888\n",
      "   +2.3657 if cv<=-1.3182264566421509\n",
      "   -1.7477 if cp>=0.010286404751241218\n",
      "   -0.4105 if cp>=0.034288951754570016\n",
      "   +5.0320 if pa>=0.1696242392063141\n",
      "   +2.3657 if cp<=-0.046777307242155064\n",
      "Run episode 144 with rewards 11.0\n",
      "============ 145 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -1.1674 if pa>=-0.1113012358546257\n",
      "   -0.5529 if pa>=-0.1415664494037628\n",
      "   +0.0029 if pav<=0.06422646939754487\n",
      "   -0.0000 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   -0.0000 if cp<=-0.004302615113556371\n",
      "   +0.3429 if cp>=0.03448614105582237\n",
      "   -0.0000 if cp>=-0.05900755897164345 & cv<=-1.0134258270263672\n",
      "   +0.0955 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   -0.0000 if cp<=0.007474425993859768\n",
      "   +0.0029 if pa<=-0.040273288637399665\n",
      "   +0.3429 if cp>=0.04377919062972069\n",
      "   -3.3654 if cp<=0.044184502214193344\n",
      "--------------\n",
      "   +3.6267 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.0000 if cv<=-0.8291042447090149\n",
      "   -1.6331 if cp>=0.005134062003344298\n",
      "   +0.0000 if cp<=-0.014795880392193792\n",
      "   +1.9189 if pa>=-0.05086350068449974\n",
      "   +0.0000 if cp<=-0.004302615113556371 & pa>=-0.03350066244602203\n",
      "   +0.0000 if cp<=-0.01935424655675888\n",
      "   +0.0000 if cv<=-1.3182264566421509\n",
      "   -1.6331 if cp>=0.010286404751241218\n",
      "   +0.0000 if pa>=0.1696242392063141\n",
      "   +0.0000 if cp<=-0.046777307242155064\n",
      "   +3.0977 if cp<=0.044184502214193344 & cv>=0.7988568544387817\n",
      "Run episode 145 with rewards 10.0\n",
      "============ 146 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.4589 if pa>=-0.1113012358546257\n",
      "   +0.2688 if pa>=-0.1415664494037628\n",
      "   -2.0150 if pav<=0.06422646939754487\n",
      "   +0.0000 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   +0.0000 if cp<=-0.004302615113556371\n",
      "   -1.5612 if cp>=0.03448614105582237\n",
      "   -1.6240 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   +0.0000 if cp<=0.007474425993859768\n",
      "   -1.5609 if pa<=-0.040273288637399665\n",
      "   -1.5612 if cp>=0.04377919062972069\n",
      "   -0.4538 if cp<=0.044184502214193344\n",
      "   -1.5657 if cp>=0.029651553183794022\n",
      "--------------\n",
      "   +0.1905 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +1.7059 if cp>=0.005134062003344298\n",
      "   -0.0000 if cp<=-0.014795880392193792\n",
      "   +0.1905 if pa>=-0.05086350068449974\n",
      "   -0.0000 if cp<=-0.004302615113556371 & pa>=-0.03350066244602203\n",
      "   -0.0000 if cp<=-0.01935424655675888\n",
      "   -0.0000 if cv<=-1.3182264566421509\n",
      "   +1.7059 if cp>=0.010286404751241218\n",
      "   -0.0000 if pa>=0.1696242392063141\n",
      "   -0.0000 if cp<=-0.046777307242155064\n",
      "   -0.0000 if cp<=0.044184502214193344 & cv>=0.7988568544387817\n",
      "   -0.6739 if cv>=1.5380133390426636\n",
      "Run episode 146 with rewards 10.0\n",
      "============ 147 ===========\n",
      "10 actions [1, 1, 1, 1, 0, 1, 1, 1, 1, 1]\n",
      "   -0.3853 if pa>=-0.1113012358546257\n",
      "   -0.3853 if pa>=-0.1415664494037628\n",
      "   -0.3470 if pav<=0.06422646939754487\n",
      "   -0.0000 if cp<=0.17256624996662143 & pav>=1.2188693523406984\n",
      "   -0.3470 if cp>=0.03448614105582237\n",
      "   -0.1819 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   -0.0000 if cp<=0.007474425993859768\n",
      "   -0.0079 if pa<=-0.040273288637399665\n",
      "   -0.1819 if cp>=0.04377919062972069\n",
      "   -0.1651 if cp<=0.044184502214193344\n",
      "   -0.3470 if cp>=0.029651553183794022\n",
      "   -0.0746 if pa>=0.01658451557159424\n",
      "--------------\n",
      "   +0.1148 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.1151 if cp>=0.005134062003344298\n",
      "   +0.0000 if cp<=-0.014795880392193792\n",
      "   +0.1148 if pa>=-0.05086350068449974\n",
      "   +0.0000 if cp<=-0.01935424655675888\n",
      "   +0.0000 if cv<=-1.3182264566421509\n",
      "   +0.1151 if cp>=0.010286404751241218\n",
      "   +0.0000 if pa>=0.1696242392063141\n",
      "   +0.0000 if cp<=-0.046777307242155064\n",
      "   +0.0000 if cp<=0.044184502214193344 & cv>=0.7988568544387817\n",
      "   -0.0001 if cv>=1.5380133390426636\n",
      "   +0.0086 if cp<=0.09100903272628785 & cp>=0.046229171007871626\n",
      "Run episode 147 with rewards 10.0\n",
      "============ 148 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 0, 1, 1]\n",
      "   -0.0493 if pa>=-0.1113012358546257\n",
      "   -0.1098 if pa>=-0.1415664494037628\n",
      "   -0.0006 if pav<=0.06422646939754487\n",
      "   -0.5996 if cp>=0.03448614105582237\n",
      "   +1.1254 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   -3.6244 if cp<=0.007474425993859768\n",
      "   -1.6023 if pa<=-0.040273288637399665\n",
      "   -0.1484 if cp>=0.04377919062972069\n",
      "   +0.1478 if cp<=0.044184502214193344\n",
      "   -1.6023 if cp>=0.029651553183794022\n",
      "   +0.0000 if pa>=0.01658451557159424\n",
      "   +0.0486 if cp>=0.061227437853813176\n",
      "--------------\n",
      "   +2.2976 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.5311 if cp>=0.005134062003344298\n",
      "   -0.9221 if pa>=-0.05086350068449974\n",
      "   +0.0000 if cp<=-0.01935424655675888\n",
      "   +0.0000 if cv<=-1.3182264566421509\n",
      "   -1.5311 if cp>=0.010286404751241218\n",
      "   +0.0000 if pa>=0.1696242392063141\n",
      "   +0.0000 if cp<=-0.046777307242155064\n",
      "   +0.0000 if cp<=0.044184502214193344 & cv>=0.7988568544387817\n",
      "   +0.0000 if cv>=1.5380133390426636\n",
      "   +0.8473 if cp<=0.09100903272628785 & cp>=0.046229171007871626\n",
      "   +2.0408 if cp>=0.03555812425911427\n",
      "Run episode 148 with rewards 9.0\n",
      "============ 149 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -0.7147 if pa>=-0.1113012358546257\n",
      "   -0.4099 if pa>=-0.1415664494037628\n",
      "   +0.4742 if pav<=0.06422646939754487\n",
      "   +0.8841 if cp>=0.03448614105582237\n",
      "   +0.5675 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   -0.7147 if cp<=0.007474425993859768\n",
      "   +0.5675 if pa<=-0.040273288637399665\n",
      "   +2.0781 if cp>=0.04377919062972069\n",
      "   -1.6038 if cp<=0.044184502214193344\n",
      "   +0.8841 if cp>=0.029651553183794022\n",
      "   +0.0000 if cp>=0.061227437853813176\n",
      "   -1.9086 if cv<=1.0829041719436647\n",
      "--------------\n",
      "   +0.6383 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.5897 if cp>=0.005134062003344298\n",
      "   +0.5048 if pa>=-0.05086350068449974\n",
      "   -0.0000 if cv<=-1.3182264566421509\n",
      "   -1.5897 if cp>=0.010286404751241218\n",
      "   -0.0000 if pa>=0.1696242392063141\n",
      "   -0.0000 if cp<=-0.046777307242155064\n",
      "   +0.6116 if cp<=0.044184502214193344 & cv>=0.7988568544387817\n",
      "   -0.0000 if cv>=1.5380133390426636\n",
      "   -2.0225 if cp<=0.09100903272628785 & cp>=0.046229171007871626\n",
      "   -1.0945 if cp>=0.03555812425911427\n",
      "   +0.9281 if cp>=0.025735512748360643 & cv<=1.0829041719436647\n",
      "Run episode 149 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 150 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.9122 if pa>=-0.1113012358546257\n",
      "   -0.7824 if pa>=-0.1415664494037628\n",
      "   -0.8003 if pav<=0.06422646939754487\n",
      "   +0.1119 if cp>=0.03448614105582237\n",
      "   -0.5991 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   -0.3275 if cp<=0.007474425993859768\n",
      "   -0.5199 if pa<=-0.040273288637399665\n",
      "   +0.1119 if cp>=0.04377919062972069\n",
      "   -0.9122 if cp<=0.044184502214193344\n",
      "   +0.1119 if cp>=0.029651553183794022\n",
      "   -0.3275 if cv<=1.0829041719436647\n",
      "   -0.2804 if cp<=-0.0235149297863245\n",
      "--------------\n",
      "   +0.4288 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.3223 if cp>=0.005134062003344298\n",
      "   +0.4288 if pa>=-0.05086350068449974\n",
      "   +0.3223 if cp>=0.010286404751241218\n",
      "   +0.0000 if pa>=0.1696242392063141\n",
      "   +0.0000 if cp<=-0.046777307242155064\n",
      "   +0.3971 if cp<=0.044184502214193344 & cv>=0.7988568544387817\n",
      "   +0.0000 if cv>=1.5380133390426636\n",
      "   +0.0269 if cp<=0.09100903272628785 & cp>=0.046229171007871626\n",
      "   +0.0073 if cp>=0.03555812425911427\n",
      "   +0.0000 if cp>=0.025735512748360643 & cv<=1.0829041719436647\n",
      "   +0.4789 if cp>=-0.0235149297863245\n",
      "Run episode 150 with rewards 9.0\n",
      "============ 151 ===========\n",
      "8 actions [1, 1, 1, 1, 1, 1, 0, 0]\n",
      "   -0.6857 if pa>=-0.1113012358546257\n",
      "   -1.4262 if pa>=-0.1415664494037628\n",
      "   +0.6241 if pav<=0.06422646939754487\n",
      "   +0.7093 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   -0.6857 if cp<=0.007474425993859768\n",
      "   +0.7780 if pa<=-0.040273288637399665\n",
      "   +2.8269 if cp>=0.04377919062972069\n",
      "   -2.2028 if cp<=0.044184502214193344\n",
      "   +2.0503 if cp>=0.029651553183794022\n",
      "   -0.6857 if cv<=1.0829041719436647\n",
      "   -0.4195 if cp<=-0.0235149297863245\n",
      "   +1.0425 if cp>=-0.01241636425256728\n",
      "--------------\n",
      "   +0.2630 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.6428 if cp>=0.005134062003344298\n",
      "   +0.2440 if pa>=-0.05086350068449974\n",
      "   -2.0682 if cp>=0.010286404751241218\n",
      "   -0.0000 if pa>=0.1696242392063141\n",
      "   +1.2204 if cp<=0.044184502214193344 & cv>=0.7988568544387817\n",
      "   -0.0000 if cv>=1.5380133390426636\n",
      "   -2.8296 if cp<=0.09100903272628785 & cp>=0.046229171007871626\n",
      "   -2.8296 if cp>=0.03555812425911427\n",
      "   -0.0000 if cp>=0.025735512748360643 & cv<=1.0829041719436647\n",
      "   -1.6092 if cp>=-0.0235149297863245\n",
      "   +0.7219 if cp<=0.018412029184401043\n",
      "Run episode 151 with rewards 8.0\n",
      "============ 152 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n",
      "   -0.6670 if pa>=-0.1113012358546257\n",
      "   -0.5107 if pa>=-0.1415664494037628\n",
      "   -0.5139 if pav<=0.06422646939754487\n",
      "   -0.2994 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   -0.6670 if cp<=0.007474425993859768\n",
      "   -0.5139 if pa<=-0.040273288637399665\n",
      "   -0.0032 if cp>=0.04377919062972069\n",
      "   -0.5107 if cp<=0.044184502214193344\n",
      "   -0.0032 if cp>=0.029651553183794022\n",
      "   -0.6702 if cv<=1.0829041719436647\n",
      "   +0.1020 if cp>=-0.01241636425256728\n",
      "   +0.1563 if cv>=1.145225167274475\n",
      "--------------\n",
      "   +0.1980 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.4645 if cp>=0.005134062003344298\n",
      "   +0.1980 if pa>=-0.05086350068449974\n",
      "   -0.4645 if cp>=0.010286404751241218\n",
      "   -0.2304 if cp<=0.044184502214193344 & cv>=0.7988568544387817\n",
      "   +0.0000 if cv>=1.5380133390426636\n",
      "   +0.0000 if cp<=0.09100903272628785 & cp>=0.046229171007871626\n",
      "   +0.0005 if cp>=0.03555812425911427\n",
      "   +0.0005 if cp>=0.025735512748360643 & cv<=1.0829041719436647\n",
      "   -0.1125 if cp>=-0.0235149297863245\n",
      "   +0.6484 if cp<=0.018412029184401043\n",
      "   +0.1840 if \n",
      "Run episode 152 with rewards 10.0\n",
      "============ 153 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.4048 if pa>=-0.1113012358546257\n",
      "   -0.4497 if pa>=-0.1415664494037628\n",
      "   -2.7521 if pav<=0.06422646939754487\n",
      "   -2.5280 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   +0.1855 if cp<=0.007474425993859768\n",
      "   -2.2118 if pa<=-0.040273288637399665\n",
      "   -0.3154 if cp<=0.044184502214193344\n",
      "   -2.5096 if cp>=0.029651553183794022\n",
      "   -0.3539 if cv<=1.0829041719436647\n",
      "   -2.8667 if cp>=-0.01241636425256728\n",
      "   -2.3113 if cv>=1.145225167274475\n",
      "   +0.0634 if cp>=0.11340034604072571\n",
      "--------------\n",
      "   -0.0416 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +2.4453 if cp>=0.005134062003344298\n",
      "   -0.0416 if pa>=-0.05086350068449974\n",
      "   +2.4453 if cp>=0.010286404751241218\n",
      "   +0.0550 if cp<=0.044184502214193344 & cv>=0.7988568544387817\n",
      "   -0.0314 if cp<=0.09100903272628785 & cp>=0.046229171007871626\n",
      "   +2.3920 if cp>=0.03555812425911427\n",
      "   -0.0427 if cp>=0.025735512748360643 & cv<=1.0829041719436647\n",
      "   +2.3613 if cp>=-0.0235149297863245\n",
      "   +0.1547 if cp<=0.018412029184401043\n",
      "   +2.3784 if \n",
      "   +0.9835 if cp<=0.026253991574048997\n",
      "Run episode 153 with rewards 9.0\n",
      "============ 154 ===========\n",
      "15 actions [0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1]\n",
      "   -0.0007 if pa>=-0.1113012358546257\n",
      "   -0.0007 if pa>=-0.1415664494037628\n",
      "   -0.0007 if pav<=0.06422646939754487\n",
      "   -0.0004 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   +0.0000 if cp<=0.007474425993859768\n",
      "   -0.0003 if pa<=-0.040273288637399665\n",
      "   -0.0005 if cp<=0.044184502214193344\n",
      "   -0.0007 if cp>=0.029651553183794022\n",
      "   -0.0007 if cv<=1.0829041719436647\n",
      "   -0.0007 if cp>=-0.01241636425256728\n",
      "   +0.0000 if cv>=1.145225167274475\n",
      "   -0.0001 if cp>=0.07211526557803155\n",
      "--------------\n",
      "   +0.0031 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.0032 if cp>=0.005134062003344298\n",
      "   +0.0031 if pa>=-0.05086350068449974\n",
      "   +0.0032 if cp>=0.010286404751241218\n",
      "   -0.0000 if cp<=0.044184502214193344 & cv>=0.7988568544387817\n",
      "   +0.0032 if cp>=0.03555812425911427\n",
      "   +0.0032 if cp>=0.025735512748360643 & cv<=1.0829041719436647\n",
      "   +0.0032 if cp>=-0.0235149297863245\n",
      "   -0.0000 if cp<=0.018412029184401043\n",
      "   +0.0032 if \n",
      "   -0.0000 if cp<=0.026253991574048997\n",
      "   +0.0032 if cp<=0.07211526557803155\n",
      "Run episode 154 with rewards 15.0\n",
      "============ 155 ===========\n",
      "56 actions [0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1]\n",
      "   -1.1970 if pa>=-0.1113012358546257\n",
      "   +1.3634 if pa>=-0.1415664494037628\n",
      "   +1.5289 if pav<=0.06422646939754487\n",
      "   -1.7633 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   -0.2989 if pa<=-0.040273288637399665\n",
      "   +0.0957 if cp<=0.044184502214193344\n",
      "   -0.2989 if cp>=0.029651553183794022\n",
      "   -1.3978 if cv<=1.0829041719436647\n",
      "   -1.3978 if cp>=-0.01241636425256728\n",
      "   +0.0000 if cv>=1.145225167274475\n",
      "   -0.2008 if cp>=0.07211526557803155\n",
      "   +3.4071 if cp>=0.0229519534856081\n",
      "--------------\n",
      "   -0.9740 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.0602 if cp>=0.005134062003344298\n",
      "   -0.9740 if pa>=-0.05086350068449974\n",
      "   +0.0602 if cp>=0.010286404751241218\n",
      "   +1.0345 if cp>=0.03555812425911427\n",
      "   -1.3133 if cp>=0.025735512748360643 & cv<=1.0829041719436647\n",
      "   +0.0602 if cp>=-0.0235149297863245\n",
      "   -2.2041 if cp<=0.018412029184401043\n",
      "   +0.0602 if \n",
      "   +1.3735 if cp<=0.026253991574048997\n",
      "   +0.9002 if cp<=0.07211526557803155\n",
      "   +3.9268 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "Run episode 155 with rewards 56.0\n",
      "============ 156 ===========\n",
      "142 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0]\n",
      "   -2.0786 if pa>=-0.1113012358546257\n",
      "   -2.0785 if pa>=-0.1415664494037628\n",
      "   +3.6213 if pav<=0.06422646939754487\n",
      "   +3.5665 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   +0.0002 if pa<=-0.040273288637399665\n",
      "   +0.8772 if cp<=0.044184502214193344\n",
      "   +5.0643 if cp>=0.029651553183794022\n",
      "   -2.0785 if cv<=1.0829041719436647\n",
      "   +1.4131 if cp>=-0.01241636425256728\n",
      "   +0.0001 if cp>=0.07211526557803155\n",
      "   -0.8118 if cp>=0.0229519534856081\n",
      "   +5.2723 if cp<=0.006250881124287844 & cv>=-0.0208522230386734 & pa<=0.020050277933478355\n",
      "--------------\n",
      "   +2.4755 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -2.3567 if cp>=0.005134062003344298\n",
      "   +2.4755 if pa>=-0.05086350068449974\n",
      "   +1.8948 if cp>=0.010286404751241218\n",
      "   +2.0232 if cp>=0.03555812425911427\n",
      "   -2.0959 if cp>=0.025735512748360643 & cv<=1.0829041719436647\n",
      "   -7.2628 if cp>=-0.0235149297863245\n",
      "   -6.4203 if cp<=0.018412029184401043\n",
      "   +4.5704 if cp<=0.026253991574048997\n",
      "   +2.4755 if cp<=0.07211526557803155\n",
      "   +3.3197 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   -2.5443 if cv>=0.1783861517906189 & pa>=0.03013694100081921\n",
      "Run episode 156 with rewards 142.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 157 ===========\n",
      "33 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +0.9124 if pa>=-0.1113012358546257\n",
      "   -3.9135 if pa>=-0.1415664494037628\n",
      "   +5.1745 if pav<=0.06422646939754487\n",
      "   +2.4319 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   -2.2723 if pa<=-0.040273288637399665\n",
      "   +0.3576 if cp<=0.044184502214193344\n",
      "   -0.0014 if cp>=0.029651553183794022\n",
      "   +0.3572 if cv<=1.0829041719436647\n",
      "   -1.0783 if cp>=-0.01241636425256728\n",
      "   -0.0002 if cp>=0.0229519534856081\n",
      "   +0.7376 if cp<=0.006250881124287844 & cv>=-0.0208522230386734 & pa<=0.020050277933478355\n",
      "   +5.1449 if cp>=-0.009269407950341702\n",
      "--------------\n",
      "   +8.8125 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.0000 if cp>=0.005134062003344298\n",
      "   +6.4029 if pa>=-0.05086350068449974\n",
      "   -0.0000 if cp>=0.03555812425911427\n",
      "   -0.0000 if cp>=0.025735512748360643 & cv<=1.0829041719436647\n",
      "   -7.0090 if cp>=-0.0235149297863245\n",
      "   +0.1587 if cp<=0.018412029184401043\n",
      "   +0.1587 if cp<=0.026253991574048997\n",
      "   +0.1587 if cp<=0.07211526557803155\n",
      "   +3.0723 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   -0.0000 if cv>=0.1783861517906189 & pa>=0.03013694100081921\n",
      "  -10.3043 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "Run episode 157 with rewards 33.0\n",
      "============ 158 ===========\n",
      "41 actions [0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0]\n",
      "   -0.9355 if pa>=-0.1113012358546257\n",
      "   -0.9355 if pa>=-0.1415664494037628\n",
      "   +3.2618 if pav<=0.06422646939754487\n",
      "   +3.2414 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   +0.0000 if pa<=-0.040273288637399665\n",
      "   +3.3723 if cp<=0.044184502214193344\n",
      "   +0.5982 if cp>=0.029651553183794022\n",
      "   -4.1745 if cv<=1.0829041719436647\n",
      "   +2.6314 if cp>=-0.01241636425256728\n",
      "   +0.0011 if cp<=0.006250881124287844 & cv>=-0.0208522230386734 & pa<=0.020050277933478355\n",
      "   +2.5788 if cp>=-0.009269407950341702\n",
      "   +2.7121 if pa<=-0.024416998401284216\n",
      "--------------\n",
      "   +3.5043 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +1.0579 if cp>=0.005134062003344298\n",
      "   +1.1339 if pa>=-0.05086350068449974\n",
      "   +1.6159 if cp>=0.025735512748360643 & cv<=1.0829041719436647\n",
      "   -6.0800 if cp>=-0.0235149297863245\n",
      "   -0.4537 if cp<=0.018412029184401043\n",
      "   -0.4820 if cp<=0.026253991574048997\n",
      "   +1.1339 if cp<=0.07211526557803155\n",
      "   +0.9856 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   +2.0052 if cv>=0.1783861517906189 & pa>=0.03013694100081921\n",
      "   -4.4531 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   +2.5093 if cv<=-0.38099486827850343\n",
      "Run episode 158 with rewards 41.0\n",
      "============ 159 ===========\n",
      "37 actions [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   -0.9887 if pa>=-0.1113012358546257\n",
      "   -0.9887 if pa>=-0.1415664494037628\n",
      "   +0.2794 if pav<=0.06422646939754487\n",
      "   +2.8142 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   +1.0252 if cp<=0.044184502214193344\n",
      "   -1.0978 if cp>=0.029651553183794022\n",
      "   -0.6638 if cv<=1.0829041719436647\n",
      "   +1.6283 if cp>=-0.01241636425256728\n",
      "   +0.0812 if cp<=0.006250881124287844 & cv>=-0.0208522230386734 & pa<=0.020050277933478355\n",
      "   +1.3638 if cp>=-0.009269407950341702\n",
      "   +0.0000 if pa<=-0.024416998401284216\n",
      "   +2.9512 if pav<=0.07888057827949524\n",
      "--------------\n",
      "   +2.5683 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +1.0989 if cp>=0.005134062003344298\n",
      "   +2.6043 if pa>=-0.05086350068449974\n",
      "   +1.0989 if cp>=0.025735512748360643 & cv<=1.0829041719436647\n",
      "   -5.5614 if cp>=-0.0235149297863245\n",
      "   +1.5054 if cp<=0.026253991574048997\n",
      "   -1.7227 if cp<=0.07211526557803155\n",
      "   -0.1854 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   +2.2775 if cv>=0.1783861517906189 & pa>=0.03013694100081921\n",
      "   -5.9597 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   +0.0513 if cv<=-0.38099486827850343\n",
      "   +1.2677 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "Run episode 159 with rewards 37.0\n",
      "============ 160 ===========\n",
      "28 actions [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.1529 if pa>=-0.1113012358546257\n",
      "   +0.1529 if pa>=-0.1415664494037628\n",
      "   +0.5056 if pav<=0.06422646939754487\n",
      "   +1.2683 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   -0.1467 if cp<=0.044184502214193344\n",
      "   +0.3086 if cp>=0.029651553183794022\n",
      "   -1.7354 if cv<=1.0829041719436647\n",
      "   +0.9805 if cp>=-0.01241636425256728\n",
      "   -0.5324 if cp<=0.006250881124287844 & cv>=-0.0208522230386734 & pa<=0.020050277933478355\n",
      "   +0.9402 if cp>=-0.009269407950341702\n",
      "   +0.5056 if pav<=0.07888057827949524\n",
      "   +1.8882 if cv>=1.1966038942337036\n",
      "--------------\n",
      "   +1.8813 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.4048 if cp>=0.005134062003344298\n",
      "   +1.7878 if pa>=-0.05086350068449974\n",
      "   -0.3940 if cp>=0.025735512748360643 & cv<=1.0829041719436647\n",
      "   -3.6746 if cp>=-0.0235149297863245\n",
      "   +2.1818 if cp<=0.026253991574048997\n",
      "   +1.7878 if cp<=0.07211526557803155\n",
      "   -1.1051 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   -0.5516 if cv>=0.1783861517906189 & pa>=0.03013694100081921\n",
      "   -5.2649 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -1.2828 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   +0.0376 if pa>=0.0507584407925606 & pav<=1.1632689952850341\n",
      "Run episode 160 with rewards 28.0\n",
      "============ 161 ===========\n",
      "26 actions [0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.2171 if pa>=-0.1113012358546257\n",
      "   +0.2171 if pa>=-0.1415664494037628\n",
      "   +0.6277 if pav<=0.06422646939754487\n",
      "   +0.7051 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   +0.0375 if cp>=0.029651553183794022\n",
      "   -0.3553 if cv<=1.0829041719436647\n",
      "   +1.3562 if cp>=-0.01241636425256728\n",
      "   -0.0000 if cp<=0.006250881124287844 & cv>=-0.0208522230386734 & pa<=0.020050277933478355\n",
      "   +0.9243 if cp>=-0.009269407950341702\n",
      "   +0.6277 if pav<=0.07888057827949524\n",
      "   -0.0000 if cv>=1.1966038942337036\n",
      "   +4.1069 if pa>=0.18421624600887299\n",
      "--------------\n",
      "   +1.8268 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.3050 if cp>=0.005134062003344298\n",
      "   +0.6428 if pa>=-0.05086350068449974\n",
      "   -0.2361 if cp>=0.025735512748360643 & cv<=1.0829041719436647\n",
      "   -2.3320 if cp>=-0.0235149297863245\n",
      "   +0.8789 if cp<=0.026253991574048997\n",
      "   +0.6428 if cp<=0.07211526557803155\n",
      "   -2.0811 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   +1.1815 if cv>=0.1783861517906189 & pa>=0.03013694100081921\n",
      "   -6.4615 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   +1.9802 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   -1.1755 if pa>=0.11454986482858659\n",
      "Run episode 161 with rewards 26.0\n",
      "============ 162 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 1, 1, 0, 1]\n",
      "   +0.4350 if pa>=-0.1113012358546257\n",
      "   +0.4350 if pa>=-0.1415664494037628\n",
      "   +2.2975 if pav<=0.06422646939754487\n",
      "   +0.0000 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   +0.0387 if cp>=0.029651553183794022\n",
      "   +0.4350 if cv<=1.0829041719436647\n",
      "   +0.0790 if cp>=-0.01241636425256728\n",
      "   +0.0790 if cp>=-0.009269407950341702\n",
      "   -0.1418 if pav<=0.07888057827949524\n",
      "   +0.0000 if cv>=1.1966038942337036\n",
      "   +0.0000 if pa>=0.18421624600887299\n",
      "   -2.4233 if cp>=-0.053173284977674484 & pa<=0.16238495707511902 & pav>=0.7918283343315125\n",
      "--------------\n",
      "   -1.3320 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.0370 if cp>=0.005134062003344298\n",
      "   +1.5538 if pa>=-0.05086350068449974\n",
      "   -1.1670 if cp>=-0.0235149297863245\n",
      "   +1.5621 if cp<=0.026253991574048997\n",
      "   +1.5538 if cp<=0.07211526557803155\n",
      "   -0.7387 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   -0.5904 if cv>=0.1783861517906189 & pa>=0.03013694100081921\n",
      "   -3.4415 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -0.7471 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   -0.6374 if pa>=0.11454986482858659\n",
      "   -2.9718 if cp>=-0.026540052145719514 & cv<=0.19839565455913574\n",
      "Run episode 162 with rewards 10.0\n",
      "============ 163 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0]\n",
      "   +0.4306 if pa>=-0.1113012358546257\n",
      "   +0.4306 if pa>=-0.1415664494037628\n",
      "   +0.0652 if pav<=0.06422646939754487\n",
      "   -0.0000 if pa<=0.06994461566209793 & pav<=-0.49467852115631095\n",
      "   -0.0000 if cp>=0.029651553183794022\n",
      "   +0.4306 if cv<=1.0829041719436647\n",
      "   +0.1957 if cp>=-0.01241636425256728\n",
      "   +0.1957 if cp>=-0.009269407950341702\n",
      "   +0.0652 if pav<=0.07888057827949524\n",
      "   -0.0000 if pa>=0.18421624600887299\n",
      "   -0.3068 if cp>=-0.053173284977674484 & pa<=0.16238495707511902 & pav>=0.7918283343315125\n",
      "   -0.4593 if pav>=1.792494773864746\n",
      "--------------\n",
      "   -0.1273 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.3462 if pa>=-0.05086350068449974\n",
      "   -1.6184 if cp>=-0.0235149297863245\n",
      "   -0.3462 if cp<=0.026253991574048997\n",
      "   -0.3462 if cp<=0.07211526557803155\n",
      "   -0.3443 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   -0.0000 if cv>=0.1783861517906189 & pa>=0.03013694100081921\n",
      "   -1.6184 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   +1.8869 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   +0.1157 if pa>=0.11454986482858659\n",
      "   -1.6184 if cp>=-0.026540052145719514 & cv<=0.19839565455913574\n",
      "   -2.2312 if pa>=0.1816900372505188\n",
      "Run episode 163 with rewards 11.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 164 ===========\n",
      "8 actions [0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +1.2031 if pa>=-0.1113012358546257\n",
      "   +1.2031 if pa>=-0.1415664494037628\n",
      "   +0.0021 if pav<=0.06422646939754487\n",
      "   -0.0000 if cp>=0.029651553183794022\n",
      "   +1.2031 if cv<=1.0829041719436647\n",
      "   -0.0000 if cp>=-0.01241636425256728\n",
      "   -0.0000 if cp>=-0.009269407950341702\n",
      "   +0.0021 if pav<=0.07888057827949524\n",
      "   -0.0000 if pa>=0.18421624600887299\n",
      "   +0.4805 if cp>=-0.053173284977674484 & pa<=0.16238495707511902 & pav>=0.7918283343315125\n",
      "   -1.8991 if pav>=1.792494773864746\n",
      "   -2.0558 if cv<=-1.2079447507858276\n",
      "--------------\n",
      "   -0.6945 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.1050 if pa>=-0.05086350068449974\n",
      "   -0.5349 if cp>=-0.0235149297863245\n",
      "   -0.1050 if cp<=0.026253991574048997\n",
      "   -0.1050 if cp<=0.07211526557803155\n",
      "   +1.1259 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   -0.6945 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -2.0601 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   +2.3865 if pa>=0.11454986482858659\n",
      "   -0.5349 if cp>=-0.026540052145719514 & cv<=0.19839565455913574\n",
      "   -0.0000 if pa>=0.1816900372505188\n",
      "   +2.5206 if cp>=-0.13678619265556335 & cv<=-1.2079447507858276\n",
      "Run episode 164 with rewards 8.0\n",
      "============ 165 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +3.6441 if pa>=-0.1113012358546257\n",
      "   +3.6441 if pa>=-0.1415664494037628\n",
      "   +0.0000 if pav<=0.06422646939754487\n",
      "   +0.0000 if cp>=0.029651553183794022\n",
      "   +3.6441 if cv<=1.0829041719436647\n",
      "   +0.0001 if cp>=-0.01241636425256728\n",
      "   +0.0001 if cp>=-0.009269407950341702\n",
      "   +0.0000 if pav<=0.07888057827949524\n",
      "   +0.0000 if cp>=-0.053173284977674484 & pa<=0.16238495707511902 & pav>=0.7918283343315125\n",
      "   +3.6440 if pav>=1.792494773864746\n",
      "   +3.6440 if cv<=-1.2079447507858276\n",
      "   +0.0000 if cp>=0.02220284380018711\n",
      "--------------\n",
      "   -0.6912 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.8473 if pa>=-0.05086350068449974\n",
      "   -0.6063 if cp>=-0.0235149297863245\n",
      "   -1.8473 if cp<=0.026253991574048997\n",
      "   -1.8473 if cp<=0.07211526557803155\n",
      "   -2.5794 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   -0.7266 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -1.8224 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   -3.3640 if pa>=0.11454986482858659\n",
      "   -0.6063 if cp>=-0.026540052145719514 & cv<=0.19839565455913574\n",
      "   -3.3612 if cp>=-0.13678619265556335 & cv<=-1.2079447507858276\n",
      "   +0.9854 if cv>=0.02773205190896988\n",
      "Run episode 165 with rewards 10.0\n",
      "============ 166 ===========\n",
      "19 actions [1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1]\n",
      "   +0.0422 if pa>=-0.1113012358546257\n",
      "   +0.0422 if pa>=-0.1415664494037628\n",
      "   +0.0360 if pav<=0.06422646939754487\n",
      "   +0.0422 if cv<=1.0829041719436647\n",
      "   +0.0421 if cp>=-0.01241636425256728\n",
      "   +0.0420 if cp>=-0.009269407950341702\n",
      "   +0.0360 if pav<=0.07888057827949524\n",
      "   +0.0004 if cp>=-0.053173284977674484 & pa<=0.16238495707511902 & pav>=0.7918283343315125\n",
      "   +0.0000 if pav>=1.792494773864746\n",
      "   +0.0000 if cv<=-1.2079447507858276\n",
      "   +0.0418 if cp>=0.02220284380018711\n",
      "   +0.0360 if cp>=0.029673531651496887\n",
      "--------------\n",
      "   -0.0013 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.0022 if pa>=-0.05086350068449974\n",
      "   -0.0021 if cp>=-0.0235149297863245\n",
      "   -0.0013 if cp<=0.026253991574048997\n",
      "   -0.0022 if cp<=0.07211526557803155\n",
      "   -0.0013 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   -0.0022 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -0.0017 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   +0.0000 if pa>=0.11454986482858659\n",
      "   +0.0000 if cp>=-0.13678619265556335 & cv<=-1.2079447507858276\n",
      "   +0.0000 if cv>=0.02773205190896988\n",
      "   -0.0006 if cp<=0.01093779876828194\n",
      "Run episode 166 with rewards 19.0\n",
      "============ 167 ===========\n",
      "30 actions [1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0]\n",
      "   +0.2315 if pa>=-0.1113012358546257\n",
      "   +0.2315 if pa>=-0.1415664494037628\n",
      "   -0.4666 if pav<=0.06422646939754487\n",
      "   +0.2315 if cv<=1.0829041719436647\n",
      "   -1.1000 if cp>=-0.01241636425256728\n",
      "   +2.4048 if cp>=-0.009269407950341702\n",
      "   -0.4666 if pav<=0.07888057827949524\n",
      "   -1.5268 if cp>=-0.053173284977674484 & pa<=0.16238495707511902 & pav>=0.7918283343315125\n",
      "   +0.0000 if pav>=1.792494773864746\n",
      "   +0.0000 if cp>=0.02220284380018711\n",
      "   +0.0000 if cp>=0.029673531651496887\n",
      "   -1.1277 if cv>=-0.2162771999835968\n",
      "--------------\n",
      "   -3.5081 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.8793 if pa>=-0.05086350068449974\n",
      "   +1.6873 if cp>=-0.0235149297863245\n",
      "   +0.8792 if cp<=0.026253991574048997\n",
      "   +0.8793 if cp<=0.07211526557803155\n",
      "   +1.4436 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   -0.9723 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -2.4798 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   +0.0108 if pa>=0.11454986482858659\n",
      "   +0.0000 if cp>=-0.13678619265556335 & cv<=-1.2079447507858276\n",
      "   +0.8792 if cp<=0.01093779876828194\n",
      "   -3.1749 if cv>=0.17585383355617523\n",
      "Run episode 167 with rewards 30.0\n",
      "============ 168 ===========\n",
      "21 actions [1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.0337 if pa>=-0.1113012358546257\n",
      "   +0.0337 if pa>=-0.1415664494037628\n",
      "   -4.2084 if pav<=0.06422646939754487\n",
      "   +0.0337 if cv<=1.0829041719436647\n",
      "   +0.8689 if cp>=-0.01241636425256728\n",
      "   +0.8689 if cp>=-0.009269407950341702\n",
      "   -0.0061 if pav<=0.07888057827949524\n",
      "   -3.0124 if cp>=-0.053173284977674484 & pa<=0.16238495707511902 & pav>=0.7918283343315125\n",
      "   +0.0000 if cp>=0.02220284380018711\n",
      "   +0.0000 if cp>=0.029673531651496887\n",
      "   -0.4147 if cv>=-0.2162771999835968\n",
      "   +5.4139 if cv>=-0.00461280699819326 & pav<=0.033639769628644005\n",
      "--------------\n",
      "   -6.0250 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +2.5591 if pa>=-0.05086350068449974\n",
      "   +2.2249 if cp>=-0.0235149297863245\n",
      "   +1.7524 if cp<=0.026253991574048997\n",
      "   +1.7524 if cp<=0.07211526557803155\n",
      "   +0.7523 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   -0.1156 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -3.1023 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   +2.5470 if pa>=0.11454986482858659\n",
      "   +0.0743 if cp<=0.01093779876828194\n",
      "   -5.9096 if cv>=0.17585383355617523\n",
      "   -4.7945 if cp>=0.014680569991469383\n",
      "Run episode 168 with rewards 21.0\n",
      "============ 169 ===========\n",
      "36 actions [0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0]\n",
      "   -0.5263 if pa>=-0.1113012358546257\n",
      "   -0.1804 if pa>=-0.1415664494037628\n",
      "   -1.2008 if pav<=0.06422646939754487\n",
      "   -1.2008 if cv<=1.0829041719436647\n",
      "   -0.8894 if cp>=-0.01241636425256728\n",
      "   +2.9606 if cp>=-0.009269407950341702\n",
      "   -1.2008 if pav<=0.07888057827949524\n",
      "   +0.0000 if cp>=-0.053173284977674484 & pa<=0.16238495707511902 & pav>=0.7918283343315125\n",
      "   -0.6745 if cp>=0.02220284380018711\n",
      "   -1.2008 if cv>=-0.2162771999835968\n",
      "   +6.2230 if cv>=-0.00461280699819326 & pav<=0.033639769628644005\n",
      "   +3.1841 if pa>=-0.11794757843017578 & pav>=-0.3092974126338959\n",
      "--------------\n",
      "   -1.2144 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.4009 if pa>=-0.05086350068449974\n",
      "   +1.7186 if cp>=-0.0235149297863245\n",
      "   +0.7942 if cp<=0.026253991574048997\n",
      "   +1.7186 if cp<=0.07211526557803155\n",
      "   +0.0277 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   +1.1646 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   +0.0000 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   +0.0000 if pa>=0.11454986482858659\n",
      "   -5.5046 if cv>=0.17585383355617523\n",
      "   -3.8459 if cp>=0.014680569991469383\n",
      "   -5.2021 if cp<=-0.016846656799316406 & cv>=-0.030385859310626984 & pav>=-0.3092974126338959\n",
      "Run episode 169 with rewards 36.0\n",
      "============ 170 ===========\n",
      "21 actions [0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   -0.0564 if pa>=-0.1113012358546257\n",
      "   -0.0564 if pa>=-0.1415664494037628\n",
      "   +1.7205 if pav<=0.06422646939754487\n",
      "   -0.0563 if cv<=1.0829041719436647\n",
      "   +4.2562 if cp>=-0.01241636425256728\n",
      "   +5.5748 if cp>=-0.009269407950341702\n",
      "   +1.8497 if pav<=0.07888057827949524\n",
      "   +0.0000 if cp>=0.02220284380018711\n",
      "   -0.0553 if cv>=-0.2162771999835968\n",
      "   +1.6924 if cv>=-0.00461280699819326 & pav<=0.033639769628644005\n",
      "   -0.0563 if pa>=-0.11794757843017578 & pav>=-0.3092974126338959\n",
      "   -3.0669 if cp>=-0.02731324173510074\n",
      "--------------\n",
      "   -1.4634 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +1.2173 if pa>=-0.05086350068449974\n",
      "   -1.2653 if cp>=-0.0235149297863245\n",
      "   +1.2173 if cp<=0.026253991574048997\n",
      "   +1.2173 if cp<=0.07211526557803155\n",
      "   +0.1854 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   +2.1314 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -0.9435 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   -2.6592 if cv>=0.17585383355617523\n",
      "   +0.0001 if cp>=0.014680569991469383\n",
      "   -6.8279 if cp<=-0.016846656799316406 & cv>=-0.030385859310626984 & pav>=-0.3092974126338959\n",
      "   +0.1280 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "Run episode 170 with rewards 21.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 171 ===========\n",
      "27 actions [0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1]\n",
      "   -0.3297 if pa>=-0.1113012358546257\n",
      "   -0.3297 if pa>=-0.1415664494037628\n",
      "   +1.2402 if pav<=0.06422646939754487\n",
      "   -0.3297 if cv<=1.0829041719436647\n",
      "   +4.0356 if cp>=-0.01241636425256728\n",
      "   +4.5178 if cp>=-0.009269407950341702\n",
      "   +1.2402 if pav<=0.07888057827949524\n",
      "   +2.8517 if cv>=-0.2162771999835968\n",
      "   +0.4916 if cv>=-0.00461280699819326 & pav<=0.033639769628644005\n",
      "   -0.3297 if pa>=-0.11794757843017578 & pav>=-0.3092974126338959\n",
      "   -5.1336 if cp>=-0.02731324173510074\n",
      "   +2.7111 if cp<=-0.02457897551357746 & cv>=-0.013584508560597897\n",
      "--------------\n",
      "   -0.5595 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.5595 if pa>=-0.05086350068449974\n",
      "   -1.9012 if cp>=-0.0235149297863245\n",
      "   -0.5595 if cp<=0.026253991574048997\n",
      "   -0.5595 if cp<=0.07211526557803155\n",
      "   +2.5970 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   +2.8766 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -0.7850 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   -0.3761 if cv>=0.17585383355617523\n",
      "   -3.1557 if cp<=-0.016846656799316406 & cv>=-0.030385859310626984 & pav>=-0.3092974126338959\n",
      "   +0.6023 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +3.5210 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "Run episode 171 with rewards 27.0\n",
      "============ 172 ===========\n",
      "16 actions [0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0]\n",
      "   -0.6292 if pa>=-0.1113012358546257\n",
      "   +1.5530 if pav<=0.06422646939754487\n",
      "   -0.6292 if cv<=1.0829041719436647\n",
      "   +3.8423 if cp>=-0.01241636425256728\n",
      "   +3.8423 if cp>=-0.009269407950341702\n",
      "   +1.5655 if pav<=0.07888057827949524\n",
      "   +2.0522 if cv>=-0.2162771999835968\n",
      "   +1.5529 if cv>=-0.00461280699819326 & pav<=0.033639769628644005\n",
      "   -0.6292 if pa>=-0.11794757843017578 & pav>=-0.3092974126338959\n",
      "   -4.2760 if cp>=-0.02731324173510074\n",
      "   +0.8641 if cp<=-0.02457897551357746 & cv>=-0.013584508560597897\n",
      "   +1.9024 if cp>=-0.06385265439748763 & cv>=-0.3870550572872162 & pav>=0.24086304605007172\n",
      "--------------\n",
      "   -3.1225 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.4718 if pa>=-0.05086350068449974\n",
      "   +0.5215 if cp>=-0.0235149297863245\n",
      "   -0.4718 if cp<=0.026253991574048997\n",
      "   -0.4718 if cp<=0.07211526557803155\n",
      "   +1.4458 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   +1.2984 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   +2.0865 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   -1.9157 if cp<=-0.016846656799316406 & cv>=-0.030385859310626984 & pav>=-0.3092974126338959\n",
      "   +1.8493 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +3.6817 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   -2.3255 if cp>=-0.00505175534635782 & cv<=-0.20234642326831817\n",
      "Run episode 172 with rewards 16.0\n",
      "============ 173 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.9015 if pa>=-0.1113012358546257\n",
      "   +0.7179 if pav<=0.06422646939754487\n",
      "   -0.9015 if cv<=1.0829041719436647\n",
      "   +0.0000 if cp>=-0.01241636425256728\n",
      "   +0.0000 if cp>=-0.009269407950341702\n",
      "   +0.7179 if pav<=0.07888057827949524\n",
      "   +1.6109 if cv>=-0.2162771999835968\n",
      "   +0.6969 if cv>=-0.00461280699819326 & pav<=0.033639769628644005\n",
      "   -4.0917 if cp>=-0.02731324173510074\n",
      "   +0.7883 if cp<=-0.02457897551357746 & cv>=-0.013584508560597897\n",
      "   +2.0945 if cp>=-0.06385265439748763 & cv>=-0.3870550572872162 & pav>=0.24086304605007172\n",
      "   +0.3946 if cp>=-0.029243746772408485\n",
      "--------------\n",
      "   -1.0942 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.8205 if pa>=-0.05086350068449974\n",
      "   +0.0000 if cp>=-0.0235149297863245\n",
      "   -0.8205 if cp<=0.026253991574048997\n",
      "   -0.0006 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   +0.1123 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   +1.4949 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   -0.8198 if cp<=-0.016846656799316406 & cv>=-0.030385859310626984 & pav>=-0.3092974126338959\n",
      "   +2.4341 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +3.9466 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +0.0000 if cp>=-0.00505175534635782 & cv<=-0.20234642326831817\n",
      "   +1.9674 if cp>=-0.02600123919546604\n",
      "Run episode 173 with rewards 10.0\n",
      "============ 174 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.6322 if pa>=-0.1113012358546257\n",
      "   -0.6265 if pav<=0.06422646939754487\n",
      "   -0.5851 if cv<=1.0829041719436647\n",
      "   -0.6265 if cp>=-0.009269407950341702\n",
      "   -0.6265 if pav<=0.07888057827949524\n",
      "   -0.6265 if cv>=-0.2162771999835968\n",
      "   -0.6265 if cv>=-0.00461280699819326 & pav<=0.033639769628644005\n",
      "   -0.6265 if cp>=-0.02731324173510074\n",
      "   +0.0000 if cp<=-0.02457897551357746 & cv>=-0.013584508560597897\n",
      "   +0.0000 if cp>=-0.06385265439748763 & cv>=-0.3870550572872162 & pav>=0.24086304605007172\n",
      "   -0.6265 if cp>=-0.029243746772408485\n",
      "   -0.2886 if cp<=0.017083643935620785\n",
      "--------------\n",
      "   +0.8936 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.8936 if pa>=-0.05086350068449974\n",
      "   +0.3892 if cp<=0.026253991574048997\n",
      "   +0.0000 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   +0.8936 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   +0.0000 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   +0.0000 if cp<=-0.016846656799316406 & cv>=-0.030385859310626984 & pav>=-0.3092974126338959\n",
      "   +0.0000 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +0.0000 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +0.0000 if cp>=-0.00505175534635782 & cv<=-0.20234642326831817\n",
      "   +0.4517 if cp>=-0.02600123919546604\n",
      "   -0.0766 if cp>=0.03371059969067573\n",
      "Run episode 174 with rewards 9.0\n",
      "============ 175 ===========\n",
      "10 actions [1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.4760 if pa>=-0.1113012358546257\n",
      "   -0.2913 if pav<=0.06422646939754487\n",
      "   -0.2732 if cv<=1.0829041719436647\n",
      "   -0.2913 if cp>=-0.009269407950341702\n",
      "   -0.2913 if pav<=0.07888057827949524\n",
      "   -0.2913 if cv>=-0.2162771999835968\n",
      "   -0.2913 if cv>=-0.00461280699819326 & pav<=0.033639769628644005\n",
      "   -0.2913 if cp>=-0.02731324173510074\n",
      "   +0.0000 if cp>=-0.06385265439748763 & cv>=-0.3870550572872162 & pav>=0.24086304605007172\n",
      "   -0.2913 if cp>=-0.029243746772408485\n",
      "   -0.1316 if cp<=0.017083643935620785\n",
      "   -0.1383 if cp>=0.038069987297058114\n",
      "--------------\n",
      "   +0.1330 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.1330 if pa>=-0.05086350068449974\n",
      "   +0.1330 if cp<=0.026253991574048997\n",
      "   -0.0000 if cv<=-0.03215434700250626 & pa>=-0.028441185131669044\n",
      "   +0.1546 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -0.0000 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   -0.0000 if cp<=-0.016846656799316406 & cv>=-0.030385859310626984 & pav>=-0.3092974126338959\n",
      "   -0.0000 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -0.0000 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +0.1524 if cp>=-0.02600123919546604\n",
      "   +0.0193 if cp>=0.03371059969067573\n",
      "   +0.0298 if pa>=-0.00799544807523489\n",
      "Run episode 175 with rewards 10.0\n",
      "============ 176 ===========\n",
      "9 actions [1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -0.5680 if pa>=-0.1113012358546257\n",
      "   -0.5025 if pav<=0.06422646939754487\n",
      "   -0.4631 if cv<=1.0829041719436647\n",
      "   -0.5025 if cp>=-0.009269407950341702\n",
      "   -0.5025 if pav<=0.07888057827949524\n",
      "   -0.5025 if cv>=-0.2162771999835968\n",
      "   -0.5025 if cv>=-0.00461280699819326 & pav<=0.033639769628644005\n",
      "   -0.5025 if cp>=-0.02731324173510074\n",
      "   -0.5025 if cp>=-0.029243746772408485\n",
      "   -0.3419 if cp<=0.017083643935620785\n",
      "   -0.0394 if cp>=0.038069987297058114\n",
      "   -0.1605 if cp>=0.015772543102502826\n",
      "--------------\n",
      "   +0.5091 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.5091 if pa>=-0.05086350068449974\n",
      "   +0.3771 if cp<=0.026253991574048997\n",
      "   +0.5091 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   +0.0000 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   +0.0000 if cp<=-0.016846656799316406 & cv>=-0.030385859310626984 & pav>=-0.3092974126338959\n",
      "   +0.0000 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +0.0000 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +0.4719 if cp>=-0.02600123919546604\n",
      "   +0.0948 if cp>=0.03371059969067573\n",
      "   +0.3771 if pa>=-0.00799544807523489\n",
      "   +0.1456 if cp>=0.015772543102502826\n",
      "Run episode 176 with rewards 9.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 177 ===========\n",
      "41 actions [1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n",
      "   -2.1677 if pa>=-0.1113012358546257\n",
      "   +0.3851 if pav<=0.06422646939754487\n",
      "   -1.1601 if cv<=1.0829041719436647\n",
      "   +0.8528 if cp>=-0.009269407950341702\n",
      "   +0.3851 if pav<=0.07888057827949524\n",
      "   +0.3851 if cv>=-0.2162771999835968\n",
      "   +0.4618 if cv>=-0.00461280699819326 & pav<=0.033639769628644005\n",
      "   +0.7519 if cp>=-0.02731324173510074\n",
      "   +0.7519 if cp>=-0.029243746772408485\n",
      "   -2.1677 if cp<=0.017083643935620785\n",
      "   +2.5528 if cp>=0.015772543102502826\n",
      "   -0.0768 if pa>=-0.008885621093213558\n",
      "--------------\n",
      "   +0.5681 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.5681 if pa>=-0.05086350068449974\n",
      "   +0.6273 if cp<=0.026253991574048997\n",
      "   +0.0240 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -0.0000 if pa<=0.16434048116207123 & pav>=0.07888057827949524\n",
      "   -0.0000 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -0.0000 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +0.0157 if cp>=-0.02600123919546604\n",
      "   -0.0676 if cp>=0.03371059969067573\n",
      "   -0.0000 if pa>=-0.00799544807523489\n",
      "   -0.0676 if cp>=0.015772543102502826\n",
      "   +0.1684 if cp<=-0.03104888834059238 & cp>=-0.04133600890636444\n",
      "Run episode 177 with rewards 41.0\n",
      "============ 178 ===========\n",
      "23 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1]\n",
      "   -4.0772 if pa>=-0.1113012358546257\n",
      "   -0.3544 if pav<=0.06422646939754487\n",
      "   -0.8316 if cv<=1.0829041719436647\n",
      "   -8.1589 if cp>=-0.009269407950341702\n",
      "   -0.3544 if pav<=0.07888057827949524\n",
      "   +5.6424 if cv>=-0.2162771999835968\n",
      "   -0.0157 if cv>=-0.00461280699819326 & pav<=0.033639769628644005\n",
      "   +4.3525 if cp>=-0.02731324173510074\n",
      "   +4.3525 if cp>=-0.029243746772408485\n",
      "   -2.4063 if cp<=0.017083643935620785\n",
      "   +3.7062 if cp>=0.015772543102502826\n",
      "   +5.6199 if cv<=-0.17933720350265503 & cv>=-0.17933720350265503\n",
      "--------------\n",
      "   +1.9803 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.9249 if pa>=-0.05086350068449974\n",
      "   -2.3896 if cp<=0.026253991574048997\n",
      "   +1.0611 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   +0.8381 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +5.3587 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   -6.1893 if cp>=-0.02600123919546604\n",
      "   -1.7488 if cp>=0.03371059969067573\n",
      "   +0.0000 if pa>=-0.00799544807523489\n",
      "   +1.8591 if cp>=0.015772543102502826\n",
      "   +0.0075 if cp<=-0.03104888834059238 & cp>=-0.04133600890636444\n",
      "   +7.3845 if cp<=0.016467629000544555 & cp>=-0.07787509262561798 & pa>=-0.06423645466566086 & pav<=0.15218895673751837\n",
      "Run episode 178 with rewards 23.0\n",
      "============ 179 ===========\n",
      "16 actions [0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1]\n",
      "   +0.0280 if pa>=-0.1113012358546257\n",
      "   +0.8930 if pav<=0.06422646939754487\n",
      "   +0.0280 if cv<=1.0829041719436647\n",
      "   -2.3000 if cp>=-0.009269407950341702\n",
      "   +1.6439 if pav<=0.07888057827949524\n",
      "   +2.5275 if cv>=-0.2162771999835968\n",
      "   +0.0280 if cp>=-0.02731324173510074\n",
      "   +0.0280 if cp>=-0.029243746772408485\n",
      "   -0.2901 if cp<=0.017083643935620785\n",
      "   +0.3181 if cp>=0.015772543102502826\n",
      "   -0.0000 if cv<=-0.17933720350265503 & cv>=-0.17933720350265503\n",
      "   +1.5046 if cp<=0.0358876995742321 & cv>=-0.06155570819973945\n",
      "--------------\n",
      "   -0.8559 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.8559 if pa>=-0.05086350068449974\n",
      "   -1.4192 if cp<=0.026253991574048997\n",
      "   -0.8559 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   +0.0000 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +3.7072 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   -0.8559 if cp>=-0.02600123919546604\n",
      "   +0.4659 if cp>=0.03371059969067573\n",
      "   +2.7864 if cp>=0.015772543102502826\n",
      "   +0.0000 if cp<=-0.03104888834059238 & cp>=-0.04133600890636444\n",
      "   +0.0000 if cp<=0.016467629000544555 & cp>=-0.07787509262561798 & pa>=-0.06423645466566086 & pav<=0.15218895673751837\n",
      "   +1.1469 if cv<=-0.24116332530975343\n",
      "Run episode 179 with rewards 16.0\n",
      "============ 180 ===========\n",
      "18 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0]\n",
      "   -0.1680 if pa>=-0.1113012358546257\n",
      "   +0.4433 if pav<=0.06422646939754487\n",
      "   -0.1680 if cv<=1.0829041719436647\n",
      "   -0.0000 if cp>=-0.009269407950341702\n",
      "   +0.4433 if pav<=0.07888057827949524\n",
      "   +0.4433 if cv>=-0.2162771999835968\n",
      "   -1.4856 if cp>=-0.02731324173510074\n",
      "   -1.4856 if cp>=-0.029243746772408485\n",
      "   -0.1680 if cp<=0.017083643935620785\n",
      "   -0.0000 if cp>=0.015772543102502826\n",
      "   +0.4433 if cp<=0.0358876995742321 & cv>=-0.06155570819973945\n",
      "   +3.0600 if cp>=-0.03380712866783142\n",
      "--------------\n",
      "   -1.5494 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.6872 if pa>=-0.05086350068449974\n",
      "   -0.6872 if cp<=0.026253991574048997\n",
      "   +0.2232 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -2.9911 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +3.9277 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +0.2232 if cp>=-0.02600123919546604\n",
      "   +0.0000 if cp>=0.03371059969067573\n",
      "   +0.0000 if cp>=0.015772543102502826\n",
      "   -0.0030 if cp<=0.016467629000544555 & cp>=-0.07787509262561798 & pa>=-0.06423645466566086 & pav<=0.15218895673751837\n",
      "   +3.5155 if cv<=-0.24116332530975343\n",
      "   -3.4554 if cp>=-0.03380712866783142\n",
      "Run episode 180 with rewards 18.0\n",
      "============ 181 ===========\n",
      "15 actions [0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -1.2752 if pa>=-0.1113012358546257\n",
      "   +0.1315 if pav<=0.06422646939754487\n",
      "   -1.2752 if cv<=1.0829041719436647\n",
      "   +0.0000 if cp>=-0.009269407950341702\n",
      "   +0.1315 if pav<=0.07888057827949524\n",
      "   +3.3460 if cv>=-0.2162771999835968\n",
      "   +0.0119 if cp>=-0.02731324173510074\n",
      "   +0.0119 if cp>=-0.029243746772408485\n",
      "   -1.2752 if cp<=0.017083643935620785\n",
      "   +0.1315 if cp<=0.0358876995742321 & cv>=-0.06155570819973945\n",
      "   +0.1044 if cp>=-0.03380712866783142\n",
      "   +3.1151 if cp<=-0.07711121290922165\n",
      "--------------\n",
      "   +0.5135 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.7897 if pa>=-0.05086350068449974\n",
      "   -1.7897 if cp<=0.026253991574048997\n",
      "   -0.1669 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -0.7656 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +3.1115 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   -0.1669 if cp>=-0.02600123919546604\n",
      "   +0.0000 if cp>=0.015772543102502826\n",
      "   -0.2686 if cp<=0.016467629000544555 & cp>=-0.07787509262561798 & pa>=-0.06423645466566086 & pav<=0.15218895673751837\n",
      "   +3.6507 if cv<=-0.24116332530975343\n",
      "   -0.2357 if cp>=-0.03380712866783142\n",
      "   +0.7383 if cv<=-0.36121366620063783\n",
      "Run episode 181 with rewards 15.0\n",
      "============ 182 ===========\n",
      "15 actions [0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   -0.2926 if pa>=-0.1113012358546257\n",
      "   +0.1702 if pav<=0.06422646939754487\n",
      "   -0.2926 if cv<=1.0829041719436647\n",
      "   +0.1702 if pav<=0.07888057827949524\n",
      "   +1.7375 if cv>=-0.2162771999835968\n",
      "   +0.0011 if cp>=-0.02731324173510074\n",
      "   +0.0011 if cp>=-0.029243746772408485\n",
      "   -0.2926 if cp<=0.017083643935620785\n",
      "   +0.1702 if cp<=0.0358876995742321 & cv>=-0.06155570819973945\n",
      "   +0.2659 if cp>=-0.03380712866783142\n",
      "   -0.0000 if cp<=-0.07711121290922165\n",
      "   +0.2520 if pa>=0.20936347544193268\n",
      "--------------\n",
      "   -1.2449 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.2449 if pa>=-0.05086350068449974\n",
      "   -1.2449 if cp<=0.026253991574048997\n",
      "   -0.1592 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -0.2261 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +1.6135 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   -0.1592 if cp>=-0.02600123919546604\n",
      "   -0.2696 if cp<=0.016467629000544555 & cp>=-0.07787509262561798 & pa>=-0.06423645466566086 & pav<=0.15218895673751837\n",
      "   +1.7625 if cv<=-0.24116332530975343\n",
      "   -0.5851 if cp>=-0.03380712866783142\n",
      "   +1.7625 if cv<=-0.36121366620063783\n",
      "   -0.1300 if cp>=-0.008188841212540857\n",
      "Run episode 182 with rewards 15.0\n",
      "============ 183 ===========\n",
      "12 actions [0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1]\n",
      "   -0.1674 if pa>=-0.1113012358546257\n",
      "   +0.2185 if pav<=0.06422646939754487\n",
      "   -0.1674 if cv<=1.0829041719436647\n",
      "   +0.2185 if pav<=0.07888057827949524\n",
      "   +0.8559 if cv>=-0.2162771999835968\n",
      "   +1.2746 if cp>=-0.02731324173510074\n",
      "   +1.2746 if cp>=-0.029243746772408485\n",
      "   -0.1122 if cp<=0.017083643935620785\n",
      "   +0.0000 if cp<=0.0358876995742321 & cv>=-0.06155570819973945\n",
      "   +1.2746 if cp>=-0.03380712866783142\n",
      "   +0.0000 if pa>=0.20936347544193268\n",
      "   -3.0152 if cp>=-0.006339060002937909\n",
      "--------------\n",
      "   -1.9120 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.9450 if pa>=-0.05086350068449974\n",
      "   -2.5854 if cp<=0.026253991574048997\n",
      "   -0.8280 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   +0.1507 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +1.6182 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   -0.8280 if cp>=-0.02600123919546604\n",
      "   +0.0000 if cp<=0.016467629000544555 & cp>=-0.07787509262561798 & pa>=-0.06423645466566086 & pav<=0.15218895673751837\n",
      "   +1.7689 if cv<=-0.24116332530975343\n",
      "   -0.8280 if cp>=-0.03380712866783142\n",
      "   +1.7689 if cv<=-0.36121366620063783\n",
      "   -3.1453 if cp<=-0.006339060002937909 & cp>=-0.0410750575363636\n",
      "Run episode 183 with rewards 12.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 184 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.0980 if pa>=-0.1113012358546257\n",
      "   +0.1217 if pav<=0.06422646939754487\n",
      "   +2.0980 if cv<=1.0829041719436647\n",
      "   +0.1217 if pav<=0.07888057827949524\n",
      "   +0.3822 if cv>=-0.2162771999835968\n",
      "   -0.6544 if cp>=-0.02731324173510074\n",
      "   -0.6544 if cp>=-0.029243746772408485\n",
      "   +3.2059 if cp<=0.017083643935620785\n",
      "   -0.6544 if cp>=-0.03380712866783142\n",
      "   -0.0000 if pa>=0.20936347544193268\n",
      "   -0.6565 if cp>=-0.006339060002937909\n",
      "   -2.7240 if cp>=0.02728187181055547 & cv<=-0.1807118147611618\n",
      "--------------\n",
      "   +0.2370 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -2.6644 if pa>=-0.05086350068449974\n",
      "   -4.5510 if cp<=0.026253991574048997\n",
      "   +0.1001 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -2.7182 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +2.5774 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +0.1001 if cp>=-0.02600123919546604\n",
      "   -0.1408 if cv<=-0.24116332530975343\n",
      "   +0.1001 if cp>=-0.03380712866783142\n",
      "   -0.1408 if cv<=-0.36121366620063783\n",
      "   -0.0476 if cp<=-0.006339060002937909 & cp>=-0.0410750575363636\n",
      "   +2.6628 if cp>=0.014604824967682364 & cv<=-0.1807118147611618\n",
      "Run episode 184 with rewards 9.0\n",
      "============ 185 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0]\n",
      "   +0.1973 if pa>=-0.1113012358546257\n",
      "   +0.0109 if pav<=0.06422646939754487\n",
      "   +0.1973 if cv<=1.0829041719436647\n",
      "   +0.0109 if pav<=0.07888057827949524\n",
      "   +0.0205 if cv>=-0.2162771999835968\n",
      "   +0.1025 if cp>=-0.02731324173510074\n",
      "   +0.1542 if cp>=-0.029243746772408485\n",
      "   +0.1973 if cp<=0.017083643935620785\n",
      "   +0.1542 if cp>=-0.03380712866783142\n",
      "   -0.0000 if cp>=-0.006339060002937909\n",
      "   -0.0000 if cp>=0.02728187181055547 & cv<=-0.1807118147611618\n",
      "   -0.0001 if cp<=-0.08475320041179657\n",
      "--------------\n",
      "   -0.0980 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.1213 if pa>=-0.05086350068449974\n",
      "   -0.1213 if cp<=0.026253991574048997\n",
      "   -0.1149 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   -0.0021 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -0.0545 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   -0.0980 if cp>=-0.02600123919546604\n",
      "   -0.0566 if cv<=-0.24116332530975343\n",
      "   -0.1149 if cp>=-0.03380712866783142\n",
      "   -0.0566 if cv<=-0.36121366620063783\n",
      "   +0.0000 if cp>=0.014604824967682364 & cv<=-0.1807118147611618\n",
      "   -0.0588 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "Run episode 185 with rewards 12.0\n",
      "============ 186 ===========\n",
      "17 actions [0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1]\n",
      "   +0.2479 if pa>=-0.1113012358546257\n",
      "   +0.1741 if pav<=0.06422646939754487\n",
      "   +0.2479 if cv<=1.0829041719436647\n",
      "   +0.1741 if pav<=0.07888057827949524\n",
      "   +0.1741 if cv>=-0.2162771999835968\n",
      "   +1.1186 if cp>=-0.02731324173510074\n",
      "   +1.1186 if cp>=-0.029243746772408485\n",
      "   +0.2479 if cp<=0.017083643935620785\n",
      "   +1.1186 if cp>=-0.03380712866783142\n",
      "   +0.0000 if cp>=0.02728187181055547 & cv<=-0.1807118147611618\n",
      "   -1.5964 if cp<=-0.08475320041179657\n",
      "   -2.2795 if pav>=1.9614720344543457\n",
      "--------------\n",
      "   -0.5634 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.1025 if pa>=-0.05086350068449974\n",
      "   -0.1025 if cp<=0.026253991574048997\n",
      "   -0.8898 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   +2.1637 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -1.8680 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   -0.8624 if cp>=-0.02600123919546604\n",
      "   +0.3545 if cv<=-0.24116332530975343\n",
      "   -0.8898 if cp>=-0.03380712866783142\n",
      "   +0.3545 if cv<=-0.36121366620063783\n",
      "   -0.1871 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -2.0906 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "Run episode 186 with rewards 17.0\n",
      "============ 187 ===========\n",
      "13 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0]\n",
      "   +0.6175 if pa>=-0.1113012358546257\n",
      "   +0.1022 if pav<=0.06422646939754487\n",
      "   +0.6175 if cv<=1.0829041719436647\n",
      "   +0.1022 if pav<=0.07888057827949524\n",
      "   +1.0727 if cv>=-0.2162771999835968\n",
      "   -0.0000 if cp>=-0.02731324173510074\n",
      "   -0.0000 if cp>=-0.029243746772408485\n",
      "   +0.6175 if cp<=0.017083643935620785\n",
      "   -0.0000 if cp>=-0.03380712866783142\n",
      "   -3.0043 if cp<=-0.08475320041179657\n",
      "   -0.0000 if pav>=1.9614720344543457\n",
      "   -3.5482 if pav>=1.4362791776657104\n",
      "--------------\n",
      "   -1.6910 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.4854 if cp<=0.026253991574048997\n",
      "   +0.0000 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   +1.3356 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -0.8682 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +0.0000 if cp>=-0.02600123919546604\n",
      "   +0.7080 if cv<=-0.24116332530975343\n",
      "   +0.0000 if cp>=-0.03380712866783142\n",
      "   +0.9953 if cv<=-0.36121366620063783\n",
      "   -2.9852 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -0.4854 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   +3.6996 if pav>=1.4362791776657104\n",
      "Run episode 187 with rewards 13.0\n",
      "============ 188 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1]\n",
      "   +0.3450 if pa>=-0.1113012358546257\n",
      "   +0.0229 if pav<=0.06422646939754487\n",
      "   +0.3450 if cv<=1.0829041719436647\n",
      "   +0.0229 if pav<=0.07888057827949524\n",
      "   +0.6328 if cv>=-0.2162771999835968\n",
      "   +0.0000 if cp>=-0.029243746772408485\n",
      "   +0.3450 if cp<=0.017083643935620785\n",
      "   +0.0449 if cp>=-0.03380712866783142\n",
      "   -2.0528 if cp<=-0.08475320041179657\n",
      "   +0.0000 if pav>=1.9614720344543457\n",
      "   -1.0946 if pav>=1.4362791776657104\n",
      "   -1.2282 if cp<=-0.10704701989889144 & cv<=-0.3474475085735319\n",
      "--------------\n",
      "   -0.6284 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.5224 if cp<=0.026253991574048997\n",
      "   -0.0000 if cp>=-0.029453209787607192 & pa>=-0.06627395823597895\n",
      "   +0.5453 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -0.9854 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +1.0491 if cv<=-0.24116332530975343\n",
      "   -0.0823 if cp>=-0.03380712866783142\n",
      "   +1.0491 if cv<=-0.36121366620063783\n",
      "   -1.9936 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -0.5224 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   +1.3320 if pav>=1.4362791776657104\n",
      "   +0.4255 if cp<=-0.06667464599013327 & cv>=-0.6980578660964966\n",
      "Run episode 188 with rewards 12.0\n",
      "============ 189 ===========\n",
      "11 actions [0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1]\n",
      "   +0.2126 if pa>=-0.1113012358546257\n",
      "   +0.3312 if pav<=0.06422646939754487\n",
      "   +0.2126 if cv<=1.0829041719436647\n",
      "   +0.3312 if pav<=0.07888057827949524\n",
      "   +0.9090 if cv>=-0.2162771999835968\n",
      "   +0.2126 if cp<=0.017083643935620785\n",
      "   -1.0283 if cp>=-0.03380712866783142\n",
      "   -0.1031 if cp<=-0.08475320041179657\n",
      "   +0.0000 if pav>=1.9614720344543457\n",
      "   -1.8382 if pav>=1.4362791776657104\n",
      "   +0.3100 if cp<=-0.10704701989889144 & cv<=-0.3474475085735319\n",
      "   +2.2307 if cp>=-0.0023679188219830347\n",
      "--------------\n",
      "   -2.4595 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.2031 if cp<=0.026253991574048997\n",
      "   -0.7600 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +0.1583 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +0.6380 if cv<=-0.24116332530975343\n",
      "   +0.0438 if cp>=-0.03380712866783142\n",
      "   +2.2564 if cv<=-0.36121366620063783\n",
      "   -0.7261 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -1.3204 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   +1.3099 if pav>=1.4362791776657104\n",
      "   -0.8916 if cp<=-0.06667464599013327 & cv>=-0.6980578660964966\n",
      "   -2.7025 if cp<=-0.02157978191971778 & cv>=-0.7444406032562256\n",
      "Run episode 189 with rewards 11.0\n",
      "============ 190 ===========\n",
      "13 actions [0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0]\n",
      "   +0.3348 if pa>=-0.1113012358546257\n",
      "   +0.5924 if pav<=0.06422646939754487\n",
      "   +0.3348 if cv<=1.0829041719436647\n",
      "   +0.5924 if pav<=0.07888057827949524\n",
      "   +2.2685 if cv>=-0.2162771999835968\n",
      "   +0.3348 if cp<=0.017083643935620785\n",
      "   -1.5557 if cp>=-0.03380712866783142\n",
      "   +2.0433 if cp<=-0.08475320041179657\n",
      "   -0.4360 if pav>=1.4362791776657104\n",
      "   +2.0389 if cp<=-0.10704701989889144 & cv<=-0.3474475085735319\n",
      "   -0.0000 if cp>=-0.0023679188219830347\n",
      "   -1.5557 if cp>=-0.029719324782490727\n",
      "--------------\n",
      "   -0.1536 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.8283 if cp<=0.026253991574048997\n",
      "   +1.4178 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -0.1984 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +1.2194 if cv<=-0.24116332530975343\n",
      "   +1.2194 if cv<=-0.36121366620063783\n",
      "   -2.0812 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +1.1593 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   +0.4162 if pav>=1.4362791776657104\n",
      "   -0.7365 if cp<=-0.06667464599013327 & cv>=-0.6980578660964966\n",
      "   -2.3415 if cp<=-0.02157978191971778 & cv>=-0.7444406032562256\n",
      "   -0.1536 if cp>=-0.029719324782490727\n",
      "Run episode 190 with rewards 13.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 191 ===========\n",
      "14 actions [0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0]\n",
      "   +0.1701 if pa>=-0.1113012358546257\n",
      "   +0.0213 if pav<=0.06422646939754487\n",
      "   +0.1701 if cv<=1.0829041719436647\n",
      "   +0.0213 if pav<=0.07888057827949524\n",
      "   +0.2316 if cv>=-0.2162771999835968\n",
      "   +0.1701 if cp<=0.017083643935620785\n",
      "   +0.8480 if cp>=-0.03380712866783142\n",
      "   +1.0174 if cp<=-0.08475320041179657\n",
      "   +0.0000 if pav>=1.4362791776657104\n",
      "   -0.1304 if cp<=-0.10704701989889144 & cv<=-0.3474475085735319\n",
      "   +0.4470 if cp>=-0.029719324782490727\n",
      "   -1.7476 if pav>=1.432715654373169\n",
      "--------------\n",
      "   -1.4197 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.1544 if cp<=0.026253991574048997\n",
      "   +3.4260 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -2.4253 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +1.0006 if cv<=-0.24116332530975343\n",
      "   +1.0006 if cv<=-0.36121366620063783\n",
      "   -1.6412 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +0.1544 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   +0.0000 if pav>=1.4362791776657104\n",
      "   -1.8546 if cp<=-0.06667464599013327 & cv>=-0.6980578660964966\n",
      "   -2.9048 if cp<=-0.02157978191971778 & cv>=-0.7444406032562256\n",
      "   -0.8120 if cp>=-0.021291512995958328\n",
      "Run episode 191 with rewards 14.0\n",
      "============ 192 ===========\n",
      "14 actions [0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1]\n",
      "   -0.8735 if pa>=-0.1113012358546257\n",
      "   +0.3630 if pav<=0.06422646939754487\n",
      "   -0.8735 if cv<=1.0829041719436647\n",
      "   +0.3630 if pav<=0.07888057827949524\n",
      "   +0.3630 if cv>=-0.2162771999835968\n",
      "   -0.8735 if cp<=0.017083643935620785\n",
      "   +2.0814 if cp>=-0.03380712866783142\n",
      "   +3.8337 if cp<=-0.08475320041179657\n",
      "   -1.3750 if cp<=-0.10704701989889144 & cv<=-0.3474475085735319\n",
      "   +2.0814 if cp>=-0.029719324782490727\n",
      "   +0.0000 if pav>=1.432715654373169\n",
      "   +3.9275 if cp<=-0.056534332036972036 & cp>=-0.11377048045396805 & cv>=-0.45968279838562\n",
      "--------------\n",
      "   -3.7212 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.3026 if cp<=0.026253991574048997\n",
      "   +1.5469 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -1.0098 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +0.5370 if cv<=-0.24116332530975343\n",
      "   +0.5370 if cv<=-0.36121366620063783\n",
      "   +1.7651 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +0.5370 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   +0.1996 if cp<=-0.06667464599013327 & cv>=-0.6980578660964966\n",
      "   -2.8823 if cp<=-0.02157978191971778 & cv>=-0.7444406032562256\n",
      "   -0.4467 if cp>=-0.021291512995958328\n",
      "   +2.0319 if cp<=-0.11377048045396805\n",
      "Run episode 192 with rewards 14.0\n",
      "============ 193 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 1, 1]\n",
      "   +0.0319 if pa>=-0.1113012358546257\n",
      "   +0.0479 if pav<=0.06422646939754487\n",
      "   +0.0319 if cv<=1.0829041719436647\n",
      "   +0.0479 if pav<=0.07888057827949524\n",
      "   +0.0966 if cv>=-0.2162771999835968\n",
      "   +0.0319 if cp<=0.017083643935620785\n",
      "   +1.2939 if cp>=-0.03380712866783142\n",
      "   +1.6698 if cp<=-0.08475320041179657\n",
      "   +0.2331 if cp<=-0.10704701989889144 & cv<=-0.3474475085735319\n",
      "   +1.2939 if cp>=-0.029719324782490727\n",
      "   +1.2187 if cp<=-0.056534332036972036 & cp>=-0.11377048045396805 & cv>=-0.45968279838562\n",
      "   -2.2399 if pav>=1.4536411762237549\n",
      "--------------\n",
      "   -1.6048 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.4060 if cp<=0.026253991574048997\n",
      "   -0.9385 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +0.6966 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   -0.2418 if cv<=-0.24116332530975343\n",
      "   -0.2418 if cv<=-0.36121366620063783\n",
      "   +2.4423 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +1.4597 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   -1.6023 if cp<=-0.02157978191971778 & cv>=-0.7444406032562256\n",
      "   -1.8657 if cp>=-0.021291512995958328\n",
      "   -1.4380 if cp<=-0.11377048045396805\n",
      "   -0.1037 if cp>=0.011412368156015873\n",
      "Run episode 193 with rewards 9.0\n",
      "============ 194 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0269 if pav<=0.06422646939754487\n",
      "   +1.1386 if cv<=1.0829041719436647\n",
      "   +0.0269 if pav<=0.07888057827949524\n",
      "   +0.0517 if cv>=-0.2162771999835968\n",
      "   +1.0597 if cp<=0.017083643935620785\n",
      "   -0.5045 if cp>=-0.03380712866783142\n",
      "   -0.0000 if cp<=-0.08475320041179657\n",
      "   -0.0000 if cp<=-0.10704701989889144 & cv<=-0.3474475085735319\n",
      "   +0.1899 if cp>=-0.029719324782490727\n",
      "   -0.0000 if cp<=-0.056534332036972036 & cp>=-0.11377048045396805 & cv>=-0.45968279838562\n",
      "   -0.7697 if pav>=1.4536411762237549\n",
      "   +1.9512 if cv>=-0.9505589485168457\n",
      "--------------\n",
      "   -0.3810 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.9824 if cp<=0.026253991574048997\n",
      "   -1.9769 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +0.7166 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   -0.6754 if cv<=-0.24116332530975343\n",
      "   -0.6754 if cv<=-0.36121366620063783\n",
      "   -0.0942 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -1.3920 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   -0.0000 if cp<=-0.02157978191971778 & cv>=-0.7444406032562256\n",
      "   -0.8882 if cp>=-0.021291512995958328\n",
      "   -0.0000 if cp<=-0.11377048045396805\n",
      "   +1.2978 if pav>=1.8280446529388428\n",
      "Run episode 194 with rewards 9.0\n",
      "============ 195 ===========\n",
      "17 actions [0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0]\n",
      "   +0.1725 if pav<=0.06422646939754487\n",
      "   +0.4400 if cv<=1.0829041719436647\n",
      "   +0.1725 if pav<=0.07888057827949524\n",
      "   +0.3839 if cv>=-0.2162771999835968\n",
      "   +0.4400 if cp<=0.017083643935620785\n",
      "   +0.0000 if cp>=-0.03380712866783142\n",
      "   -0.1115 if cp<=-0.08475320041179657\n",
      "   +0.0000 if cp>=-0.029719324782490727\n",
      "   +0.0000 if cp<=-0.056534332036972036 & cp>=-0.11377048045396805 & cv>=-0.45968279838562\n",
      "   -0.1014 if pav>=1.4536411762237549\n",
      "   +0.5414 if cv>=-0.9505589485168457\n",
      "   +0.0081 if cp<=-0.058446843922138204 & cp>=-0.07993922680616379\n",
      "--------------\n",
      "   -0.1038 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.8034 if cp<=0.026253991574048997\n",
      "   +0.9072 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -0.0706 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +0.8366 if cv<=-0.24116332530975343\n",
      "   +0.8366 if cv<=-0.36121366620063783\n",
      "   -1.7509 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -1.7509 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   -0.2700 if cp<=-0.02157978191971778 & cv>=-0.7444406032562256\n",
      "   +0.0000 if cp>=-0.021291512995958328\n",
      "   +5.4476 if pav>=1.8280446529388428\n",
      "   +5.4477 if cp<=-0.11161622703075409\n",
      "Run episode 195 with rewards 17.0\n",
      "============ 196 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 1, 0, 0]\n",
      "   +2.7206 if pav<=0.06422646939754487\n",
      "   -0.7140 if cv<=1.0829041719436647\n",
      "   +2.7206 if pav<=0.07888057827949524\n",
      "   -0.6134 if cv>=-0.2162771999835968\n",
      "   +1.9993 if cp<=0.017083643935620785\n",
      "   +0.4577 if cp>=-0.03380712866783142\n",
      "   +0.0000 if cp<=-0.08475320041179657\n",
      "   -0.1529 if cp>=-0.029719324782490727\n",
      "   -1.7886 if pav>=1.4536411762237549\n",
      "   -0.5705 if cv>=-0.9505589485168457\n",
      "   -0.1435 if cp<=-0.058446843922138204 & cp>=-0.07993922680616379\n",
      "   +4.3951 if cp>=0.02213576324284077 & cv<=-0.21572406589984894\n",
      "--------------\n",
      "   +2.6289 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -3.9441 if cp<=0.026253991574048997\n",
      "   +0.3998 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +2.3868 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +1.7667 if cv<=-0.24116332530975343\n",
      "   +1.7667 if cv<=-0.36121366620063783\n",
      "   -1.7673 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -1.7673 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   -1.6045 if cp<=-0.02157978191971778 & cv>=-0.7444406032562256\n",
      "   +0.0000 if pav>=1.8280446529388428\n",
      "   +0.0000 if cp<=-0.11161622703075409\n",
      "   -3.4916 if cp>=0.028132034465670586\n",
      "Run episode 196 with rewards 9.0\n",
      "============ 197 ===========\n",
      "34 actions [0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1]\n",
      "   +0.0453 if pav<=0.06422646939754487\n",
      "   -1.2253 if cv<=1.0829041719436647\n",
      "   +0.0453 if pav<=0.07888057827949524\n",
      "   +0.0884 if cv>=-0.2162771999835968\n",
      "   -1.2253 if cp<=0.017083643935620785\n",
      "   +0.0000 if cp>=-0.03380712866783142\n",
      "   +0.0000 if cp>=-0.029719324782490727\n",
      "   -1.7128 if pav>=1.4536411762237549\n",
      "   +2.1598 if cv>=-0.9505589485168457\n",
      "   +0.1700 if cp<=-0.058446843922138204 & cp>=-0.07993922680616379\n",
      "   +0.0000 if cp>=0.02213576324284077 & cv<=-0.21572406589984894\n",
      "   -3.3338 if pa>=0.17553935945034027\n",
      "--------------\n",
      "   -0.1607 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.5657 if cp<=0.026253991574048997\n",
      "   +0.7264 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +0.0000 if cp>=-0.05084318295121193 & cv<=-0.2179044485092163\n",
      "   +0.6517 if cv<=-0.24116332530975343\n",
      "   +0.7264 if cv<=-0.36121366620063783\n",
      "   -2.2156 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -2.9026 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   -0.7503 if cp<=-0.02157978191971778 & cv>=-0.7444406032562256\n",
      "   +2.6484 if cp<=-0.11161622703075409\n",
      "   +0.0000 if cp>=0.028132034465670586\n",
      "   +3.3354 if pa>=0.17553935945034027\n",
      "Run episode 197 with rewards 34.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 198 ===========\n",
      "27 actions [0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1]\n",
      "   +3.8942 if pav<=0.06422646939754487\n",
      "   -2.5675 if cv<=1.0829041719436647\n",
      "   +3.8942 if pav<=0.07888057827949524\n",
      "   -2.4123 if cv>=-0.2162771999835968\n",
      "   -2.5675 if cp<=0.017083643935620785\n",
      "   -0.0000 if cp>=-0.03380712866783142\n",
      "   -0.0000 if pav>=1.4536411762237549\n",
      "   +2.4271 if cv>=-0.9505589485168457\n",
      "   +3.3819 if cp<=-0.058446843922138204 & cp>=-0.07993922680616379\n",
      "   -0.0000 if cp>=0.02213576324284077 & cv<=-0.21572406589984894\n",
      "   -2.7660 if pa>=0.17553935945034027\n",
      "   +2.9991 if pav<=0.8458609223365784 & pav>=-0.011459403089247628\n",
      "--------------\n",
      "   -1.0897 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.2789 if cp<=0.026253991574048997\n",
      "   +4.8094 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -2.9633 if cv<=-0.24116332530975343\n",
      "   -2.9633 if cv<=-0.36121366620063783\n",
      "   -4.4834 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -0.2790 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   -2.0137 if cp<=-0.02157978191971778 & cv>=-0.7444406032562256\n",
      "   +2.3721 if cp<=-0.11161622703075409\n",
      "   -0.0000 if cp>=0.028132034465670586\n",
      "   +1.6779 if pa>=0.17553935945034027\n",
      "   +4.8660 if cv<=-0.419759601354599\n",
      "Run episode 198 with rewards 27.0\n",
      "============ 199 ===========\n",
      "14 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1]\n",
      "   +3.2321 if pav<=0.06422646939754487\n",
      "   -1.5682 if cv<=1.0829041719436647\n",
      "   +3.2321 if pav<=0.07888057827949524\n",
      "   +1.0862 if cv>=-0.2162771999835968\n",
      "   -1.5682 if cp<=0.017083643935620785\n",
      "   -0.0000 if pav>=1.4536411762237549\n",
      "   +0.0695 if cv>=-0.9505589485168457\n",
      "   -1.6377 if cp<=-0.058446843922138204 & cp>=-0.07993922680616379\n",
      "   -0.0000 if cp>=0.02213576324284077 & cv<=-0.21572406589984894\n",
      "   -1.2245 if pa>=0.17553935945034027\n",
      "   +2.1240 if pav<=0.8458609223365784 & pav>=-0.011459403089247628\n",
      "   -2.3812 if cp>=-0.034373172372579565\n",
      "--------------\n",
      "   -0.3487 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +2.6076 if cp<=0.026253991574048997\n",
      "   +5.5391 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -2.9691 if cv<=-0.24116332530975343\n",
      "   -2.9691 if cv<=-0.36121366620063783\n",
      "   -3.0306 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -3.5306 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   -0.7131 if cp<=-0.02157978191971778 & cv>=-0.7444406032562256\n",
      "   -0.0165 if cp<=-0.11161622703075409\n",
      "   -0.8802 if pa>=0.17553935945034027\n",
      "   +5.2256 if cv<=-0.419759601354599\n",
      "   -2.8398 if cp>=-0.014123460277915001\n",
      "Run episode 199 with rewards 14.0\n",
      "============ 200 ===========\n",
      "14 actions [0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1]\n",
      "   +0.4849 if pav<=0.06422646939754487\n",
      "   -0.9962 if cv<=1.0829041719436647\n",
      "   +0.4849 if pav<=0.07888057827949524\n",
      "   +1.6399 if cv>=-0.2162771999835968\n",
      "   -0.6613 if cp<=0.017083643935620785\n",
      "   -0.2300 if pav>=1.4536411762237549\n",
      "   -0.7662 if cv>=-0.9505589485168457\n",
      "   -0.2300 if cp<=-0.058446843922138204 & cp>=-0.07993922680616379\n",
      "   -0.0972 if pa>=0.17553935945034027\n",
      "   +2.2178 if pav<=0.8458609223365784 & pav>=-0.011459403089247628\n",
      "   -1.8379 if cp>=-0.034373172372579565\n",
      "   +0.2519 if cv<=-0.6533100008964539\n",
      "--------------\n",
      "   -3.4526 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.4467 if cp<=0.026253991574048997\n",
      "   +0.8038 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -0.8998 if cv<=-0.24116332530975343\n",
      "   -0.8998 if cv<=-0.36121366620063783\n",
      "   -1.9462 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -1.5056 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   -1.2643 if cp<=-0.02157978191971778 & cv>=-0.7444406032562256\n",
      "   +0.0711 if pa>=0.17553935945034027\n",
      "   +1.5474 if cv<=-0.419759601354599\n",
      "   -0.3995 if cp>=-0.014123460277915001\n",
      "   -0.4081 if cv>=-0.5681428074836731\n",
      "Run episode 200 with rewards 14.0\n",
      "============ 201 ===========\n",
      "9 actions [0, 0, 0, 0, 1, 0, 0, 0, 0]\n",
      "   +0.4749 if pav<=0.06422646939754487\n",
      "   +0.8964 if cv<=1.0829041719436647\n",
      "   +0.4749 if pav<=0.07888057827949524\n",
      "   +1.5861 if cv>=-0.2162771999835968\n",
      "   +2.6942 if cp<=0.017083643935620785\n",
      "   +4.1442 if pav>=1.4536411762237549\n",
      "   -3.2477 if cv>=-0.9505589485168457\n",
      "   +0.0000 if cp<=-0.058446843922138204 & cp>=-0.07993922680616379\n",
      "   +0.4443 if pav<=0.8458609223365784 & pav>=-0.011459403089247628\n",
      "   -3.3425 if cp>=-0.034373172372579565\n",
      "   +0.4151 if cv<=-0.6533100008964539\n",
      "   +2.8878 if cp>=0.009764324314892301\n",
      "--------------\n",
      "   -1.0256 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -1.9159 if cp<=0.026253991574048997\n",
      "   -4.0195 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -0.0065 if cv<=-0.24116332530975343\n",
      "   -0.0065 if cv<=-0.36121366620063783\n",
      "   -1.5943 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -1.5949 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   -0.7679 if cp<=-0.02157978191971778 & cv>=-0.7444406032562256\n",
      "   +0.7974 if cv<=-0.419759601354599\n",
      "   +0.1894 if cp>=-0.014123460277915001\n",
      "   -1.0256 if cv>=-0.5681428074836731\n",
      "   -3.3482 if cv>=-0.604309904575348\n",
      "Run episode 201 with rewards 9.0\n",
      "============ 202 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1]\n",
      "   +0.0391 if pav<=0.06422646939754487\n",
      "   -0.3003 if cv<=1.0829041719436647\n",
      "   +0.0391 if pav<=0.07888057827949524\n",
      "   +0.0732 if cv>=-0.2162771999835968\n",
      "   -0.3735 if cp<=0.017083643935620785\n",
      "   +0.0227 if pav>=1.4536411762237549\n",
      "   -0.2846 if cv>=-0.9505589485168457\n",
      "   +0.0785 if pav<=0.8458609223365784 & pav>=-0.011459403089247628\n",
      "   -0.3229 if cp>=-0.034373172372579565\n",
      "   -0.7037 if cv<=-0.6533100008964539\n",
      "   +0.1176 if cp>=0.009764324314892301\n",
      "   -1.1322 if cp>=-0.014322362095117567 & cv<=-0.7062352180480956\n",
      "--------------\n",
      "   -0.5377 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.8717 if cp<=0.026253991574048997\n",
      "   +0.0001 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -0.3340 if cv<=-0.36121366620063783\n",
      "   -1.0530 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -1.2069 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   +0.0000 if cp<=-0.02157978191971778 & cv>=-0.7444406032562256\n",
      "   -0.3340 if cv<=-0.419759601354599\n",
      "   +0.3351 if cp>=-0.014123460277915001\n",
      "   -2.0501 if cv>=-0.5681428074836731\n",
      "   -2.0501 if cv>=-0.604309904575348\n",
      "   -0.1539 if cp<=-0.014322362095117567 & cv>=-0.7062352180480956\n",
      "Run episode 202 with rewards 12.0\n",
      "============ 203 ===========\n",
      "12 actions [0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1]\n",
      "   +0.2934 if pav<=0.06422646939754487\n",
      "   -0.9234 if cv<=1.0829041719436647\n",
      "   +0.2934 if pav<=0.07888057827949524\n",
      "   +0.2934 if cv>=-0.2162771999835968\n",
      "   -1.9722 if cp<=0.017083643935620785\n",
      "   +0.2670 if cv>=-0.9505589485168457\n",
      "   +1.4527 if pav<=0.8458609223365784 & pav>=-0.011459403089247628\n",
      "   -0.6530 if cp>=-0.034373172372579565\n",
      "   -0.2705 if cv<=-0.6533100008964539\n",
      "   -0.5614 if cp>=0.009764324314892301\n",
      "   +0.0000 if cp>=-0.014322362095117567 & cv<=-0.7062352180480956\n",
      "   +1.2307 if cp<=-0.025732863694429394\n",
      "--------------\n",
      "   -1.9906 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +0.1281 if cp<=0.026253991574048997\n",
      "   +0.4765 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +0.1281 if cv<=-0.36121366620063783\n",
      "   -1.2871 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -2.3233 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   +0.1281 if cv<=-0.419759601354599\n",
      "   +0.9810 if cp>=-0.014123460277915001\n",
      "   -1.9906 if cv>=-0.5681428074836731\n",
      "   -1.9906 if cv>=-0.604309904575348\n",
      "   -0.7407 if cp<=-0.014322362095117567 & cv>=-0.7062352180480956\n",
      "   -0.3028 if cp>=0.02816140465438366\n",
      "Run episode 203 with rewards 12.0\n",
      "============ 204 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.0197 if pav<=0.06422646939754487\n",
      "   +0.3552 if cv<=1.0829041719436647\n",
      "   +0.0197 if pav<=0.07888057827949524\n",
      "   +0.3520 if cv>=-0.2162771999835968\n",
      "   -0.4716 if cp<=0.017083643935620785\n",
      "   +0.5179 if cv>=-0.9505589485168457\n",
      "   -2.8929 if pav<=0.8458609223365784 & pav>=-0.011459403089247628\n",
      "   +0.5179 if cp>=-0.034373172372579565\n",
      "   +0.0489 if cv<=-0.6533100008964539\n",
      "   +0.8268 if cp>=0.009764324314892301\n",
      "   -0.1627 if cp<=-0.025732863694429394\n",
      "   +2.8792 if cp<=-0.07634420990943908\n",
      "--------------\n",
      "   -2.2276 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -2.4792 if cp<=0.026253991574048997\n",
      "   -0.1535 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +1.2206 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -4.3420 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   -0.2516 if cv<=-0.419759601354599\n",
      "   -0.8259 if cp>=-0.014123460277915001\n",
      "   -2.2276 if cv>=-0.5681428074836731\n",
      "   -0.8259 if cv>=-0.604309904575348\n",
      "   -0.0000 if cp<=-0.014322362095117567 & cv>=-0.7062352180480956\n",
      "   -0.0000 if cp>=0.02816140465438366\n",
      "   +3.6858 if cp>=-0.005358449881896365\n",
      "Run episode 204 with rewards 10.0\n",
      "============ 205 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +0.7927 if cv<=1.0829041719436647\n",
      "   +0.1092 if pav<=0.07888057827949524\n",
      "   +0.2169 if cv>=-0.2162771999835968\n",
      "   +0.4939 if cp<=0.017083643935620785\n",
      "   +0.7016 if cv>=-0.9505589485168457\n",
      "   +0.2266 if pav<=0.8458609223365784 & pav>=-0.011459403089247628\n",
      "   +0.7992 if cp>=-0.034373172372579565\n",
      "   +0.4939 if cv<=-0.6533100008964539\n",
      "   +0.2988 if cp>=0.009764324314892301\n",
      "   +0.0911 if cp<=-0.025732863694429394\n",
      "   -0.0491 if cp<=-0.07634420990943908\n",
      "   +0.4028 if cp<=0.012251720204949383 & cp>=-0.014610572904348373\n",
      "--------------\n",
      "   -0.7165 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   -0.9436 if cp<=0.026253991574048997\n",
      "   +0.3031 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -0.5339 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +0.0000 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   -0.8099 if cv<=-0.419759601354599\n",
      "   -1.0820 if cp>=-0.014123460277915001\n",
      "   -0.7221 if cv>=-0.5681428074836731\n",
      "   -0.7221 if cv>=-0.604309904575348\n",
      "   +0.0000 if cp<=-0.014322362095117567 & cv>=-0.7062352180480956\n",
      "   -0.8556 if cp>=-0.005358449881896365\n",
      "   -0.7221 if cp>=0.012251720204949383\n",
      "Run episode 205 with rewards 10.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 206 ===========\n",
      "22 actions [0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   -0.4717 if cv<=1.0829041719436647\n",
      "   +0.0262 if pav<=0.07888057827949524\n",
      "   +0.0500 if cv>=-0.2162771999835968\n",
      "   -0.4717 if cp<=0.017083643935620785\n",
      "   +1.2028 if cv>=-0.9505589485168457\n",
      "   +0.0879 if pav<=0.8458609223365784 & pav>=-0.011459403089247628\n",
      "   +1.2028 if cp>=-0.034373172372579565\n",
      "   -0.5596 if cv<=-0.6533100008964539\n",
      "   +0.0000 if cp>=0.009764324314892301\n",
      "   -0.8000 if cp<=-0.025732863694429394\n",
      "   +0.3283 if cp<=0.012251720204949383 & cp>=-0.014610572904348373\n",
      "   -5.4527 if pa>=0.16876693069934845\n",
      "--------------\n",
      "   -0.4657 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +2.6824 if cp<=0.026253991574048997\n",
      "   +4.6212 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -2.8467 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -0.1434 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   +3.1481 if cv<=-0.419759601354599\n",
      "   -1.3548 if cp>=-0.014123460277915001\n",
      "   -0.6440 if cv>=-0.5681428074836731\n",
      "   -0.6440 if cv>=-0.604309904575348\n",
      "   -0.6440 if cp>=-0.005358449881896365\n",
      "   +0.0000 if cp>=0.012251720204949383\n",
      "   -3.7403 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "Run episode 206 with rewards 22.0\n",
      "============ 207 ===========\n",
      "47 actions [1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0]\n",
      "   +0.5951 if cv<=1.0829041719436647\n",
      "   -0.8984 if pav<=0.07888057827949524\n",
      "   -0.9141 if cv>=-0.2162771999835968\n",
      "   +0.5951 if cp<=0.017083643935620785\n",
      "   +0.5951 if cv>=-0.9505589485168457\n",
      "   +0.0977 if pav<=0.8458609223365784 & pav>=-0.011459403089247628\n",
      "   -0.1602 if cp>=-0.034373172372579565\n",
      "   -3.2805 if cv<=-0.6533100008964539\n",
      "   -1.9103 if cp<=-0.025732863694429394\n",
      "   +0.7483 if cp<=0.012251720204949383 & cp>=-0.014610572904348373\n",
      "   -0.3593 if pa>=0.16876693069934845\n",
      "   -1.7667 if pa>=0.15067561864852907\n",
      "--------------\n",
      "   +1.0482 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +1.8602 if cp<=0.026253991574048997\n",
      "   +4.2345 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +0.9262 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +1.9227 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   +0.8120 if cv<=-0.419759601354599\n",
      "   -0.0373 if cp>=-0.014123460277915001\n",
      "   -2.4125 if cv>=-0.5681428074836731\n",
      "   -2.4308 if cv>=-0.604309904575348\n",
      "   -0.0000 if cp>=-0.005358449881896365\n",
      "   -4.2322 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +1.1819 if cv<=-0.5488481998443604 & pa<=0.16868769824504853 & pav>=0.6717349648475648\n",
      "Run episode 207 with rewards 47.0\n",
      "============ 208 ===========\n",
      "25 actions [0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   -0.4367 if cv<=1.0829041719436647\n",
      "   -4.7239 if pav<=0.07888057827949524\n",
      "   -2.9005 if cv>=-0.2162771999835968\n",
      "   -1.3091 if cp<=0.017083643935620785\n",
      "   +3.7815 if cv>=-0.9505589485168457\n",
      "   +1.8208 if cp>=-0.034373172372579565\n",
      "   -2.8275 if cv<=-0.6533100008964539\n",
      "   -2.0065 if cp<=-0.025732863694429394\n",
      "   +1.9936 if cp<=0.012251720204949383 & cp>=-0.014610572904348373\n",
      "   +0.0000 if pa>=0.16876693069934845\n",
      "   +0.0001 if pa>=0.15067561864852907\n",
      "   +4.9365 if pav<=-0.049893178045749664\n",
      "--------------\n",
      "   -0.3452 if cv>=-0.5352908611297608 & pa>=-0.0615288682281971\n",
      "   +2.2430 if cp<=0.026253991574048997\n",
      "   +1.4513 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -1.7822 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +3.1811 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   +2.6273 if cv<=-0.419759601354599\n",
      "   -4.4051 if cp>=-0.014123460277915001\n",
      "   -0.3844 if cv>=-0.5681428074836731\n",
      "   -1.8491 if cv>=-0.604309904575348\n",
      "   -2.5876 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   -2.3288 if cv<=-0.5488481998443604 & pa<=0.16868769824504853 & pav>=0.6717349648475648\n",
      "   -1.5238 if cp>=-0.07298106253147126 & pav<=-0.049893178045749664\n",
      "Run episode 208 with rewards 25.0\n",
      "============ 209 ===========\n",
      "11 actions [0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1]\n",
      "   -0.9730 if cv<=1.0829041719436647\n",
      "   -0.4353 if pav<=0.07888057827949524\n",
      "   -0.0199 if cv>=-0.2162771999835968\n",
      "   -0.5844 if cp<=0.017083643935620785\n",
      "   -0.9730 if cv>=-0.9505589485168457\n",
      "   +0.9711 if cp>=-0.034373172372579565\n",
      "   -3.3341 if cv<=-0.6533100008964539\n",
      "   +2.4976 if cp<=-0.025732863694429394\n",
      "   +0.1243 if cp<=0.012251720204949383 & cp>=-0.014610572904348373\n",
      "   -1.7193 if pa>=0.15067561864852907\n",
      "   -0.4478 if pav<=-0.049893178045749664\n",
      "   +3.4148 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "--------------\n",
      "   -0.3034 if cp<=0.026253991574048997\n",
      "   +4.2146 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -0.1972 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +1.9251 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   +0.0661 if cv<=-0.419759601354599\n",
      "   -2.2285 if cp>=-0.014123460277915001\n",
      "   -0.1477 if cv>=-0.5681428074836731\n",
      "   -0.1477 if cv>=-0.604309904575348\n",
      "   -2.9468 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   -0.1557 if cv<=-0.5488481998443604 & pa<=0.16868769824504853 & pav>=0.6717349648475648\n",
      "   -1.0512 if cp>=-0.07298106253147126 & pav<=-0.049893178045749664\n",
      "   +4.9543 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "Run episode 209 with rewards 11.0\n",
      "============ 210 ===========\n",
      "12 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0]\n",
      "   +0.3603 if cv<=1.0829041719436647\n",
      "   +0.0161 if pav<=0.07888057827949524\n",
      "   +2.2297 if cp<=0.017083643935620785\n",
      "   +0.4528 if cv>=-0.9505589485168457\n",
      "   +0.0637 if cp>=-0.034373172372579565\n",
      "   -3.0477 if cv<=-0.6533100008964539\n",
      "   +0.2966 if cp<=-0.025732863694429394\n",
      "   -1.9247 if cp<=0.012251720204949383 & cp>=-0.014610572904348373\n",
      "   -0.0830 if pa>=0.15067561864852907\n",
      "   -0.0000 if pav<=-0.049893178045749664\n",
      "   +0.4433 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +3.7307 if cp>=0.03361134231090546\n",
      "--------------\n",
      "   +0.6840 if cp<=0.026253991574048997\n",
      "   -0.0067 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -0.6438 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -0.6640 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   +0.4515 if cp>=-0.014123460277915001\n",
      "   -1.6038 if cv>=-0.5681428074836731\n",
      "   -1.6038 if cv>=-0.604309904575348\n",
      "   -2.8692 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +1.4384 if cv<=-0.5488481998443604 & pa<=0.16868769824504853 & pav>=0.6717349648475648\n",
      "   -0.0000 if cp>=-0.07298106253147126 & pav<=-0.049893178045749664\n",
      "   +0.7257 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.4957 if cp>=-0.009002706967294216 & cv<=-0.6298959255218504 & cv>=-0.6330713629722595\n",
      "Run episode 210 with rewards 12.0\n",
      "============ 211 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 1]\n",
      "   +0.2223 if cv<=1.0829041719436647\n",
      "   +0.0257 if pav<=0.07888057827949524\n",
      "   +0.2223 if cp<=0.017083643935620785\n",
      "   -0.4235 if cv>=-0.9505589485168457\n",
      "   +0.6499 if cp>=-0.034373172372579565\n",
      "   +0.0959 if cv<=-0.6533100008964539\n",
      "   +0.0959 if cp<=-0.025732863694429394\n",
      "   +0.1190 if cp<=0.012251720204949383 & cp>=-0.014610572904348373\n",
      "   -1.8716 if pa>=0.15067561864852907\n",
      "   +1.4481 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.0000 if cp>=0.03361134231090546\n",
      "   -2.7733 if pa>=0.20719827711582184\n",
      "--------------\n",
      "   +0.8479 if cp<=0.026253991574048997\n",
      "   +1.9822 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -1.8256 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +1.0656 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   -0.5219 if cp>=-0.014123460277915001\n",
      "   -0.5322 if cv>=-0.5681428074836731\n",
      "   -0.5322 if cv>=-0.604309904575348\n",
      "   -2.3475 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   -0.1841 if cv<=-0.5488481998443604 & pa<=0.16868769824504853 & pav>=0.6717349648475648\n",
      "   -0.8933 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -0.0000 if cp>=-0.009002706967294216 & cv<=-0.6298959255218504 & cv>=-0.6330713629722595\n",
      "   +2.8011 if pa>=0.20719827711582184\n",
      "Run episode 211 with rewards 10.0\n",
      "============ 212 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +5.0621 if cv<=1.0829041719436647\n",
      "   +1.0733 if pav<=0.07888057827949524\n",
      "   +3.2145 if cp<=0.017083643935620785\n",
      "   +1.9337 if cv>=-0.9505589485168457\n",
      "   +1.8429 if cp>=-0.034373172372579565\n",
      "   +3.0604 if cv<=-0.6533100008964539\n",
      "   +3.0004 if cp<=-0.025732863694429394\n",
      "   +0.2173 if cp<=0.012251720204949383 & cp>=-0.014610572904348373\n",
      "   +2.9572 if pa>=0.15067561864852907\n",
      "   +1.4990 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -1.1947 if pa>=0.20719827711582184\n",
      "   +0.9942 if cp<=0.01945822425186634 & cp>=0.005329908884596083\n",
      "--------------\n",
      "   -5.2118 if cp<=0.026253991574048997\n",
      "   -5.5617 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +0.0099 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -0.0000 if cp<=-0.016656085476279236 & cv>=-1.0195966005325316\n",
      "   +0.3400 if cp>=-0.014123460277915001\n",
      "   +0.2861 if cv>=-0.5681428074836731\n",
      "   +0.2861 if cv>=-0.604309904575348\n",
      "   +0.0639 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +0.0639 if cv<=-0.5488481998443604 & pa<=0.16868769824504853 & pav>=0.6717349648475648\n",
      "   +0.2573 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -0.0000 if pa>=0.20719827711582184\n",
      "   -5.2997 if \n",
      "Run episode 212 with rewards 9.0\n",
      "============ 213 ===========\n",
      "16 actions [0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0]\n",
      "   +0.0050 if cv<=1.0829041719436647\n",
      "   +0.0013 if pav<=0.07888057827949524\n",
      "   +0.0050 if cp<=0.017083643935620785\n",
      "   +0.0050 if cv>=-0.9505589485168457\n",
      "   +0.0000 if cp>=-0.034373172372579565\n",
      "   +0.0000 if cv<=-0.6533100008964539\n",
      "   +0.0050 if cp<=-0.025732863694429394\n",
      "   -0.0000 if pa>=0.15067561864852907\n",
      "   +0.0050 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.0000 if pa>=0.20719827711582184\n",
      "   +0.0000 if cp<=0.01945822425186634 & cp>=0.005329908884596083\n",
      "   +0.0000 if pa>=0.2058255523443222\n",
      "--------------\n",
      "   -0.0000 if cp<=0.026253991574048997\n",
      "   -0.0000 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -0.0000 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +0.0000 if cp>=-0.014123460277915001\n",
      "   -0.0000 if cv>=-0.5681428074836731\n",
      "   -0.0000 if cv>=-0.604309904575348\n",
      "   -0.0000 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   -0.0000 if cv<=-0.5488481998443604 & pa<=0.16868769824504853 & pav>=0.6717349648475648\n",
      "   -0.0000 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.0000 if pa>=0.20719827711582184\n",
      "   -0.0000 if \n",
      "   +0.0000 if cv>=0.04039212316274643\n",
      "Run episode 213 with rewards 16.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 214 ===========\n",
      "36 actions [0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1]\n",
      "   -2.1031 if cv<=1.0829041719436647\n",
      "   +1.8157 if pav<=0.07888057827949524\n",
      "   +3.3686 if cp<=0.017083643935620785\n",
      "   +1.8347 if cv>=-0.9505589485168457\n",
      "   +0.2909 if cp>=-0.034373172372579565\n",
      "   -1.3485 if cv<=-0.6533100008964539\n",
      "   -2.3940 if cp<=-0.025732863694429394\n",
      "   -1.9332 if pa>=0.15067561864852907\n",
      "   -1.3699 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -0.2492 if pa>=0.20719827711582184\n",
      "   -0.2492 if pa>=0.2058255523443222\n",
      "   +2.7309 if cv>=-0.4036271572113037 & pa<=0.019266029819846153\n",
      "--------------\n",
      "   -3.7510 if cp<=0.026253991574048997\n",
      "   +0.1076 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   +1.3642 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -2.9563 if cp>=-0.014123460277915001\n",
      "   +2.1476 if cv>=-0.5681428074836731\n",
      "   -2.1790 if cv>=-0.604309904575348\n",
      "   +0.3815 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +0.0305 if cv<=-0.5488481998443604 & pa<=0.16868769824504853 & pav>=0.6717349648475648\n",
      "   +1.2426 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +3.4174 if \n",
      "   +0.0000 if cv>=0.04039212316274643\n",
      "   -4.6226 if cp>=0.034838929772377014 & cv>=-0.208836168050766\n",
      "Run episode 214 with rewards 36.0\n",
      "============ 215 ===========\n",
      "65 actions [0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 1]\n",
      "   +0.4277 if cv<=1.0829041719436647\n",
      "   +3.0120 if pav<=0.07888057827949524\n",
      "   +0.4277 if cp<=0.017083643935620785\n",
      "   +0.4277 if cv>=-0.9505589485168457\n",
      "   +4.8279 if cp>=-0.034373172372579565\n",
      "   -4.5208 if cv<=-0.6533100008964539\n",
      "   +0.6283 if cp<=-0.025732863694429394\n",
      "   -3.2410 if pa>=0.15067561864852907\n",
      "   -5.6195 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.0000 if pa>=0.2058255523443222\n",
      "   +4.3387 if cv>=-0.4036271572113037 & pa<=0.019266029819846153\n",
      "   -2.3775 if cp<=-0.12441594898700714\n",
      "--------------\n",
      "   +0.2923 if cp<=0.026253991574048997\n",
      "   -0.4830 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -3.6283 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -0.0000 if cp>=-0.014123460277915001\n",
      "   +0.2150 if cv>=-0.5681428074836731\n",
      "   +0.2150 if cv>=-0.604309904575348\n",
      "   +3.7911 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +0.0773 if cv<=-0.5488481998443604 & pa<=0.16868769824504853 & pav>=0.6717349648475648\n",
      "   +0.9639 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.2923 if \n",
      "   -0.0001 if cp>=0.034838929772377014 & cv>=-0.208836168050766\n",
      "   +2.3079 if pav>=1.3057200908660889\n",
      "Run episode 215 with rewards 65.0\n",
      "============ 216 ===========\n",
      "37 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0]\n",
      "   -1.3321 if cv<=1.0829041719436647\n",
      "   +2.3255 if pav<=0.07888057827949524\n",
      "   +0.6635 if cp<=0.017083643935620785\n",
      "   -1.3321 if cv>=-0.9505589485168457\n",
      "   +5.2729 if cp>=-0.034373172372579565\n",
      "   -0.0000 if cv<=-0.6533100008964539\n",
      "   -1.3357 if cp<=-0.025732863694429394\n",
      "   +1.6044 if pa>=0.15067561864852907\n",
      "   -3.7393 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +6.0352 if cv>=-0.4036271572113037 & pa<=0.019266029819846153\n",
      "   -0.0000 if cp<=-0.12441594898700714\n",
      "   +3.0300 if cv>=0.18683374822139742 & pa>=0.02074484340846539\n",
      "--------------\n",
      "   +1.9632 if cp<=0.026253991574048997\n",
      "   -0.0039 if cp<=-0.05298580601811409 & cv<=0.017999613657593744\n",
      "   -2.5533 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +0.3383 if cv>=-0.5681428074836731\n",
      "   +0.5971 if cv>=-0.604309904575348\n",
      "   +0.9981 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +0.2582 if cv<=-0.5488481998443604 & pa<=0.16868769824504853 & pav>=0.6717349648475648\n",
      "   +2.2787 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.5965 if \n",
      "   -0.4305 if cp>=0.034838929772377014 & cv>=-0.208836168050766\n",
      "   -1.9915 if pav>=1.3057200908660889\n",
      "   -1.5068 if cp>=-0.013122606463730336\n",
      "Run episode 216 with rewards 37.0\n",
      "============ 217 ===========\n",
      "86 actions [0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1]\n",
      "   +0.1455 if cv<=1.0829041719436647\n",
      "   +4.5525 if pav<=0.07888057827949524\n",
      "   +0.0000 if cp<=0.017083643935620785\n",
      "   +0.1455 if cv>=-0.9505589485168457\n",
      "   +0.1455 if cp>=-0.034373172372579565\n",
      "   +0.0000 if cv<=-0.6533100008964539\n",
      "   +0.0000 if cp<=-0.025732863694429394\n",
      "   +1.0382 if pa>=0.15067561864852907\n",
      "   -3.8245 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.0000 if cv>=-0.4036271572113037 & pa<=0.019266029819846153\n",
      "   +5.3432 if cv>=0.18683374822139742 & pa>=0.02074484340846539\n",
      "   +3.3780 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "--------------\n",
      "   +0.0000 if cp<=0.026253991574048997\n",
      "   +0.0000 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +1.3854 if cv>=-0.5681428074836731\n",
      "   +1.3854 if cv>=-0.604309904575348\n",
      "   +0.0000 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +0.0000 if cv<=-0.5488481998443604 & pa<=0.16868769824504853 & pav>=0.6717349648475648\n",
      "   +3.4849 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +1.3854 if \n",
      "   -5.8899 if cp>=0.034838929772377014 & cv>=-0.208836168050766\n",
      "   +2.2403 if pav>=1.3057200908660889\n",
      "   +1.3854 if cp>=-0.013122606463730336\n",
      "   -3.0857 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "Run episode 217 with rewards 86.0\n",
      "============ 218 ===========\n",
      "72 actions [1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1]\n",
      "   -4.5047 if cv<=1.0829041719436647\n",
      "   +4.8652 if pav<=0.07888057827949524\n",
      "   +1.4593 if cp<=0.017083643935620785\n",
      "   +1.2229 if cv>=-0.9505589485168457\n",
      "   +2.1634 if cp>=-0.034373172372579565\n",
      "   +1.9317 if cp<=-0.025732863694429394\n",
      "   +0.4703 if pa>=0.15067561864852907\n",
      "   -2.2822 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -0.2229 if cv>=-0.4036271572113037 & pa<=0.019266029819846153\n",
      "   -0.0004 if cv>=0.18683374822139742 & pa>=0.02074484340846539\n",
      "   +3.7257 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +4.7034 if cv>=0.5977326035499573\n",
      "--------------\n",
      "   +0.3108 if cp<=0.026253991574048997\n",
      "   +2.9239 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -1.0710 if cv>=-0.5681428074836731\n",
      "   -1.0710 if cv>=-0.604309904575348\n",
      "   -1.8558 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +3.5894 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +1.0790 if \n",
      "   -7.4796 if cp>=0.034838929772377014 & cv>=-0.208836168050766\n",
      "   +0.0005 if pav>=1.3057200908660889\n",
      "   +7.3424 if cp>=-0.013122606463730336\n",
      "   -3.0876 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   -5.3780 if cv>=0.5977326035499573\n",
      "Run episode 218 with rewards 72.0\n",
      "============ 219 ===========\n",
      "111 actions [0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1]\n",
      "   -4.0206 if cv<=1.0829041719436647\n",
      "   +4.6150 if pav<=0.07888057827949524\n",
      "   +1.0211 if cp<=0.017083643935620785\n",
      "   +4.4772 if cv>=-0.9505589485168457\n",
      "   +0.1651 if cp>=-0.034373172372579565\n",
      "   +1.3294 if cp<=-0.025732863694429394\n",
      "   +1.3986 if pa>=0.15067561864852907\n",
      "   -4.1910 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.2189 if cv>=-0.4036271572113037 & pa<=0.019266029819846153\n",
      "   +4.3742 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +1.3392 if cv>=0.5977326035499573\n",
      "   -2.6590 if cp<=-0.14482987523078913\n",
      "--------------\n",
      "   +1.4066 if cp<=0.026253991574048997\n",
      "   +2.8706 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +0.2120 if cv>=-0.5681428074836731\n",
      "   +0.2120 if cv>=-0.604309904575348\n",
      "   -2.0746 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +5.5741 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -2.1965 if \n",
      "   -8.5182 if cp>=0.034838929772377014 & cv>=-0.208836168050766\n",
      "   +8.5620 if cp>=-0.013122606463730336\n",
      "   -2.3051 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   -2.6418 if cv>=0.5977326035499573\n",
      "   -2.4306 if pa<=-0.05643089190125465\n",
      "Run episode 219 with rewards 111.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 220 ===========\n",
      "33 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0]\n",
      "   -3.7153 if cv<=1.0829041719436647\n",
      "   +6.4536 if pav<=0.07888057827949524\n",
      "   +1.4937 if cp<=0.017083643935620785\n",
      "   +2.5066 if cv>=-0.9505589485168457\n",
      "   +5.4427 if cp<=-0.025732863694429394\n",
      "   +1.9119 if pa>=0.15067561864852907\n",
      "   -1.9848 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -2.1145 if cv>=-0.4036271572113037 & pa<=0.019266029819846153\n",
      "   +2.5869 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   -2.1782 if cv>=0.5977326035499573\n",
      "   -6.3883 if cp<=-0.14482987523078913\n",
      "   -6.0102 if pa<=-0.1466614454984665 & pav>=0.33184200525283813\n",
      "--------------\n",
      "   +0.0186 if cp<=0.026253991574048997\n",
      "   +4.7644 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +0.1385 if cv>=-0.5681428074836731\n",
      "   -1.4465 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +5.9323 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -0.4944 if \n",
      "   -9.7471 if cp>=0.034838929772377014 & cv>=-0.208836168050766\n",
      "   +9.9850 if cp>=-0.013122606463730336\n",
      "   -4.7310 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +1.6265 if cv>=0.5977326035499573\n",
      "   -3.3603 if pa<=-0.05643089190125465\n",
      "   -5.8212 if cv<=-0.9170470237731934 & cv>=-0.9170470237731934\n",
      "Run episode 220 with rewards 33.0\n",
      "============ 221 ===========\n",
      "40 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0]\n",
      "   +2.2113 if cv<=1.0829041719436647\n",
      "   +2.1740 if pav<=0.07888057827949524\n",
      "   +2.2113 if cv>=-0.9505589485168457\n",
      "   +1.2995 if cp<=-0.025732863694429394\n",
      "   +0.0834 if pa>=0.15067561864852907\n",
      "   -3.1389 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -0.3966 if cv>=-0.4036271572113037 & pa<=0.019266029819846153\n",
      "   +2.2224 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   -0.0000 if cv>=0.5977326035499573\n",
      "   -0.0000 if cp<=-0.14482987523078913\n",
      "   -0.0000 if pa<=-0.1466614454984665 & pav>=0.33184200525283813\n",
      "   -2.5285 if cp<=-0.07385655492544174\n",
      "--------------\n",
      "   +1.9268 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +1.8330 if cv>=-0.5681428074836731\n",
      "   -2.5544 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +6.2228 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +1.8394 if \n",
      "   +0.0000 if cp>=0.034838929772377014 & cv>=-0.208836168050766\n",
      "   +0.0000 if cp>=-0.013122606463730336\n",
      "   -4.1408 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +0.0000 if cv>=0.5977326035499573\n",
      "   +0.0000 if pa<=-0.05643089190125465\n",
      "   +0.0000 if cv<=-0.9170470237731934 & cv>=-0.9170470237731934\n",
      "   +2.5588 if cp<=-0.07385655492544174 & cv<=-0.008567308634519577 & cv>=-0.019547272473573678\n",
      "Run episode 221 with rewards 40.0\n",
      "============ 222 ===========\n",
      "37 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.9376 if cv<=1.0829041719436647\n",
      "   +0.8336 if pav<=0.07888057827949524\n",
      "   +0.9376 if cv>=-0.9505589485168457\n",
      "   +0.0000 if cp<=-0.025732863694429394\n",
      "   +0.2631 if pa>=0.15067561864852907\n",
      "   -1.1124 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.6911 if cv>=-0.4036271572113037 & pa<=0.019266029819846153\n",
      "   -0.3777 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +0.0000 if cp<=-0.14482987523078913\n",
      "   +0.0000 if pa<=-0.1466614454984665 & pav>=0.33184200525283813\n",
      "   +0.0000 if cp<=-0.07385655492544174\n",
      "   +3.9638 if pav<=0.1965594500303269\n",
      "--------------\n",
      "   -0.0000 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +0.1182 if cv>=-0.5681428074836731\n",
      "   -0.8889 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +6.1450 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.2516 if \n",
      "   -0.0000 if cp>=0.034838929772377014 & cv>=-0.208836168050766\n",
      "   -2.1222 if cp>=-0.013122606463730336\n",
      "   -1.5676 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   -0.0000 if pa<=-0.05643089190125465\n",
      "   -0.0000 if cv<=-0.9170470237731934 & cv>=-0.9170470237731934\n",
      "   -0.0000 if cp<=-0.07385655492544174 & cv<=-0.008567308634519577 & cv>=-0.019547272473573678\n",
      "   +4.3551 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "Run episode 222 with rewards 37.0\n",
      "============ 223 ===========\n",
      "48 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.1540 if cv<=1.0829041719436647\n",
      "   +0.7468 if pav<=0.07888057827949524\n",
      "   +0.1540 if cv>=-0.9505589485168457\n",
      "   +0.1540 if cp<=-0.025732863694429394\n",
      "   +1.0520 if pa>=0.15067561864852907\n",
      "   +0.4117 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.3363 if cv>=-0.4036271572113037 & pa<=0.019266029819846153\n",
      "   +1.3084 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +0.0000 if cp<=-0.14482987523078913\n",
      "   +0.0000 if cp<=-0.07385655492544174\n",
      "   +2.3134 if pav<=0.1965594500303269\n",
      "   +2.0414 if cv>=0.13895457684993745 & pav<=0.3351419150829315\n",
      "--------------\n",
      "   -0.0994 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -0.0994 if cv>=-0.5681428074836731\n",
      "   -0.0994 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +2.0441 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -0.0994 if \n",
      "   +0.0000 if cp>=0.034838929772377014 & cv>=-0.208836168050766\n",
      "   +0.0000 if cp>=-0.013122606463730336\n",
      "   -0.7445 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +0.0000 if cv<=-0.9170470237731934 & cv>=-0.9170470237731934\n",
      "   +0.0000 if cp<=-0.07385655492544174 & cv<=-0.008567308634519577 & cv>=-0.019547272473573678\n",
      "   +5.7711 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +0.5473 if cp<=-0.06552206873893737 & pav<=0.21985108852386476\n",
      "Run episode 223 with rewards 48.0\n",
      "============ 224 ===========\n",
      "44 actions [0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1]\n",
      "   +0.3482 if cv<=1.0829041719436647\n",
      "   +1.9880 if pav<=0.07888057827949524\n",
      "   +0.3482 if cv>=-0.9505589485168457\n",
      "   -1.1801 if cp<=-0.025732863694429394\n",
      "   +2.0769 if pa>=0.15067561864852907\n",
      "   +2.1922 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +2.6048 if cv>=-0.4036271572113037 & pa<=0.019266029819846153\n",
      "   +0.2035 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +0.0000 if cp<=-0.07385655492544174\n",
      "   +0.3348 if pav<=0.1965594500303269\n",
      "   +2.0433 if cv>=0.13895457684993745 & pav<=0.3351419150829315\n",
      "   -2.8798 if cp>=0.0016839250922203125 & cv<=-0.2141095370054245\n",
      "--------------\n",
      "   +5.7515 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -2.0123 if cv>=-0.5681428074836731\n",
      "   -1.2940 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +1.5719 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -2.0123 if \n",
      "   +0.0000 if cp>=0.034838929772377014 & cv>=-0.208836168050766\n",
      "   +5.6684 if cp>=-0.013122606463730336\n",
      "   -4.5327 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +0.0000 if cp<=-0.07385655492544174 & cv<=-0.008567308634519577 & cv>=-0.019547272473573678\n",
      "   +4.4300 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +0.0000 if cp<=-0.06552206873893737 & pav<=0.21985108852386476\n",
      "   +1.9719 if pav<=0.20378408133983614\n",
      "Run episode 224 with rewards 44.0\n",
      "============ 225 ===========\n",
      "53 actions [0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.8980 if cv<=1.0829041719436647\n",
      "   +2.0709 if pav<=0.07888057827949524\n",
      "   +0.8980 if cv>=-0.9505589485168457\n",
      "   -1.8681 if cp<=-0.025732863694429394\n",
      "   +0.1087 if pa>=0.15067561864852907\n",
      "   +2.8743 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +3.1122 if cv>=-0.4036271572113037 & pa<=0.019266029819846153\n",
      "   -1.4902 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +1.6515 if pav<=0.1965594500303269\n",
      "   +3.2788 if cv>=0.13895457684993745 & pav<=0.3351419150829315\n",
      "   -2.3778 if cp>=0.0016839250922203125 & cv<=-0.2141095370054245\n",
      "   -1.4959 if pav<=0.233574378490448\n",
      "--------------\n",
      "   +3.1319 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -2.0495 if cv>=-0.5681428074836731\n",
      "   +0.8514 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +1.5113 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -2.0495 if \n",
      "   +3.5447 if cp>=-0.013122606463730336\n",
      "   -4.9776 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +0.0000 if cp<=-0.07385655492544174 & cv<=-0.008567308634519577 & cv>=-0.019547272473573678\n",
      "   +4.9793 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +0.0000 if cp<=-0.06552206873893737 & pav<=0.21985108852386476\n",
      "   +2.1325 if pav<=0.20378408133983614\n",
      "   +3.2745 if cp>=0.016427554190158844\n",
      "Run episode 225 with rewards 53.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 226 ===========\n",
      "34 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0]\n",
      "   +0.8607 if cv<=1.0829041719436647\n",
      "   +0.7607 if pav<=0.07888057827949524\n",
      "   +0.8607 if cv>=-0.9505589485168457\n",
      "   -2.3234 if cp<=-0.025732863694429394\n",
      "   +5.5941 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +1.9083 if cv>=-0.4036271572113037 & pa<=0.019266029819846153\n",
      "   -4.0118 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +4.9547 if pav<=0.1965594500303269\n",
      "   +0.1584 if cv>=0.13895457684993745 & pav<=0.3351419150829315\n",
      "   -0.0000 if cp>=0.0016839250922203125 & cv<=-0.2141095370054245\n",
      "   -3.3847 if pav<=0.233574378490448\n",
      "   +2.2151 if cv>=0.013880855403840547\n",
      "--------------\n",
      "   +3.8448 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -3.0390 if cv>=-0.5681428074836731\n",
      "   +4.1153 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +1.1389 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -3.0390 if \n",
      "   +5.1609 if cp>=-0.013122606463730336\n",
      "   -6.3952 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +4.9490 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -1.4343 if cp<=-0.06552206873893737 & pav<=0.21985108852386476\n",
      "   -0.2471 if pav<=0.20378408133983614\n",
      "   -0.0001 if cp>=0.016427554190158844\n",
      "   +2.6214 if cp<=-0.046878177672624574\n",
      "Run episode 226 with rewards 34.0\n",
      "============ 227 ===========\n",
      "40 actions [1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0]\n",
      "   +0.4464 if cv<=1.0829041719436647\n",
      "   +0.0410 if pav<=0.07888057827949524\n",
      "   +0.4464 if cv>=-0.9505589485168457\n",
      "   -0.0000 if cp<=-0.025732863694429394\n",
      "   +2.2693 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -0.0000 if cv>=-0.4036271572113037 & pa<=0.019266029819846153\n",
      "   +3.5692 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +0.1598 if pav<=0.1965594500303269\n",
      "   +1.5694 if cv>=0.13895457684993745 & pav<=0.3351419150829315\n",
      "   -2.9159 if pav<=0.233574378490448\n",
      "   +2.8329 if cv>=0.013880855403840547\n",
      "   -5.4941 if cp>=0.010079050622880462 & pav>=0.2217007040977478\n",
      "--------------\n",
      "   +0.0000 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +0.3307 if cv>=-0.5681428074836731\n",
      "   +8.8538 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   -0.0473 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.3307 if \n",
      "   +0.3308 if cp>=-0.013122606463730336\n",
      "   -5.0329 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +5.9973 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +0.0000 if cp<=-0.06552206873893737 & pav<=0.21985108852386476\n",
      "   +4.9315 if pav<=0.20378408133983614\n",
      "   +0.0000 if cp<=-0.046878177672624574\n",
      "   -4.9497 if cp<=0.010079050622880462\n",
      "Run episode 227 with rewards 40.0\n",
      "============ 228 ===========\n",
      "44 actions [1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1]\n",
      "   -0.4785 if cv<=1.0829041719436647\n",
      "   -1.4812 if pav<=0.07888057827949524\n",
      "   +3.1213 if cv>=-0.9505589485168457\n",
      "   +2.5380 if cp<=-0.025732863694429394\n",
      "   +3.1213 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +4.5857 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   -1.4267 if pav<=0.1965594500303269\n",
      "   +1.8044 if cv>=0.13895457684993745 & pav<=0.3351419150829315\n",
      "   -1.4266 if pav<=0.233574378490448\n",
      "   +1.8044 if cv>=0.013880855403840547\n",
      "   +0.0001 if cp>=0.010079050622880462 & pav>=0.2217007040977478\n",
      "   -3.8411 if cp<=-0.002366305910982189 & cv<=0.09535341560840632\n",
      "--------------\n",
      "   -0.4494 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -1.1270 if cv>=-0.5681428074836731\n",
      "   +6.5964 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +0.9986 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +4.9263 if \n",
      "   -1.0342 if cp>=-0.013122606463730336\n",
      "   -5.7704 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +0.9986 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +3.9277 if pav<=0.20378408133983614\n",
      "   +0.0000 if cp<=-0.046878177672624574\n",
      "   -3.4171 if cp<=0.010079050622880462\n",
      "   -1.6539 if cp>=0.07741032242774969\n",
      "Run episode 228 with rewards 44.0\n",
      "============ 229 ===========\n",
      "26 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0]\n",
      "   -1.4854 if cv<=1.0829041719436647\n",
      "   +1.0321 if pav<=0.07888057827949524\n",
      "   +4.0765 if cv>=-0.9505589485168457\n",
      "   +2.9393 if cp<=-0.025732863694429394\n",
      "   +2.7471 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +5.2472 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   -2.2696 if pav<=0.1965594500303269\n",
      "   +2.2400 if cv>=0.13895457684993745 & pav<=0.3351419150829315\n",
      "   -1.5796 if pav<=0.233574378490448\n",
      "   +0.9582 if cv>=0.013880855403840547\n",
      "   -4.7190 if cp<=-0.002366305910982189 & cv<=0.09535341560840632\n",
      "   +2.9342 if cv>=0.4076113700866699\n",
      "--------------\n",
      "   +3.3325 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -3.1314 if cv>=-0.5681428074836731\n",
      "   +4.5957 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   -0.8788 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.7129 if \n",
      "   -0.8025 if cp>=-0.013122606463730336\n",
      "   -3.0699 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +3.7842 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +5.2776 if pav<=0.20378408133983614\n",
      "   +0.7712 if cp<=0.010079050622880462\n",
      "   +0.0013 if cp>=0.07741032242774969\n",
      "   -2.8117 if cp<=-0.0014129831688478593 & cv>=-0.3643034100532532 & pa>=-0.04844097718596459\n",
      "Run episode 229 with rewards 26.0\n",
      "============ 230 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1]\n",
      "   +1.7256 if cv<=1.0829041719436647\n",
      "   +2.1628 if pav<=0.07888057827949524\n",
      "   +3.1398 if cv>=-0.9505589485168457\n",
      "   -0.4300 if cp<=-0.025732863694429394\n",
      "   +2.9143 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +2.9533 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   -0.8523 if pav<=0.1965594500303269\n",
      "   -0.7681 if cv>=0.13895457684993745 & pav<=0.3351419150829315\n",
      "   -0.8828 if pav<=0.233574378490448\n",
      "   -2.2750 if cp<=-0.002366305910982189 & cv<=0.09535341560840632\n",
      "   +3.9266 if cv>=0.4076113700866699\n",
      "   +3.9439 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "--------------\n",
      "   +3.3641 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +0.0118 if cv>=-0.5681428074836731\n",
      "   +1.4167 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +1.0277 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +1.0698 if \n",
      "   -1.9871 if cp>=-0.013122606463730336\n",
      "   -3.0014 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +1.0470 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +1.6135 if pav<=0.20378408133983614\n",
      "   +1.3079 if cp<=0.010079050622880462\n",
      "   +1.2461 if cp<=-0.0014129831688478593 & cv>=-0.3643034100532532 & pa>=-0.04844097718596459\n",
      "   -3.3368 if cp<=-0.0170885045081377 & cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "Run episode 230 with rewards 11.0\n",
      "============ 231 ===========\n",
      "21 actions [0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0]\n",
      "   +0.5277 if cv<=1.0829041719436647\n",
      "   +0.1556 if pav<=0.07888057827949524\n",
      "   +2.7766 if cv>=-0.9505589485168457\n",
      "   +0.5162 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +1.5683 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +0.1556 if pav<=0.1965594500303269\n",
      "   +0.0000 if cv>=0.13895457684993745 & pav<=0.3351419150829315\n",
      "   +0.1556 if pav<=0.233574378490448\n",
      "   +1.1941 if cp<=-0.002366305910982189 & cv<=0.09535341560840632\n",
      "   +0.0000 if cv>=0.4076113700866699\n",
      "   +0.1556 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   -0.1267 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "--------------\n",
      "   +0.9291 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   -0.5625 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +1.9120 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +1.2704 if \n",
      "   +0.3413 if cp>=-0.013122606463730336\n",
      "   +0.0000 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +1.2704 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -0.0000 if pav<=0.20378408133983614\n",
      "   +1.4648 if cp<=0.010079050622880462\n",
      "   +0.0000 if cp<=-0.0014129831688478593 & cv>=-0.3643034100532532 & pa>=-0.04844097718596459\n",
      "   +0.0000 if cp<=-0.0170885045081377 & cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   -0.1944 if pa<=0.04548279941082001\n",
      "Run episode 231 with rewards 21.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 232 ===========\n",
      "20 actions [0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 0]\n",
      "   +1.1938 if cv<=1.0829041719436647\n",
      "   +0.7523 if pav<=0.07888057827949524\n",
      "   +1.1938 if cv>=-0.9505589485168457\n",
      "   -3.0263 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +1.4418 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +0.7686 if pav<=0.1965594500303269\n",
      "   +1.5667 if pav<=0.233574378490448\n",
      "   +1.1938 if cp<=-0.002366305910982189 & cv<=0.09535341560840632\n",
      "   -0.0000 if cv>=0.4076113700866699\n",
      "   +0.7686 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   +2.9259 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +1.0927 if cp<=-0.009477400220930576 & pav<=0.600848913192749\n",
      "--------------\n",
      "   +0.6827 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +0.0504 if cp<=0.006921333260834218 & cp>=-0.07428496778011322\n",
      "   +1.5258 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.5957 if \n",
      "   +3.2735 if cp>=-0.013122606463730336\n",
      "   -1.1710 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +2.0540 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -1.4583 if pav<=0.20378408133983614\n",
      "   +0.5957 if cp<=0.010079050622880462\n",
      "   -0.1103 if cp<=-0.0170885045081377 & cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   -1.0483 if pa<=0.04548279941082001\n",
      "   +1.9775 if pav>=0.600848913192749\n",
      "Run episode 232 with rewards 20.0\n",
      "============ 233 ===========\n",
      "48 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +0.2741 if cv<=1.0829041719436647\n",
      "   +0.8987 if pav<=0.07888057827949524\n",
      "   +2.3090 if cv>=-0.9505589485168457\n",
      "   -0.8054 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +2.9273 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +0.8987 if pav<=0.1965594500303269\n",
      "   +1.5601 if pav<=0.233574378490448\n",
      "   +1.8020 if cp<=-0.002366305910982189 & cv<=0.09535341560840632\n",
      "   +0.8987 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   -0.8055 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +2.4144 if cp<=-0.009477400220930576 & pav<=0.600848913192749\n",
      "   +0.1864 if cv<=-0.636212944984436\n",
      "--------------\n",
      "   -1.5336 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +2.9206 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.7197 if \n",
      "   +3.9846 if cp>=-0.013122606463730336\n",
      "   -0.7265 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +1.4462 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -0.7265 if pav<=0.20378408133983614\n",
      "   +0.7197 if cp<=0.010079050622880462\n",
      "   -0.0000 if cp<=-0.0170885045081377 & cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   -2.6033 if pa<=0.04548279941082001\n",
      "   +1.4820 if pav>=0.600848913192749\n",
      "   +3.8773 if cp>=-0.02854387313127515 & cv<=-0.5904564142227173\n",
      "Run episode 233 with rewards 48.0\n",
      "============ 234 ===========\n",
      "39 actions [0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0]\n",
      "   +0.9173 if cv<=1.0829041719436647\n",
      "   +4.5911 if pav<=0.07888057827949524\n",
      "   +0.9173 if cv>=-0.9505589485168457\n",
      "   +0.8982 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -0.8829 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +3.9251 if pav<=0.1965594500303269\n",
      "   -0.0666 if pav<=0.233574378490448\n",
      "   -0.0001 if cp<=-0.002366305910982189 & cv<=0.09535341560840632\n",
      "   +2.4301 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   -7.3229 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -0.0001 if cp<=-0.009477400220930576 & pav<=0.600848913192749\n",
      "   +5.2974 if cv<=0.03450129479169846\n",
      "--------------\n",
      "   -0.0000 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +4.8765 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +2.3628 if \n",
      "   +2.3628 if cp>=-0.013122606463730336\n",
      "   -0.3812 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +4.8765 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -0.8624 if pav<=0.20378408133983614\n",
      "   -0.0000 if cp<=0.010079050622880462\n",
      "   -2.6239 if pa<=0.04548279941082001\n",
      "   +1.0192 if pav>=0.600848913192749\n",
      "   -0.0000 if cp>=-0.02854387313127515 & cv<=-0.5904564142227173\n",
      "   -3.0264 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "Run episode 234 with rewards 39.0\n",
      "============ 235 ===========\n",
      "34 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1]\n",
      "   +0.4821 if cv<=1.0829041719436647\n",
      "   +0.1259 if pav<=0.07888057827949524\n",
      "   +0.4821 if cv>=-0.9505589485168457\n",
      "   -1.4553 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +1.3083 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +0.2394 if pav<=0.1965594500303269\n",
      "   +3.0034 if pav<=0.233574378490448\n",
      "   +0.2394 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   -1.9031 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +2.8595 if cp<=-0.009477400220930576 & pav<=0.600848913192749\n",
      "   +1.1137 if cv<=0.03450129479169846\n",
      "   -3.2245 if cp>=-0.0695705935359001 & cv<=-0.4087065875530243\n",
      "--------------\n",
      "   -0.4345 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +8.3056 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +2.1901 if \n",
      "   +0.0000 if cp>=-0.013122606463730336\n",
      "   -0.0546 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +6.6821 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -0.0556 if pav<=0.20378408133983614\n",
      "   -5.2027 if pa<=0.04548279941082001\n",
      "   +3.4404 if pav>=0.600848913192749\n",
      "   +0.0000 if cp>=-0.02854387313127515 & cv<=-0.5904564142227173\n",
      "   -5.4284 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   +3.3790 if cp>=-0.0695705935359001 & cv<=-0.4087065875530243\n",
      "Run episode 235 with rewards 34.0\n",
      "============ 236 ===========\n",
      "46 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.8346 if cv<=1.0829041719436647\n",
      "   +0.8346 if cv>=-0.9505589485168457\n",
      "   -1.0291 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -1.0565 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +1.3819 if pav<=0.1965594500303269\n",
      "   +1.2469 if pav<=0.233574378490448\n",
      "   +1.3819 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   -0.2694 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +0.8008 if cp<=-0.009477400220930576 & pav<=0.600848913192749\n",
      "   -1.2172 if cv<=0.03450129479169846\n",
      "   +0.0000 if cp>=-0.0695705935359001 & cv<=-0.4087065875530243\n",
      "   +1.4688 if cp>=-0.041838707029819476\n",
      "--------------\n",
      "   +0.6975 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +0.8103 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.6975 if \n",
      "   -0.0000 if cp>=-0.013122606463730336\n",
      "   -1.5071 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +6.8422 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -1.6336 if pav<=0.20378408133983614\n",
      "   -0.6588 if pa<=0.04548279941082001\n",
      "   -0.0319 if pav>=0.600848913192749\n",
      "   -0.7498 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   -0.0000 if cp>=-0.0695705935359001 & cv<=-0.4087065875530243\n",
      "   +2.4175 if pa<=0.10259403884410859\n",
      "Run episode 236 with rewards 46.0\n",
      "============ 237 ===========\n",
      "54 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.8984 if cv<=1.0829041719436647\n",
      "   +0.8984 if cv>=-0.9505589485168457\n",
      "   -0.0426 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -0.4129 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +2.2296 if pav<=0.1965594500303269\n",
      "   -0.3005 if pav<=0.233574378490448\n",
      "   +2.2296 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   +0.8984 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +0.0000 if cp<=-0.009477400220930576 & pav<=0.600848913192749\n",
      "   -1.6170 if cv<=0.03450129479169846\n",
      "   +0.8984 if cp>=-0.041838707029819476\n",
      "   -1.3353 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "--------------\n",
      "   +0.0000 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +0.8162 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -0.3476 if \n",
      "   -1.1771 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +1.8707 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -1.5739 if pav<=0.20378408133983614\n",
      "   -0.2699 if pa<=0.04548279941082001\n",
      "   +0.2910 if pav>=0.600848913192749\n",
      "   -0.5519 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   +0.0000 if cp>=-0.0695705935359001 & cv<=-0.4087065875530243\n",
      "   +1.5237 if pa<=0.10259403884410859\n",
      "   +3.8925 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "Run episode 237 with rewards 54.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 238 ===========\n",
      "37 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.4634 if cv<=1.0829041719436647\n",
      "   +0.4634 if cv>=-0.9505589485168457\n",
      "   -0.2663 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -0.3647 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +2.2965 if pav<=0.1965594500303269\n",
      "   -0.0333 if pav<=0.233574378490448\n",
      "   +2.2965 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   +0.4634 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -4.3469 if cv<=0.03450129479169846\n",
      "   +0.4634 if cp>=-0.041838707029819476\n",
      "   +0.8392 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +2.0801 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "--------------\n",
      "   -0.5174 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +0.6971 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -0.1965 if \n",
      "   -0.3942 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +4.2182 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -0.7305 if pav<=0.20378408133983614\n",
      "   +0.3209 if pa<=0.04548279941082001\n",
      "   +0.1844 if pav>=0.600848913192749\n",
      "   +0.7792 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   +0.3875 if pa<=0.10259403884410859\n",
      "   +2.5410 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +1.8790 if cv<=0.0403841868042946 & cv>=-0.14140277206897736 & pa>=0.10822374373674395\n",
      "Run episode 238 with rewards 37.0\n",
      "============ 239 ===========\n",
      "35 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.2107 if cv<=1.0829041719436647\n",
      "   +0.2107 if cv>=-0.9505589485168457\n",
      "   -0.7645 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -0.0989 if cv<=-0.024970776587724685 & pa<=0.0678311288356781\n",
      "   +1.7314 if pav<=0.1965594500303269\n",
      "   +1.7314 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   +0.6500 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -1.9119 if cv<=0.03450129479169846\n",
      "   +0.9876 if cp>=-0.041838707029819476\n",
      "   +0.1715 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +1.7314 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +1.0929 if cv>=0.16686491668224346 & pa>=0.13184547275304795 & pav<=0.3464231312274933\n",
      "--------------\n",
      "   -0.4184 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +1.1038 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -0.4224 if \n",
      "   -0.0593 if cp<=0.040582723915576935 & pav<=0.12340002804994583\n",
      "   +0.9574 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -0.7446 if pav<=0.20378408133983614\n",
      "   +0.4726 if pa<=0.04548279941082001\n",
      "   +0.1010 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   +0.6485 if pa<=0.10259403884410859\n",
      "   +2.1682 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +0.7771 if cv<=0.0403841868042946 & cv>=-0.14140277206897736 & pa>=0.10822374373674395\n",
      "   +0.4927 if pa>=0.0955692782998085 & pav>=0.3464231312274933\n",
      "Run episode 239 with rewards 35.0\n",
      "============ 240 ===========\n",
      "27 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   +0.3730 if cv<=1.0829041719436647\n",
      "   +0.3730 if cv>=-0.9505589485168457\n",
      "   -1.4513 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +2.9216 if pav<=0.1965594500303269\n",
      "   +2.8492 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   +0.8995 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -1.7542 if cv<=0.03450129479169846\n",
      "   +0.9304 if cp>=-0.041838707029819476\n",
      "   -0.6128 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +2.9216 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   -0.0000 if cv>=0.16686491668224346 & pa>=0.13184547275304795 & pav<=0.3464231312274933\n",
      "   -2.7448 if pav<=0.2056886851787567\n",
      "--------------\n",
      "   +1.2295 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +1.4866 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +1.4007 if \n",
      "   +2.5618 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -2.6911 if pav<=0.20378408133983614\n",
      "   -0.0030 if pa<=0.04548279941082001\n",
      "   -0.6689 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   -0.5582 if pa<=0.10259403884410859\n",
      "   +2.5618 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +0.5788 if cv<=0.0403841868042946 & cv>=-0.14140277206897736 & pa>=0.10822374373674395\n",
      "   -0.4282 if pa>=0.0955692782998085 & pav>=0.3464231312274933\n",
      "   -2.6798 if pav>=0.2056886851787567\n",
      "Run episode 240 with rewards 27.0\n",
      "============ 241 ===========\n",
      "69 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1]\n",
      "   +0.1514 if cv<=1.0829041719436647\n",
      "   +0.1514 if cv>=-0.9505589485168457\n",
      "   +0.2218 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +1.1315 if pav<=0.1965594500303269\n",
      "   +1.1315 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   +0.1514 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -2.1826 if cv<=0.03450129479169846\n",
      "   +0.1514 if cp>=-0.041838707029819476\n",
      "   +0.1170 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +1.1315 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +1.1315 if pav<=0.2056886851787567\n",
      "   +0.0011 if cp>=0.005702055990695953\n",
      "--------------\n",
      "   +0.0000 if cp<=-0.01872282214462757 & cp>=-0.08475320041179657\n",
      "   +0.9454 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -1.1704 if \n",
      "   +2.1544 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -0.8614 if pav<=0.20378408133983614\n",
      "   -0.0347 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   +0.8009 if pa<=0.10259403884410859\n",
      "   +2.1544 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +0.3620 if cv<=0.0403841868042946 & cv>=-0.14140277206897736 & pa>=0.10822374373674395\n",
      "   +1.4249 if pa>=0.0955692782998085 & pav>=0.3464231312274933\n",
      "   -0.3090 if pav>=0.2056886851787567\n",
      "   +0.3612 if pa>=0.1515461266040802\n",
      "Run episode 241 with rewards 69.0\n",
      "============ 242 ===========\n",
      "51 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.1678 if cv<=1.0829041719436647\n",
      "   +0.1678 if cv>=-0.9505589485168457\n",
      "   -0.2953 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.6658 if pav<=0.1965594500303269\n",
      "   +0.6658 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   -0.2953 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -1.8343 if cv<=0.03450129479169846\n",
      "   -0.1692 if cp>=-0.041838707029819476\n",
      "   -0.1893 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +0.6658 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +7.0471 if pav<=0.2056886851787567\n",
      "   -2.4200 if cp<=-0.14400075674057006\n",
      "--------------\n",
      "   +0.8540 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -0.5771 if \n",
      "   +0.9877 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -3.3807 if pav<=0.20378408133983614\n",
      "   +0.3985 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   -1.1310 if pa<=0.10259403884410859\n",
      "   +2.6260 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +0.3757 if cv<=0.0403841868042946 & cv>=-0.14140277206897736 & pa>=0.10822374373674395\n",
      "   +1.0442 if pa>=0.0955692782998085 & pav>=0.3464231312274933\n",
      "   +2.8036 if pav>=0.2056886851787567\n",
      "   -0.1904 if pa>=0.1515461266040802\n",
      "   -3.4517 if pa>=0.10946480780839923 & pav>=0.23868310153484348\n",
      "Run episode 242 with rewards 51.0\n",
      "============ 243 ===========\n",
      "30 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +1.1908 if cv>=-0.9505589485168457\n",
      "   -0.1561 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.9802 if pav<=0.1965594500303269\n",
      "   +0.9802 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   -0.2207 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -2.1050 if cv<=0.03450129479169846\n",
      "   -0.1268 if cp>=-0.041838707029819476\n",
      "   +0.3625 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +0.9802 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +0.9802 if pav<=0.2056886851787567\n",
      "   -0.0000 if cp<=-0.14400075674057006\n",
      "   -1.9390 if cp<=-0.07162853330373764 & pa>=0.11599280685186386\n",
      "--------------\n",
      "   +0.6351 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.3314 if \n",
      "   +1.8655 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -0.7925 if pav<=0.20378408133983614\n",
      "   -0.1566 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   -0.0803 if pa<=0.10259403884410859\n",
      "   +1.8655 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +1.1143 if cv<=0.0403841868042946 & cv>=-0.14140277206897736 & pa>=0.10822374373674395\n",
      "   -0.7316 if pa>=0.0955692782998085 & pav>=0.3464231312274933\n",
      "   +1.1239 if pav>=0.2056886851787567\n",
      "   -3.6828 if pa>=0.10946480780839923 & pav>=0.23868310153484348\n",
      "   +0.4816 if pa>=0.07558202743530275\n",
      "Run episode 243 with rewards 30.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 244 ===========\n",
      "39 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.1877 if cv>=-0.9505589485168457\n",
      "   -0.0898 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +1.6948 if pav<=0.1965594500303269\n",
      "   +1.6948 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   +0.1877 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -1.1255 if cv<=0.03450129479169846\n",
      "   +0.1877 if cp>=-0.041838707029819476\n",
      "   -1.2133 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +1.6948 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +1.6948 if pav<=0.2056886851787567\n",
      "   -0.0000 if cp<=-0.07162853330373764 & pa>=0.11599280685186386\n",
      "   +0.2449 if cv>=0.1789414793252945 & pav<=0.23630303442478182\n",
      "--------------\n",
      "   +0.6080 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -0.0638 if \n",
      "   +1.6513 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -2.0204 if pav<=0.20378408133983614\n",
      "   -1.0862 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   +1.6513 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +0.9759 if cv<=0.0403841868042946 & cv>=-0.14140277206897736 & pa>=0.10822374373674395\n",
      "   -0.5279 if pa>=0.0955692782998085 & pav>=0.3464231312274933\n",
      "   +1.9565 if pav>=0.2056886851787567\n",
      "   -3.5127 if pa>=0.10946480780839923 & pav>=0.23868310153484348\n",
      "   +0.6104 if pa>=0.07558202743530275\n",
      "   +0.6162 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "Run episode 244 with rewards 39.0\n",
      "============ 245 ===========\n",
      "46 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.6038 if cv>=-0.9505589485168457\n",
      "   -0.2463 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +1.3039 if pav<=0.1965594500303269\n",
      "   +1.3039 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   +0.6038 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -2.1174 if cv<=0.03450129479169846\n",
      "   +0.6038 if cp>=-0.041838707029819476\n",
      "   -0.1314 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +0.4941 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +1.3039 if pav<=0.2056886851787567\n",
      "   +0.1055 if cv>=0.1789414793252945 & pav<=0.23630303442478182\n",
      "   -0.7382 if cv<=0.16620478630065919 & pa>=0.09044390320777895 & pav>=0.346860420703888\n",
      "--------------\n",
      "   +1.0091 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +1.8932 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -1.4074 if pav<=0.20378408133983614\n",
      "   -0.4279 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   +1.8932 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +0.6248 if cv<=0.0403841868042946 & cv>=-0.14140277206897736 & pa>=0.10822374373674395\n",
      "   -0.1498 if pa>=0.0955692782998085 & pav>=0.3464231312274933\n",
      "   +0.2189 if pav>=0.2056886851787567\n",
      "   -1.0496 if pa>=0.10946480780839923 & pav>=0.23868310153484348\n",
      "   -0.6657 if pa>=0.07558202743530275\n",
      "   +1.5677 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   -1.4022 if cv>=0.16620478630065919\n",
      "Run episode 245 with rewards 46.0\n",
      "============ 246 ===========\n",
      "33 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.2937 if cv>=-0.9505589485168457\n",
      "   +0.0055 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.9545 if pav<=0.1965594500303269\n",
      "   +0.9545 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   +0.0124 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -0.7757 if cv<=0.03450129479169846\n",
      "   +0.0000 if cp>=-0.041838707029819476\n",
      "   -0.0968 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +0.9545 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +2.5611 if pav<=0.2056886851787567\n",
      "   -0.4217 if cv<=0.16620478630065919 & pa>=0.09044390320777895 & pav>=0.346860420703888\n",
      "   +0.8581 if cp<=-0.057703081518411636 & pav<=0.3084956705570221\n",
      "--------------\n",
      "   +1.4430 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.8683 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -2.5196 if pav<=0.20378408133983614\n",
      "   -1.3099 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   +1.8568 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +0.2655 if cv<=0.0403841868042946 & cv>=-0.14140277206897736 & pa>=0.10822374373674395\n",
      "   +0.8857 if pav>=0.2056886851787567\n",
      "   -0.7519 if pa>=0.10946480780839923 & pav>=0.23868310153484348\n",
      "   -1.3125 if pa>=0.07558202743530275\n",
      "   +1.6483 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   -0.9886 if cv>=0.16620478630065919\n",
      "   -0.9827 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "Run episode 246 with rewards 33.0\n",
      "============ 247 ===========\n",
      "58 actions [0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.2512 if cv>=-0.9505589485168457\n",
      "   -0.3922 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +1.0639 if pav<=0.1965594500303269\n",
      "   +1.0639 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   +0.2512 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -1.7721 if cv<=0.03450129479169846\n",
      "   -0.4836 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +1.0639 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +1.0639 if pav<=0.2056886851787567\n",
      "   -0.7900 if cv<=0.16620478630065919 & pa>=0.09044390320777895 & pav>=0.346860420703888\n",
      "   +0.0000 if cp<=-0.057703081518411636 & pav<=0.3084956705570221\n",
      "   +0.4048 if cp<=0.005701047182083132 & pav<=0.08659504801034928\n",
      "--------------\n",
      "   +0.9460 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +1.3536 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -1.1635 if pav<=0.20378408133983614\n",
      "   -0.4503 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   +2.4051 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +0.8315 if pav>=0.2056886851787567\n",
      "   -0.9980 if pa>=0.10946480780839923 & pav>=0.23868310153484348\n",
      "   +0.0609 if pa>=0.07558202743530275\n",
      "   +0.8362 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   -1.6109 if cv>=0.16620478630065919\n",
      "   -1.5754 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   +0.2549 if pa<=0.13597341775894164\n",
      "Run episode 247 with rewards 58.0\n",
      "============ 248 ===========\n",
      "28 actions [0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1]\n",
      "   -0.2052 if cv>=-0.9505589485168457\n",
      "   -1.7675 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +1.4904 if pav<=0.1965594500303269\n",
      "   +1.4904 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   -1.2207 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -1.8566 if cv<=0.03450129479169846\n",
      "   +2.1311 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +1.4904 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +1.4904 if pav<=0.2056886851787567\n",
      "   -0.6455 if cv<=0.16620478630065919 & pa>=0.09044390320777895 & pav>=0.346860420703888\n",
      "   -0.8380 if cp<=0.005701047182083132 & pav<=0.08659504801034928\n",
      "   -6.5061 if cp>=-0.15046737790107725 & cv<=-0.17883082926273347 & pav<=0.40020589232444764\n",
      "--------------\n",
      "   +0.8983 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +2.1125 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -1.4642 if pav<=0.20378408133983614\n",
      "   +1.5451 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   +2.1125 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +0.7284 if pav>=0.2056886851787567\n",
      "   -0.6007 if pa>=0.10946480780839923 & pav>=0.23868310153484348\n",
      "   -2.1383 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   -1.4793 if cv>=0.16620478630065919\n",
      "   -1.3967 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   +0.3383 if pa<=0.13597341775894164\n",
      "   +6.7330 if cp>=-0.15046737790107725 & cv<=-0.17883082926273347 & pav<=0.32596146464347847\n",
      "Run episode 248 with rewards 28.0\n",
      "============ 249 ===========\n",
      "34 actions [1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1]\n",
      "   +2.1656 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +2.1655 if pav<=0.1965594500303269\n",
      "   +2.1655 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   -2.8555 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -4.8203 if cv<=0.03450129479169846\n",
      "   -0.0000 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   -0.0000 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +2.1655 if pav<=0.2056886851787567\n",
      "   -0.0000 if cv<=0.16620478630065919 & pa>=0.09044390320777895 & pav>=0.346860420703888\n",
      "   -0.0000 if cp<=0.005701047182083132 & pav<=0.08659504801034928\n",
      "   -0.6734 if cp>=-0.15046737790107725 & cv<=-0.17883082926273347 & pav<=0.40020589232444764\n",
      "   -3.3611 if pav<=-0.036212016269564586\n",
      "--------------\n",
      "   +0.0000 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.0000 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -3.0753 if pav<=0.20378408133983614\n",
      "   +3.0558 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   +0.0000 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +0.0000 if pav>=0.2056886851787567\n",
      "   -0.0000 if pa>=0.10946480780839923 & pav>=0.23868310153484348\n",
      "   +0.0000 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   -0.7780 if cv>=0.16620478630065919\n",
      "   -0.0000 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   +0.1081 if cp>=-0.15046737790107725 & cv<=-0.17883082926273347 & pav<=0.32596146464347847\n",
      "   +0.6062 if cp<=0.040608961135149\n",
      "Run episode 249 with rewards 34.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 250 ===========\n",
      "78 actions [0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1]\n",
      "   +0.3465 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +2.6785 if pav<=0.1965594500303269\n",
      "   +2.6785 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   -1.2105 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -2.7112 if cv<=0.03450129479169846\n",
      "   +0.0000 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +0.6651 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +2.6785 if pav<=0.2056886851787567\n",
      "   +0.0000 if cp<=0.005701047182083132 & pav<=0.08659504801034928\n",
      "   -0.1855 if cp>=-0.15046737790107725 & cv<=-0.17883082926273347 & pav<=0.40020589232444764\n",
      "   +0.1456 if pav<=-0.036212016269564586\n",
      "   -4.1244 if cp>=0.023621946945786478 & pav<=0.04777921736240387\n",
      "--------------\n",
      "   +0.3879 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +1.0103 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -5.1003 if pav<=0.20378408133983614\n",
      "   -1.6134 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   +1.0103 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   -0.3779 if pav>=0.2056886851787567\n",
      "   -1.1291 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   -1.3303 if cv>=0.16620478630065919\n",
      "   -1.3926 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   +0.0000 if cp>=-0.15046737790107725 & cv<=-0.17883082926273347 & pav<=0.32596146464347847\n",
      "   +4.2878 if cp<=0.040608961135149\n",
      "   +5.2771 if cv<=0.10320749878883427 & pav<=0.04777921736240387\n",
      "Run episode 250 with rewards 78.0\n",
      "============ 251 ===========\n",
      "76 actions [0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0]\n",
      "   -5.8629 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +1.1117 if pav<=0.1965594500303269\n",
      "   +0.3738 if cv<=0.3805105984210968 & pav<=0.1969979852437973\n",
      "   -4.6491 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +2.3482 if cv<=0.03450129479169846\n",
      "   -2.9391 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +2.7223 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +9.0277 if pav<=0.2056886851787567\n",
      "   +2.0484 if cp>=-0.15046737790107725 & cv<=-0.17883082926273347 & pav<=0.40020589232444764\n",
      "   +0.9899 if pav<=-0.036212016269564586\n",
      "   -1.6505 if cp>=0.023621946945786478 & pav<=0.04777921736240387\n",
      "   -5.2378 if cv<=0.00869258139282465 & pav<=-0.04230953976511955\n",
      "--------------\n",
      "   -2.9039 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -1.9843 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -3.4866 if pav<=0.20378408133983614\n",
      "   -0.7613 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   +4.0704 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +2.4918 if pav>=0.2056886851787567\n",
      "   -2.5928 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +0.3947 if cv>=0.16620478630065919\n",
      "   -3.0752 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   +4.9498 if cp<=0.040608961135149\n",
      "   +3.7768 if cv<=0.10320749878883427 & pav<=0.04777921736240387\n",
      "   -3.3608 if pa<=0.002238377509638667 & pav<=0.08278412222862244 & pav>=-0.04230953976511955\n",
      "Run episode 251 with rewards 76.0\n",
      "============ 252 ===========\n",
      "60 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0]\n",
      "   -2.1175 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +2.5902 if pav<=0.1965594500303269\n",
      "   -5.5675 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -3.1942 if cv<=0.03450129479169846\n",
      "   +1.6144 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +2.6997 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +8.4212 if pav<=0.2056886851787567\n",
      "   +2.8005 if cp>=-0.15046737790107725 & cv<=-0.17883082926273347 & pav<=0.40020589232444764\n",
      "   +2.3650 if pav<=-0.036212016269564586\n",
      "   -1.3301 if cp>=0.023621946945786478 & pav<=0.04777921736240387\n",
      "   -4.1949 if cv<=0.00869258139282465 & pav<=-0.04230953976511955\n",
      "   -6.1733 if cp>=0.017727350816130638 & cv>=0.11530930548906326 & pa>=-0.03741910308599472\n",
      "--------------\n",
      "   -1.3158 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.8995 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -4.3742 if pav<=0.20378408133983614\n",
      "   +0.3036 if cv<=0.03450129479169846 & pa<=0.08561319410800934\n",
      "   +0.8995 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +1.5462 if pav>=0.2056886851787567\n",
      "   +0.7202 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +0.3262 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   +0.5338 if cp<=0.040608961135149\n",
      "   +2.6947 if cv<=0.10320749878883427 & pav<=0.04777921736240387\n",
      "   -1.5547 if pa<=0.002238377509638667 & pav<=0.08278412222862244 & pav>=-0.04230953976511955\n",
      "   +7.0021 if cp>=0.017727350816130638 & pa>=-0.03741910308599472\n",
      "Run episode 252 with rewards 60.0\n",
      "============ 253 ===========\n",
      "36 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1]\n",
      "   -1.8245 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +3.2348 if pav<=0.1965594500303269\n",
      "   -1.8245 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -2.1683 if cv<=0.03450129479169846\n",
      "   +3.4681 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +3.2348 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +2.3265 if pav<=0.2056886851787567\n",
      "   -1.5078 if cp>=-0.15046737790107725 & cv<=-0.17883082926273347 & pav<=0.40020589232444764\n",
      "   -0.1211 if pav<=-0.036212016269564586\n",
      "   -0.4796 if cv<=0.00869258139282465 & pav<=-0.04230953976511955\n",
      "   +0.0000 if cp>=0.017727350816130638 & cv>=0.11530930548906326 & pa>=-0.03741910308599472\n",
      "   -3.0093 if pa>=-0.024793134629726408\n",
      "--------------\n",
      "   +0.4633 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +1.8838 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -0.6651 if pav<=0.20378408133983614\n",
      "   +1.8838 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +1.0034 if pav>=0.2056886851787567\n",
      "   +1.1974 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +0.3520 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   +1.5709 if cp<=0.040608961135149\n",
      "   +0.0925 if cv<=0.10320749878883427 & pav<=0.04777921736240387\n",
      "   -0.4857 if pa<=0.002238377509638667 & pav<=0.08278412222862244 & pav>=-0.04230953976511955\n",
      "   -0.0000 if cp>=0.017727350816130638 & pa>=-0.03741910308599472\n",
      "   -4.2100 if cp>=-0.040193236619234074 & pav<=0.17048296630382537\n",
      "Run episode 253 with rewards 36.0\n",
      "============ 254 ===========\n",
      "41 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   -0.9971 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +1.7053 if pav<=0.1965594500303269\n",
      "   -0.1643 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +0.2349 if cv<=0.03450129479169846\n",
      "   +0.4543 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +1.7041 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +1.7053 if pav<=0.2056886851787567\n",
      "   -0.0604 if cp>=-0.15046737790107725 & cv<=-0.17883082926273347 & pav<=0.40020589232444764\n",
      "   +1.1232 if pav<=-0.036212016269564586\n",
      "   +0.0000 if cv<=0.00869258139282465 & pav<=-0.04230953976511955\n",
      "   -0.1274 if pa>=-0.024793134629726408\n",
      "   +4.2134 if cp<=0.0018218799959868193 & cp>=0.0018218799959868193\n",
      "--------------\n",
      "   +0.1792 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.4521 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -1.9459 if pav<=0.20378408133983614\n",
      "   +0.4521 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +1.1327 if pav>=0.2056886851787567\n",
      "   +0.3430 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +0.5235 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   -0.7972 if cp<=0.040608961135149\n",
      "   -1.0769 if cv<=0.10320749878883427 & pav<=0.04777921736240387\n",
      "   +0.0000 if pa<=0.002238377509638667 & pav<=0.08278412222862244 & pav>=-0.04230953976511955\n",
      "   -1.3924 if cp>=-0.040193236619234074 & pav<=0.17048296630382537\n",
      "   -3.8003 if cv<=0.3347737193107605 & cv>=0.3347737193107605\n",
      "Run episode 254 with rewards 41.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 255 ===========\n",
      "43 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   -0.7536 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.7067 if pav<=0.1965594500303269\n",
      "   -0.8636 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +2.5847 if cv<=0.03450129479169846\n",
      "   -0.8789 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +0.7067 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +3.1997 if pav<=0.2056886851787567\n",
      "   -1.1305 if cp>=-0.15046737790107725 & cv<=-0.17883082926273347 & pav<=0.40020589232444764\n",
      "   -0.0000 if pav<=-0.036212016269564586\n",
      "   -0.8130 if pa>=-0.024793134629726408\n",
      "   -0.0000 if cp<=0.0018218799959868193 & cp>=0.0018218799959868193\n",
      "   -3.0131 if pa<=0.09274406731128694 & pav>=0.19923922419548035\n",
      "--------------\n",
      "   +4.7694 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   -0.0079 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   -1.3063 if pav<=0.20378408133983614\n",
      "   +0.1825 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +2.2871 if pav>=0.2056886851787567\n",
      "   -0.0323 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +1.5787 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   +0.9807 if cp<=0.040608961135149\n",
      "   -0.1603 if cv<=0.10320749878883427 & pav<=0.04777921736240387\n",
      "   -0.1863 if cp>=-0.040193236619234074 & pav<=0.17048296630382537\n",
      "   +0.0000 if cv<=0.3347737193107605 & cv>=0.3347737193107605\n",
      "   -3.0105 if cp>=-0.06900935620069504 & cv<=0.13640457391738892\n",
      "Run episode 255 with rewards 43.0\n",
      "============ 256 ===========\n",
      "68 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1]\n",
      "   -0.5528 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +3.2533 if pav<=0.1965594500303269\n",
      "   -1.1832 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -1.0714 if cv<=0.03450129479169846\n",
      "   +0.0000 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +0.6863 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +3.2533 if pav<=0.2056886851787567\n",
      "   +0.0000 if cp>=-0.15046737790107725 & cv<=-0.17883082926273347 & pav<=0.40020589232444764\n",
      "   -1.0679 if pa>=-0.024793134629726408\n",
      "   +0.0000 if cp<=0.0018218799959868193 & cp>=0.0018218799959868193\n",
      "   -0.6177 if pa<=0.09274406731128694 & pav>=0.19923922419548035\n",
      "   -6.3867 if cp>=0.030497316271066666 & cv<=0.24968084692955061 & pav<=0.16055078506469728 & pav>=0.04881138950586319\n",
      "--------------\n",
      "   +0.3079 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +0.2805 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +0.0466 if pav<=0.20378408133983614\n",
      "   +0.8290 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +5.9047 if pav>=0.2056886851787567\n",
      "   +0.0731 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   -3.0397 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   +2.1309 if cp<=0.040608961135149\n",
      "   -0.7905 if cv<=0.10320749878883427 & pav<=0.04777921736240387\n",
      "   +0.2933 if cp>=-0.040193236619234074 & pav<=0.17048296630382537\n",
      "   -3.2525 if cp>=-0.06900935620069504 & cv<=0.13640457391738892\n",
      "   -4.6285 if cp<=0.030497316271066666 & cv>=0.033948200196027754\n",
      "Run episode 256 with rewards 68.0\n",
      "============ 257 ===========\n",
      "39 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   -2.9047 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +3.8964 if pav<=0.1965594500303269\n",
      "   -0.4097 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +1.3415 if cv<=0.03450129479169846\n",
      "   -1.8829 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +1.9269 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +3.4356 if pav<=0.2056886851787567\n",
      "   +0.0000 if cp>=-0.15046737790107725 & cv<=-0.17883082926273347 & pav<=0.40020589232444764\n",
      "   -2.3365 if pa>=-0.024793134629726408\n",
      "   -0.8328 if pa<=0.09274406731128694 & pav>=0.19923922419548035\n",
      "   +0.0000 if cp>=0.030497316271066666 & cv<=0.24968084692955061 & pav<=0.16055078506469728 & pav>=0.04881138950586319\n",
      "   +5.0048 if cp<=0.005260068364441396 & pav>=-0.018511974811553953\n",
      "--------------\n",
      "   +0.0457 if pa<=0.09636197239160539 & pav>=0.23857961297035246\n",
      "   +1.6625 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +2.6827 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +2.0948 if pav>=0.2056886851787567\n",
      "   +1.5835 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   -0.1070 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   -1.0182 if cp<=0.040608961135149\n",
      "   -1.1679 if cv<=0.10320749878883427 & pav<=0.04777921736240387\n",
      "   -1.3621 if cp>=-0.040193236619234074 & pav<=0.17048296630382537\n",
      "   -0.6601 if cp>=-0.06900935620069504 & cv<=0.13640457391738892\n",
      "   -1.1731 if cp<=0.030497316271066666 & cv>=0.033948200196027754\n",
      "   -6.1470 if cp<=0.005260068364441396 & cv<=0.009726925473660233 & pa<=0.029399363696575167 & pav<=0.2283377468585968\n",
      "Run episode 257 with rewards 39.0\n",
      "============ 258 ===========\n",
      "35 actions [0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -0.8810 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +1.9188 if pav<=0.1965594500303269\n",
      "   -1.3192 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +1.9517 if cv<=0.03450129479169846\n",
      "   +0.2438 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +0.8342 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +4.0261 if pav<=0.2056886851787567\n",
      "   -2.1865 if pa>=-0.024793134629726408\n",
      "   +1.4238 if pa<=0.09274406731128694 & pav>=0.19923922419548035\n",
      "   +0.0000 if cp>=0.030497316271066666 & cv<=0.24968084692955061 & pav<=0.16055078506469728 & pav>=0.04881138950586319\n",
      "   +0.2821 if cp<=0.005260068364441396 & pav>=-0.018511974811553953\n",
      "   +1.5726 if cp<=0.005221730004996062\n",
      "--------------\n",
      "   -0.2438 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +2.2238 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +3.1620 if pav>=0.2056886851787567\n",
      "   -0.2958 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +0.3154 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   -0.7198 if cp<=0.040608961135149\n",
      "   -0.3964 if cv<=0.10320749878883427 & pav<=0.04777921736240387\n",
      "   -1.3928 if cp>=-0.040193236619234074 & pav<=0.17048296630382537\n",
      "   -0.7081 if cp>=-0.06900935620069504 & cv<=0.13640457391738892\n",
      "   -0.1180 if cp<=0.030497316271066666 & cv>=0.033948200196027754\n",
      "   +0.0000 if cp<=0.005260068364441396 & cv<=0.009726925473660233 & pa<=0.029399363696575167 & pav<=0.2283377468585968\n",
      "   +0.3075 if cv<=-0.047311995178461075\n",
      "Run episode 258 with rewards 35.0\n",
      "============ 259 ===========\n",
      "31 actions [0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +2.6945 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.8666 if pav<=0.1965594500303269\n",
      "   +2.6945 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +1.0027 if cv<=0.03450129479169846\n",
      "   -1.2047 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +0.8665 if cp<=0.021148857101798063 & pav<=0.19628315269947053\n",
      "   +3.5231 if pav<=0.2056886851787567\n",
      "   +2.7582 if pa>=-0.024793134629726408\n",
      "   +3.7769 if pa<=0.09274406731128694 & pav>=0.19923922419548035\n",
      "   -1.1353 if cp<=0.005260068364441396 & pav>=-0.018511974811553953\n",
      "   -1.1351 if cp<=0.005221730004996062\n",
      "   -5.6866 if cp>=-0.03722570091485977\n",
      "--------------\n",
      "   +0.5524 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +0.5524 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +2.9658 if pav>=0.2056886851787567\n",
      "   +0.5177 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +0.2983 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   +0.7765 if cp<=0.040608961135149\n",
      "   -0.0168 if cv<=0.10320749878883427 & pav<=0.04777921736240387\n",
      "   -0.0076 if cp>=-0.040193236619234074 & pav<=0.17048296630382537\n",
      "   -1.5750 if cp>=-0.06900935620069504 & cv<=0.13640457391738892\n",
      "   +0.2983 if cp<=0.030497316271066666 & cv>=0.033948200196027754\n",
      "   -1.2314 if cv<=-0.047311995178461075\n",
      "   +3.8467 if cp>=-0.03722570091485977\n",
      "Run episode 259 with rewards 31.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 260 ===========\n",
      "46 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   +1.7753 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +2.0649 if pav<=0.1965594500303269\n",
      "   +1.7753 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -0.4183 if cv<=0.03450129479169846\n",
      "   +0.1633 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +4.2260 if pav<=0.2056886851787567\n",
      "   +0.1633 if pa>=-0.024793134629726408\n",
      "   +1.9922 if pa<=0.09274406731128694 & pav>=0.19923922419548035\n",
      "   +0.1633 if cp<=0.005260068364441396 & pav>=-0.018511974811553953\n",
      "   +0.1633 if cp<=0.005221730004996062\n",
      "   -3.2344 if cp>=-0.03722570091485977\n",
      "   -0.3565 if cp<=-0.103976771235466\n",
      "--------------\n",
      "   +0.8550 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +2.4439 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +3.8072 if pav>=0.2056886851787567\n",
      "   +0.8550 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +0.2430 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   +0.3679 if cp<=0.040608961135149\n",
      "   -0.7301 if cv<=0.10320749878883427 & pav<=0.04777921736240387\n",
      "   -2.4541 if cp>=-0.06900935620069504 & cv<=0.13640457391738892\n",
      "   +0.2430 if cp<=0.030497316271066666 & cv>=0.033948200196027754\n",
      "   +0.1249 if cv<=-0.047311995178461075\n",
      "   +2.1420 if cp>=-0.03722570091485977\n",
      "   -1.7740 if cp<=-0.0375581718981266\n",
      "Run episode 260 with rewards 46.0\n",
      "============ 261 ===========\n",
      "73 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0]\n",
      "   +3.6303 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +2.4438 if pav<=0.1965594500303269\n",
      "   +0.9965 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -2.5135 if cv<=0.03450129479169846\n",
      "   -0.2316 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +2.4438 if pav<=0.2056886851787567\n",
      "   -1.4820 if pa>=-0.024793134629726408\n",
      "   -0.1304 if pa<=0.09274406731128694 & pav>=0.19923922419548035\n",
      "   +0.7332 if cp<=0.005260068364441396 & pav>=-0.018511974811553953\n",
      "   -1.4820 if cp>=-0.03722570091485977\n",
      "   +0.0000 if cp<=-0.103976771235466\n",
      "   +3.8804 if cv>=0.7561783194541931 & pav<=0.029311519116163254\n",
      "--------------\n",
      "   +1.4158 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +1.9310 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +4.8902 if pav>=0.2056886851787567\n",
      "   +1.4158 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +0.6792 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   -2.4173 if cp<=0.040608961135149\n",
      "   -0.9723 if cv<=0.10320749878883427 & pav<=0.04777921736240387\n",
      "   +0.8000 if cp>=-0.06900935620069504 & cv<=0.13640457391738892\n",
      "   +3.1776 if cp<=0.030497316271066666 & cv>=0.033948200196027754\n",
      "   +0.7427 if cp>=-0.03722570091485977\n",
      "   -0.0000 if cp<=-0.0375581718981266\n",
      "   +4.5097 if cv<=0.7561783194541931 & pa>=0.15191885828971863 & pav<=0.13706842064857483\n",
      "Run episode 261 with rewards 73.0\n",
      "============ 262 ===========\n",
      "58 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +4.7923 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +2.2989 if pav<=0.1965594500303269\n",
      "   -0.8958 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -2.6195 if cv<=0.03450129479169846\n",
      "   +0.9560 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +2.2989 if pav<=0.2056886851787567\n",
      "   -1.9973 if pa>=-0.024793134629726408\n",
      "   -0.5500 if pa<=0.09274406731128694 & pav>=0.19923922419548035\n",
      "   +1.3595 if cp<=0.005260068364441396 & pav>=-0.018511974811553953\n",
      "   -1.9742 if cp>=-0.03722570091485977\n",
      "   +2.3928 if cv>=0.7561783194541931 & pav<=0.029311519116163254\n",
      "   +2.5282 if pav<=0.08597432971000672\n",
      "--------------\n",
      "   +0.8368 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +1.0101 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +4.2077 if pav>=0.2056886851787567\n",
      "   +0.8368 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +2.2093 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   +1.4048 if cp<=0.040608961135149\n",
      "   -1.8778 if cv<=0.10320749878883427 & pav<=0.04777921736240387\n",
      "   -0.2891 if cp>=-0.06900935620069504 & cv<=0.13640457391738892\n",
      "   +1.0555 if cp<=0.030497316271066666 & cv>=0.033948200196027754\n",
      "   -0.3984 if cp>=-0.03722570091485977\n",
      "   +3.1222 if cv<=0.7561783194541931 & pa>=0.15191885828971863 & pav<=0.13706842064857483\n",
      "   -2.9672 if cv<=0.6890100955963137 & pa>=0.1195587769150734 & pav<=0.08597432971000672 & pav>=-0.012333278357982634\n",
      "Run episode 262 with rewards 58.0\n",
      "============ 263 ===========\n",
      "52 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0]\n",
      "   +6.3574 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +2.4720 if pav<=0.1965594500303269\n",
      "   +0.8284 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -0.6958 if cv<=0.03450129479169846\n",
      "   -0.0000 if cp<=0.006491147913038731 & pav>=0.005521969869732857\n",
      "   +2.4720 if pav<=0.2056886851787567\n",
      "   -2.6130 if pa>=-0.024793134629726408\n",
      "   -0.0000 if cp<=0.005260068364441396 & pav>=-0.018511974811553953\n",
      "   -2.6130 if cp>=-0.03722570091485977\n",
      "   +3.3393 if cv>=0.7561783194541931 & pav<=0.029311519116163254\n",
      "   -0.6485 if pav<=0.08597432971000672\n",
      "   +3.7604 if pav<=0.09953273385763169\n",
      "--------------\n",
      "   +1.0869 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +1.0869 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +4.7871 if pav>=0.2056886851787567\n",
      "   -1.0322 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +1.8741 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   -0.5662 if cp<=0.040608961135149\n",
      "   -0.4563 if cv<=0.10320749878883427 & pav<=0.04777921736240387\n",
      "   -0.0104 if cp<=0.030497316271066666 & cv>=0.033948200196027754\n",
      "   -0.0839 if cp>=-0.03722570091485977\n",
      "   +5.6611 if cv<=0.7561783194541931 & pa>=0.15191885828971863 & pav<=0.13706842064857483\n",
      "   -0.1236 if cv<=0.6890100955963137 & pa>=0.1195587769150734 & pav<=0.08597432971000672 & pav>=-0.012333278357982634\n",
      "   -1.1804 if pa<=0.15304531455039977\n",
      "Run episode 263 with rewards 52.0\n",
      "============ 264 ===========\n",
      "57 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +3.9183 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.3484 if pav<=0.1965594500303269\n",
      "   -0.8242 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -1.5350 if cv<=0.03450129479169846\n",
      "   +3.1755 if pav<=0.2056886851787567\n",
      "   -2.2895 if pa>=-0.024793134629726408\n",
      "   +1.7157 if cp<=0.005260068364441396 & pav>=-0.018511974811553953\n",
      "   -2.2895 if cp>=-0.03722570091485977\n",
      "   +1.9264 if cv>=0.7561783194541931 & pav<=0.029311519116163254\n",
      "   +1.1276 if pav<=0.08597432971000672\n",
      "   +1.1276 if pav<=0.09953273385763169\n",
      "   +3.2450 if cv>=0.5810786962509156 & pav<=0.11198783069849019\n",
      "--------------\n",
      "   +0.8088 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +1.9936 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +4.2527 if pav>=0.2056886851787567\n",
      "   +0.6752 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +0.9258 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   +0.1290 if cp<=0.040608961135149\n",
      "   -0.0311 if cv<=0.10320749878883427 & pav<=0.04777921736240387\n",
      "   +1.7036 if cp>=-0.03722570091485977\n",
      "   +4.5227 if cv<=0.7561783194541931 & pa>=0.15191885828971863 & pav<=0.13706842064857483\n",
      "   +0.9626 if cv<=0.6890100955963137 & pa>=0.1195587769150734 & pav<=0.08597432971000672 & pav>=-0.012333278357982634\n",
      "   -1.2035 if pa<=0.15304531455039977\n",
      "   -3.1494 if cp>=0.06707723289728168 & cv<=0.9042959451675421 & pav<=0.11198783069849019 & pav>=0.01181051544845105\n",
      "Run episode 264 with rewards 57.0\n",
      "============ 265 ===========\n",
      "100 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0]\n",
      "   +4.4230 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -0.1749 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -4.6436 if cv<=0.03450129479169846\n",
      "   +3.5373 if pav<=0.2056886851787567\n",
      "   +0.6345 if pa>=-0.024793134629726408\n",
      "   +0.0000 if cp<=0.005260068364441396 & pav>=-0.018511974811553953\n",
      "   +0.6345 if cp>=-0.03722570091485977\n",
      "   +2.5755 if cv>=0.7561783194541931 & pav<=0.029311519116163254\n",
      "   -0.8997 if pav<=0.08597432971000672\n",
      "   +0.0877 if pav<=0.09953273385763169\n",
      "   +0.1619 if cv>=0.5810786962509156 & pav<=0.11198783069849019\n",
      "   -4.8312 if pav>=0.105914668738842\n",
      "--------------\n",
      "   +0.0142 if cv<=0.017256867140531543 & pav>=0.1965594500303269\n",
      "   +0.0142 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +5.4925 if pav>=0.2056886851787567\n",
      "   +4.1391 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +1.9331 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   +0.1593 if cp<=0.040608961135149\n",
      "   -1.0318 if cp>=-0.03722570091485977\n",
      "   +6.0816 if cv<=0.7561783194541931 & pa>=0.15191885828971863 & pav<=0.13706842064857483\n",
      "   +0.1552 if cv<=0.6890100955963137 & pa>=0.1195587769150734 & pav<=0.08597432971000672 & pav>=-0.012333278357982634\n",
      "   -4.8150 if pa<=0.15304531455039977\n",
      "   +1.1654 if cp>=0.06707723289728168 & cv<=0.9042959451675421 & pav<=0.11198783069849019 & pav>=0.01181051544845105\n",
      "   +4.5333 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "Run episode 265 with rewards 100.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 266 ===========\n",
      "78 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1]\n",
      "   +0.6699 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.5389 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -5.1697 if cv<=0.03450129479169846\n",
      "   +0.4065 if pav<=0.2056886851787567\n",
      "   -0.2975 if pa>=-0.024793134629726408\n",
      "   +1.8966 if cp>=-0.03722570091485977\n",
      "   +0.8972 if cv>=0.7561783194541931 & pav<=0.029311519116163254\n",
      "   -1.7141 if pav<=0.08597432971000672\n",
      "   +3.5935 if pav<=0.09953273385763169\n",
      "   +1.0878 if cv>=0.5810786962509156 & pav<=0.11198783069849019\n",
      "   -5.5958 if pav>=0.105914668738842\n",
      "   +4.9048 if cv<=0.1721094608306885 & pav>=-0.04219573140144348\n",
      "--------------\n",
      "   +0.5798 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +0.3149 if pav>=0.2056886851787567\n",
      "   +1.2568 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +1.7538 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   -0.8970 if cp<=0.040608961135149\n",
      "   +0.4574 if cp>=-0.03722570091485977\n",
      "   +4.8583 if cv<=0.7561783194541931 & pa>=0.15191885828971863 & pav<=0.13706842064857483\n",
      "   -0.0612 if cv<=0.6890100955963137 & pa>=0.1195587769150734 & pav<=0.08597432971000672 & pav>=-0.012333278357982634\n",
      "   -5.2522 if pa<=0.15304531455039977\n",
      "   +0.0000 if cp>=0.06707723289728168 & cv<=0.9042959451675421 & pav<=0.11198783069849019 & pav>=0.01181051544845105\n",
      "   +8.7084 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +4.1558 if cv<=0.1721094608306885 & pa>=0.046401172131299975 & pav<=-0.04219573140144348\n",
      "Run episode 266 with rewards 78.0\n",
      "============ 267 ===========\n",
      "60 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +0.5321 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -1.3272 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -0.8570 if cv<=0.03450129479169846\n",
      "   +3.9783 if pav<=0.2056886851787567\n",
      "   +0.4099 if cp>=-0.03722570091485977\n",
      "   +2.1217 if cv>=0.7561783194541931 & pav<=0.029311519116163254\n",
      "   +0.0043 if pav<=0.08597432971000672\n",
      "   +0.0043 if pav<=0.09953273385763169\n",
      "   -0.1370 if cv>=0.5810786962509156 & pav<=0.11198783069849019\n",
      "   -5.3050 if pav>=0.105914668738842\n",
      "   -0.8570 if cv<=0.1721094608306885 & pav>=-0.04219573140144348\n",
      "   -1.7832 if pav>=0.5365146398544312\n",
      "--------------\n",
      "   +0.0508 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +4.2586 if pav>=0.2056886851787567\n",
      "   +0.0469 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   -0.7281 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   +0.0776 if cp<=0.040608961135149\n",
      "   +0.9505 if cp>=-0.03722570091485977\n",
      "   +5.2452 if cv<=0.7561783194541931 & pa>=0.15191885828971863 & pav<=0.13706842064857483\n",
      "   -0.0074 if cv<=0.6890100955963137 & pa>=0.1195587769150734 & pav<=0.08597432971000672 & pav>=-0.012333278357982634\n",
      "   -6.4929 if pa<=0.15304531455039977\n",
      "   +5.3003 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +0.0000 if cv<=0.1721094608306885 & pa>=0.046401172131299975 & pav<=-0.04219573140144348\n",
      "   +1.6759 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "Run episode 267 with rewards 60.0\n",
      "============ 268 ===========\n",
      "95 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   -0.8884 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -1.6054 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -0.1377 if cv<=0.03450129479169846\n",
      "   +5.6545 if pav<=0.2056886851787567\n",
      "   -1.2230 if cp>=-0.03722570091485977\n",
      "   +0.9927 if cv>=0.7561783194541931 & pav<=0.029311519116163254\n",
      "   +1.3661 if pav<=0.09953273385763169\n",
      "   -1.3139 if cv>=0.5810786962509156 & pav<=0.11198783069849019\n",
      "   -2.5891 if pav>=0.105914668738842\n",
      "   -0.6654 if cv<=0.1721094608306885 & pav>=-0.04219573140144348\n",
      "   +0.0000 if pav>=0.5365146398544312\n",
      "   -2.3541 if cv<=0.557355666160584 & pav<=0.238668030500412 & pav>=0.08675469905138018\n",
      "--------------\n",
      "   +0.0023 if cv<=0.03011201322078705 & pav>=0.20300064980983734\n",
      "   +3.0561 if pav>=0.2056886851787567\n",
      "   +0.7828 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   -1.0605 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   -1.3039 if cp<=0.040608961135149\n",
      "   -1.9423 if cp>=-0.03722570091485977\n",
      "   +4.3924 if cv<=0.7561783194541931 & pa>=0.15191885828971863 & pav<=0.13706842064857483\n",
      "   -0.0370 if cv<=0.6890100955963137 & pa>=0.1195587769150734 & pav<=0.08597432971000672 & pav>=-0.012333278357982634\n",
      "   -1.5271 if pa<=0.15304531455039977\n",
      "   +5.2216 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.4666 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   +3.4893 if cv>=0.557355666160584 & pav<=0.08675469905138018\n",
      "Run episode 268 with rewards 95.0\n",
      "============ 269 ===========\n",
      "106 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1]\n",
      "   -1.2531 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -0.6643 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +1.1830 if cv<=0.03450129479169846\n",
      "   +2.7443 if pav<=0.2056886851787567\n",
      "   -0.5409 if cp>=-0.03722570091485977\n",
      "   +2.1101 if cv>=0.7561783194541931 & pav<=0.029311519116163254\n",
      "   +2.5829 if pav<=0.09953273385763169\n",
      "   -2.6284 if cv>=0.5810786962509156 & pav<=0.11198783069849019\n",
      "   -3.6751 if pav>=0.105914668738842\n",
      "   -0.9277 if cv<=0.1721094608306885 & pav>=-0.04219573140144348\n",
      "   +0.1603 if cv<=0.557355666160584 & pav<=0.238668030500412 & pav>=0.08675469905138018\n",
      "   +5.0457 if cp<=0.017127060517668727 & pa>=0.14063940346240997 & pav<=0.20234745144844057 & pav>=0.07060452848672867\n",
      "--------------\n",
      "   +2.4443 if pav>=0.2056886851787567\n",
      "   +0.7900 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   -0.1941 if cv>=0.018803080543875698 & pa>=0.11857341229915619\n",
      "   -0.2385 if cp<=0.040608961135149\n",
      "   -2.5214 if cp>=-0.03722570091485977\n",
      "   +3.3060 if cv<=0.7561783194541931 & pa>=0.15191885828971863 & pav<=0.13706842064857483\n",
      "   +2.6214 if cv<=0.6890100955963137 & pa>=0.1195587769150734 & pav<=0.08597432971000672 & pav>=-0.012333278357982634\n",
      "   -3.0982 if pa<=0.15304531455039977\n",
      "   +5.3528 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -3.0626 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   +2.4349 if cv>=0.557355666160584 & pav<=0.08675469905138018\n",
      "   +4.8404 if pa<=0.14063940346240997\n",
      "Run episode 269 with rewards 106.0\n",
      "============ 270 ===========\n",
      "50 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1]\n",
      "   +0.4709 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -0.9672 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -0.2896 if cv<=0.03450129479169846\n",
      "   +0.7682 if pav<=0.2056886851787567\n",
      "   -2.6828 if cp>=-0.03722570091485977\n",
      "   +1.3055 if cv>=0.7561783194541931 & pav<=0.029311519116163254\n",
      "   +2.1933 if pav<=0.09953273385763169\n",
      "   -2.1760 if cv>=0.5810786962509156 & pav<=0.11198783069849019\n",
      "   -4.7068 if pav>=0.105914668738842\n",
      "   -0.0459 if cv<=0.1721094608306885 & pav>=-0.04219573140144348\n",
      "   +0.0000 if cp<=0.017127060517668727 & pa>=0.14063940346240997 & pav<=0.20234745144844057 & pav>=0.07060452848672867\n",
      "   +2.7418 if \n",
      "--------------\n",
      "   -0.6246 if pav>=0.2056886851787567\n",
      "   +1.8036 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +0.7337 if cp<=0.040608961135149\n",
      "   -1.2652 if cp>=-0.03722570091485977\n",
      "   -0.0000 if cv<=0.7561783194541931 & pa>=0.15191885828971863 & pav<=0.13706842064857483\n",
      "   +5.3354 if cv<=0.6890100955963137 & pa>=0.1195587769150734 & pav<=0.08597432971000672 & pav>=-0.012333278357982634\n",
      "   -2.0210 if pa<=0.15304531455039977\n",
      "   +7.1465 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -2.0210 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   +1.3392 if cv>=0.557355666160584 & pav<=0.08675469905138018\n",
      "   +0.8852 if pa<=0.14063940346240997\n",
      "   -0.9696 if \n",
      "Run episode 270 with rewards 50.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 271 ===========\n",
      "91 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0]\n",
      "   -2.8786 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.4963 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -1.2931 if cv<=0.03450129479169846\n",
      "   +1.9044 if pav<=0.2056886851787567\n",
      "   +0.1903 if cp>=-0.03722570091485977\n",
      "   -0.0000 if cv>=0.7561783194541931 & pav<=0.029311519116163254\n",
      "   +3.2098 if pav<=0.09953273385763169\n",
      "   -0.0000 if cv>=0.5810786962509156 & pav<=0.11198783069849019\n",
      "   -3.4352 if pav>=0.105914668738842\n",
      "   +1.5593 if cv<=0.1721094608306885 & pav>=-0.04219573140144348\n",
      "   -0.2254 if \n",
      "   +2.0449 if cp>=0.06594289988279346 & pav<=0.3538276195526123\n",
      "--------------\n",
      "   -0.1503 if pav>=0.2056886851787567\n",
      "   +0.5528 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +0.5206 if cp<=0.040608961135149\n",
      "   -3.2868 if cp>=-0.03722570091485977\n",
      "   -0.0046 if cv<=0.6890100955963137 & pa>=0.1195587769150734 & pav<=0.08597432971000672 & pav>=-0.012333278357982634\n",
      "   +0.9916 if pa<=0.15304531455039977\n",
      "   +3.4399 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -0.8331 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   -0.0285 if cv>=0.557355666160584 & pav<=0.08675469905138018\n",
      "   +1.9309 if pa<=0.14063940346240997\n",
      "   -3.8663 if \n",
      "   +2.1890 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "Run episode 271 with rewards 91.0\n",
      "============ 272 ===========\n",
      "44 actions [0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1]\n",
      "   -0.5320 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.1343 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -0.8520 if cv<=0.03450129479169846\n",
      "   +2.7991 if pav<=0.2056886851787567\n",
      "   -0.5957 if cp>=-0.03722570091485977\n",
      "   +2.1428 if pav<=0.09953273385763169\n",
      "   +0.0001 if cv>=0.5810786962509156 & pav<=0.11198783069849019\n",
      "   -6.0903 if pav>=0.105914668738842\n",
      "   -0.9070 if cv<=0.1721094608306885 & pav>=-0.04219573140144348\n",
      "   +2.0966 if \n",
      "   +0.0000 if cp>=0.06594289988279346 & pav<=0.3538276195526123\n",
      "   -2.9728 if cp>=0.004493808373808861 & pa>=0.11971680819988251 & pav<=0.18589775264263153 & pav>=0.08981578797101974\n",
      "--------------\n",
      "   +0.9657 if pav>=0.2056886851787567\n",
      "   +0.8743 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   -0.9394 if cp<=0.040608961135149\n",
      "   -2.9353 if cp>=-0.03722570091485977\n",
      "   -0.8121 if pa<=0.15304531455039977\n",
      "   +5.5361 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -0.8121 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   -0.0714 if cv>=0.557355666160584 & pav<=0.08675469905138018\n",
      "   -0.1212 if pa<=0.14063940346240997\n",
      "   -1.2858 if \n",
      "   +2.6514 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -4.7078 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "Run episode 272 with rewards 44.0\n",
      "============ 273 ===========\n",
      "53 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1]\n",
      "   +0.8896 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.7749 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +0.3695 if cv<=0.03450129479169846\n",
      "   +1.2438 if pav<=0.2056886851787567\n",
      "   -2.1407 if cp>=-0.03722570091485977\n",
      "   +2.1431 if pav<=0.09953273385763169\n",
      "   +0.3470 if cv>=0.5810786962509156 & pav<=0.11198783069849019\n",
      "   -3.1310 if pav>=0.105914668738842\n",
      "   -0.3281 if cv<=0.1721094608306885 & pav>=-0.04219573140144348\n",
      "   -0.9880 if \n",
      "   -0.0231 if cp>=0.004493808373808861 & pa>=0.11971680819988251 & pav<=0.18589775264263153 & pav>=0.08981578797101974\n",
      "   +1.9506 if pav>=0.23533811569213875\n",
      "--------------\n",
      "   -1.5203 if pav>=0.2056886851787567\n",
      "   +0.4797 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +0.0494 if cp<=0.040608961135149\n",
      "   -1.1147 if cp>=-0.03722570091485977\n",
      "   +0.0494 if pa<=0.15304531455039977\n",
      "   +3.3411 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +0.0825 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   -0.6867 if pa<=0.14063940346240997\n",
      "   -0.4541 if \n",
      "   +0.4056 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.2366 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -4.7125 if cp<=0.041698040068149554 & cv>=0.28142417073249876 & pav<=0.35831599235534667 & pav>=0.23533811569213875\n",
      "Run episode 273 with rewards 53.0\n",
      "============ 274 ===========\n",
      "102 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0]\n",
      "   +0.5512 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -4.3889 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -2.1763 if cv<=0.03450129479169846\n",
      "   +1.2495 if pav<=0.2056886851787567\n",
      "   +0.8594 if cp>=-0.03722570091485977\n",
      "   +3.3480 if pav<=0.09953273385763169\n",
      "   +0.0000 if cv>=0.5810786962509156 & pav<=0.11198783069849019\n",
      "   -2.4887 if pav>=0.105914668738842\n",
      "   +2.6373 if cv<=0.1721094608306885 & pav>=-0.04219573140144348\n",
      "   +0.8594 if \n",
      "   -0.3824 if pav>=0.23533811569213875\n",
      "   -4.5309 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "--------------\n",
      "   -0.8867 if pav>=0.2056886851787567\n",
      "   +2.3853 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +2.5650 if cp<=0.040608961135149\n",
      "   -0.9614 if cp>=-0.03722570091485977\n",
      "   +4.6367 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -0.4168 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   -0.4168 if pa<=0.14063940346240997\n",
      "   -0.9614 if \n",
      "   -0.6519 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.5938 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -0.0000 if cp<=0.041698040068149554 & cv>=0.28142417073249876 & pav<=0.35831599235534667 & pav>=0.23533811569213875\n",
      "   -3.6035 if pa<=0.06150407791137695 & pav<=0.08987991958856582\n",
      "Run episode 274 with rewards 102.0\n",
      "============ 275 ===========\n",
      "71 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -0.6017 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -3.4863 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -2.4966 if cv<=0.03450129479169846\n",
      "   +2.9534 if pav<=0.2056886851787567\n",
      "   +0.1421 if cp>=-0.03722570091485977\n",
      "   +3.2864 if pav<=0.09953273385763169\n",
      "   -1.2164 if pav>=0.105914668738842\n",
      "   +1.0506 if cv<=0.1721094608306885 & pav>=-0.04219573140144348\n",
      "   +2.0697 if \n",
      "   -0.4975 if pav>=0.23533811569213875\n",
      "   -6.0633 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -5.9984 if cp<=-0.04450223147869108 & pa>=0.10005136281251911\n",
      "--------------\n",
      "   -0.8647 if pav>=0.2056886851787567\n",
      "   +5.3319 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +2.4761 if cp<=0.040608961135149\n",
      "   +0.0079 if cp>=-0.03722570091485977\n",
      "   +2.7278 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -3.2644 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   +1.9472 if pa<=0.14063940346240997\n",
      "   -1.9655 if \n",
      "   +2.7068 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.9027 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -5.3549 if pa<=0.06150407791137695 & pav<=0.08987991958856582\n",
      "   +5.1385 if cp<=-0.04450223147869108 & cv<=0.35752863287925724 & pa>=0.10005136281251911\n",
      "Run episode 275 with rewards 71.0\n",
      "============ 276 ===========\n",
      "98 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1]\n",
      "   -0.4088 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -2.4535 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   -0.9456 if cv<=0.03450129479169846\n",
      "   +2.5937 if pav<=0.2056886851787567\n",
      "   +2.0678 if pav<=0.09953273385763169\n",
      "   -1.1023 if pav>=0.105914668738842\n",
      "   -0.9456 if cv<=0.1721094608306885 & pav>=-0.04219573140144348\n",
      "   +1.2282 if \n",
      "   -1.2952 if pav>=0.23533811569213875\n",
      "   -5.1942 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.0000 if cp<=-0.04450223147869108 & pa>=0.10005136281251911\n",
      "   +3.3920 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "--------------\n",
      "   +1.1482 if pav>=0.2056886851787567\n",
      "   +0.3388 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +2.9009 if cp<=0.040608961135149\n",
      "   +3.3970 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -3.8248 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   +2.7639 if pa<=0.14063940346240997\n",
      "   -2.5487 if \n",
      "   +3.2446 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.5933 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -1.1422 if pa<=0.06150407791137695 & pav<=0.08987991958856582\n",
      "   +0.0000 if cp<=-0.04450223147869108 & cv<=0.35752863287925724 & pa>=0.10005136281251911\n",
      "   -3.8362 if cv<=0.5580800771713257 & cv>=0.21216811239719494 & pav<=0.08475706726312637 & pav>=0.005486564245074987\n",
      "Run episode 276 with rewards 98.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 277 ===========\n",
      "51 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0]\n",
      "   +0.6273 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   -0.8880 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +0.0372 if cv<=0.03450129479169846\n",
      "   +0.8021 if pav<=0.2056886851787567\n",
      "   +4.0416 if pav<=0.09953273385763169\n",
      "   -2.7426 if pav>=0.105914668738842\n",
      "   +0.6681 if cv<=0.1721094608306885 & pav>=-0.04219573140144348\n",
      "   +1.5320 if \n",
      "   -3.0163 if pav>=0.23533811569213875\n",
      "   -0.3694 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -1.3926 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   -0.8890 if pav>=0.5489321947097778\n",
      "--------------\n",
      "   -0.7893 if pav>=0.2056886851787567\n",
      "   +1.9880 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +0.2684 if cp<=0.040608961135149\n",
      "   +6.4719 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +0.3081 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   +0.6458 if pa<=0.14063940346240997\n",
      "   -3.5680 if \n",
      "   +3.4729 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.1970 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -2.0330 if pa<=0.06150407791137695 & pav<=0.08987991958856582\n",
      "   -0.1941 if cv<=0.5580800771713257 & cv>=0.21216811239719494 & pav<=0.08475706726312637 & pav>=0.005486564245074987\n",
      "   +1.2803 if pav>=0.5489321947097778\n",
      "Run episode 277 with rewards 51.0\n",
      "============ 278 ===========\n",
      "57 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +0.6212 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.7122 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +1.2195 if pav<=0.2056886851787567\n",
      "   +1.2695 if pav<=0.09953273385763169\n",
      "   -2.0601 if pav>=0.105914668738842\n",
      "   +0.1783 if cv<=0.1721094608306885 & pav>=-0.04219573140144348\n",
      "   -0.7906 if \n",
      "   -1.9139 if pav>=0.23533811569213875\n",
      "   -1.1774 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -0.2186 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   -0.2681 if pav>=0.5489321947097778\n",
      "   +2.0317 if pav<=0.257626473903656\n",
      "--------------\n",
      "   -0.0171 if pav>=0.2056886851787567\n",
      "   +0.7380 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   -0.2694 if cp<=0.040608961135149\n",
      "   +2.6418 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.4127 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   -0.5091 if pa<=0.14063940346240997\n",
      "   -1.6453 if \n",
      "   +2.3817 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.0324 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -0.5180 if pa<=0.06150407791137695 & pav<=0.08987991958856582\n",
      "   +0.3120 if pav>=0.5489321947097778\n",
      "   -2.5051 if cv<=0.5097461342811584 & cv>=0.5097461342811584\n",
      "Run episode 278 with rewards 57.0\n",
      "============ 279 ===========\n",
      "60 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1]\n",
      "   -0.0002 if cp>=-0.046283074468374236 & pa<=0.14660244584083557\n",
      "   +0.5646 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +0.8629 if pav<=0.2056886851787567\n",
      "   +5.5652 if pav<=0.09953273385763169\n",
      "   +0.2338 if pav>=0.105914668738842\n",
      "   -1.4156 if \n",
      "   -2.0522 if pav>=0.23533811569213875\n",
      "   -2.3605 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.4407 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   -0.5023 if pav>=0.5489321947097778\n",
      "   +0.3949 if pav<=0.257626473903656\n",
      "   +2.9979 if cp>=0.07980440855026251 & cv>=0.5254972457885743 & pav<=0.34364643692970276 & pav>=0.1001829504966736 & pav>=0.24480353593826304\n",
      "--------------\n",
      "   +0.2051 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   -0.8394 if cp<=0.040608961135149\n",
      "   +4.0917 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +0.6830 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   -1.1387 if pa<=0.14063940346240997\n",
      "   -0.8218 if \n",
      "   +3.1804 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -3.9135 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -0.5084 if pa<=0.06150407791137695 & pav<=0.08987991958856582\n",
      "   +0.7726 if pav>=0.5489321947097778\n",
      "   -0.0000 if cv<=0.5097461342811584 & cv>=0.5097461342811584\n",
      "   +2.8450 if cp>=0.07980440855026251 & pav<=0.24480353593826304 & pav>=0.1001829504966736\n",
      "Run episode 279 with rewards 60.0\n",
      "============ 280 ===========\n",
      "54 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -0.4159 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +1.1400 if pav<=0.2056886851787567\n",
      "   +2.0641 if pav<=0.09953273385763169\n",
      "   -3.2361 if pav>=0.105914668738842\n",
      "   -0.1626 if \n",
      "   -1.2779 if pav>=0.23533811569213875\n",
      "   -1.3863 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -0.9767 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   +0.2314 if pav>=0.5489321947097778\n",
      "   +3.2233 if pav<=0.257626473903656\n",
      "   -0.0000 if cp>=0.07980440855026251 & cv>=0.5254972457885743 & pav<=0.34364643692970276 & pav>=0.1001829504966736 & pav>=0.24480353593826304\n",
      "   +0.4223 if pa>=0.06612473875284196 & pav>=0.3398247003555298\n",
      "--------------\n",
      "   +0.1314 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +0.8815 if cp<=0.040608961135149\n",
      "   +5.1024 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -1.2815 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   -1.4948 if pa<=0.14063940346240997\n",
      "   -1.2850 if \n",
      "   +3.7118 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.7567 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -0.0516 if pa<=0.06150407791137695 & pav<=0.08987991958856582\n",
      "   +0.0272 if pav>=0.5489321947097778\n",
      "   -0.6955 if cp>=0.07980440855026251 & pav<=0.24480353593826304 & pav>=0.1001829504966736\n",
      "   -0.2870 if cp<=0.05793148428201678 & pav<=0.10098131746053696\n",
      "Run episode 280 with rewards 54.0\n",
      "============ 281 ===========\n",
      "75 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0]\n",
      "   +0.6463 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +0.1586 if pav<=0.2056886851787567\n",
      "   +1.9278 if pav<=0.09953273385763169\n",
      "   -1.6435 if pav>=0.105914668738842\n",
      "   +0.2844 if \n",
      "   -1.5450 if pav>=0.23533811569213875\n",
      "   -0.2771 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -2.3111 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   +0.0505 if pav>=0.5489321947097778\n",
      "   +2.2110 if pav<=0.257626473903656\n",
      "   -2.7467 if pa>=0.06612473875284196 & pav>=0.3398247003555298\n",
      "   -0.0229 if cp<=0.10656930357217793 & cv<=0.2186855971813202 & pav>=0.020451548323035244\n",
      "--------------\n",
      "   +0.0137 if cv<=0.007520409114658835 & pav>=0.09132880419492723\n",
      "   +1.5781 if cp<=0.040608961135149\n",
      "   +3.7658 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -1.4326 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   -2.1235 if pa<=0.14063940346240997\n",
      "   -0.4861 if \n",
      "   +3.5018 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -3.5827 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -0.2594 if pa<=0.06150407791137695 & pav<=0.08987991958856582\n",
      "   -2.9282 if cp>=0.07980440855026251 & pav<=0.24480353593826304 & pav>=0.1001829504966736\n",
      "   -0.5566 if cp<=0.05793148428201678 & pav<=0.10098131746053696\n",
      "   +1.6358 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "Run episode 281 with rewards 75.0\n",
      "============ 282 ===========\n",
      "71 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1]\n",
      "   +0.8242 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +1.4617 if pav<=0.2056886851787567\n",
      "   +2.4707 if pav<=0.09953273385763169\n",
      "   -2.2926 if pav>=0.105914668738842\n",
      "   +0.1781 if \n",
      "   -0.4859 if pav>=0.23533811569213875\n",
      "   -0.7450 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -1.0172 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   -0.3502 if pav>=0.5489321947097778\n",
      "   -1.4722 if pav<=0.257626473903656\n",
      "   -1.1112 if pa>=0.06612473875284196 & pav>=0.3398247003555298\n",
      "   +0.9591 if pav<=0.22125779688358307\n",
      "--------------\n",
      "   +1.2664 if cp<=0.040608961135149\n",
      "   +4.9286 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -2.6357 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   +1.5169 if pa<=0.14063940346240997\n",
      "   -1.8188 if \n",
      "   +2.8115 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.6574 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -0.6692 if pa<=0.06150407791137695 & pav<=0.08987991958856582\n",
      "   +0.0886 if cp>=0.07980440855026251 & pav<=0.24480353593826304 & pav>=0.1001829504966736\n",
      "   -1.4692 if cp<=0.05793148428201678 & pav<=0.10098131746053696\n",
      "   +2.2629 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "   -0.0319 if cp>=0.045958375930786145 & pav<=0.08072272837162023\n",
      "Run episode 282 with rewards 71.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 283 ===========\n",
      "40 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1]\n",
      "   -0.3150 if cp<=0.04477308690547943 & cp>=-0.048945702612400055\n",
      "   +0.9557 if pav<=0.2056886851787567\n",
      "   +2.0657 if pav<=0.09953273385763169\n",
      "   -2.0843 if pav>=0.105914668738842\n",
      "   -0.9329 if pav>=0.23533811569213875\n",
      "   -1.0114 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -0.5842 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   +0.4785 if pav>=0.5489321947097778\n",
      "   +0.4987 if pav<=0.257626473903656\n",
      "   +1.5721 if pa>=0.06612473875284196 & pav>=0.3398247003555298\n",
      "   +0.9172 if pav<=0.22125779688358307\n",
      "   +2.2435 if cp>=0.13051024079322815\n",
      "--------------\n",
      "   +0.2269 if cp<=0.040608961135149\n",
      "   +3.3495 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +0.9989 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   -0.2311 if pa<=0.14063940346240997\n",
      "   -2.6221 if \n",
      "   +2.1027 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.3064 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -0.6737 if pa<=0.06150407791137695 & pav<=0.08987991958856582\n",
      "   +0.0000 if cp>=0.07980440855026251 & pav<=0.24480353593826304 & pav>=0.1001829504966736\n",
      "   -2.1471 if cp<=0.05793148428201678 & pav<=0.10098131746053696\n",
      "   +0.0998 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "   -0.0083 if cv>=0.7201533913612366\n",
      "Run episode 283 with rewards 40.0\n",
      "============ 284 ===========\n",
      "54 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0]\n",
      "   +0.7852 if pav<=0.2056886851787567\n",
      "   +1.7595 if pav<=0.09953273385763169\n",
      "   -2.1247 if pav>=0.105914668738842\n",
      "   -0.6517 if pav>=0.23533811569213875\n",
      "   -0.8541 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -0.8380 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   +1.4303 if pav>=0.5489321947097778\n",
      "   +0.2865 if pav<=0.257626473903656\n",
      "   +3.1903 if pa>=0.06612473875284196 & pav>=0.3398247003555298\n",
      "   +0.7852 if pav<=0.22125779688358307\n",
      "   +2.8304 if cp>=0.13051024079322815\n",
      "   -2.1669 if pav>=1.0563424825668335\n",
      "--------------\n",
      "   +1.4331 if cp<=0.040608961135149\n",
      "   +3.8814 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -1.8910 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   +0.7886 if pa<=0.14063940346240997\n",
      "   -1.4982 if \n",
      "   +0.3421 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.5193 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -0.3388 if pa<=0.06150407791137695 & pav<=0.08987991958856582\n",
      "   -1.7486 if cp<=0.05793148428201678 & pav<=0.10098131746053696\n",
      "   +0.3157 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "   +0.0000 if cv>=0.7201533913612366\n",
      "   +2.1121 if cv>=0.1876391649246216 & pa<=0.13063086569309235 & pav>=0.11686329841613774\n",
      "Run episode 284 with rewards 54.0\n",
      "============ 285 ===========\n",
      "62 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +0.1846 if pav<=0.2056886851787567\n",
      "   +1.8659 if pav<=0.09953273385763169\n",
      "   -3.9403 if pav>=0.105914668738842\n",
      "   +0.6798 if pav>=0.23533811569213875\n",
      "   -1.4660 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -0.1495 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   +0.2196 if pav>=0.5489321947097778\n",
      "   -0.0473 if pa>=0.06612473875284196 & pav>=0.3398247003555298\n",
      "   +0.0284 if pav<=0.22125779688358307\n",
      "   +0.2196 if cp>=0.13051024079322815\n",
      "   -3.8376 if pav>=1.0563424825668335\n",
      "   +2.4984 if pav<=0.24758950173854832\n",
      "--------------\n",
      "   -1.1146 if cp<=0.040608961135149\n",
      "   +4.0344 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -0.8655 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   -1.1263 if pa<=0.14063940346240997\n",
      "   -0.4428 if \n",
      "   +4.7634 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.3523 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -0.2883 if pa<=0.06150407791137695 & pav<=0.08987991958856582\n",
      "   -1.1347 if cp<=0.05793148428201678 & pav<=0.10098131746053696\n",
      "   +1.5350 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "   +0.0393 if cv>=0.1876391649246216 & pa<=0.13063086569309235 & pav>=0.11686329841613774\n",
      "   +3.8353 if cp>=0.15692393481731415\n",
      "Run episode 285 with rewards 62.0\n",
      "============ 286 ===========\n",
      "117 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +0.5516 if pav<=0.2056886851787567\n",
      "   -0.0835 if pav<=0.09953273385763169\n",
      "   -6.4236 if pav>=0.105914668738842\n",
      "   -2.1797 if pav>=0.23533811569213875\n",
      "   +1.8611 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +1.4582 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   -0.1248 if pav>=0.5489321947097778\n",
      "   -0.9545 if pa>=0.06612473875284196 & pav>=0.3398247003555298\n",
      "   +3.7730 if cp>=0.13051024079322815\n",
      "   -0.0000 if pav>=1.0563424825668335\n",
      "   -1.0468 if pav<=0.24758950173854832\n",
      "   +4.2324 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "--------------\n",
      "   +0.5717 if cp<=0.040608961135149\n",
      "   +2.3491 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -0.8870 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   -0.8870 if pa<=0.14063940346240997\n",
      "   +2.1091 if \n",
      "   +3.8436 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.8405 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -0.1271 if pa<=0.06150407791137695 & pav<=0.08987991958856582\n",
      "   -0.5970 if cp<=0.05793148428201678 & pav<=0.10098131746053696\n",
      "   +3.9193 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "   +2.7725 if cp>=0.15692393481731415\n",
      "   -3.8909 if pa<=0.17110725343227387\n",
      "Run episode 286 with rewards 117.0\n",
      "============ 287 ===========\n",
      "122 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   +2.2634 if pav<=0.2056886851787567\n",
      "   -0.8395 if pav<=0.09953273385763169\n",
      "   -6.9870 if pav>=0.105914668738842\n",
      "   -2.2999 if pav>=0.23533811569213875\n",
      "   +2.3436 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -2.2757 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   +0.0000 if pav>=0.5489321947097778\n",
      "   -0.1735 if pa>=0.06612473875284196 & pav>=0.3398247003555298\n",
      "   -2.4393 if cp>=0.13051024079322815\n",
      "   +1.9964 if pav<=0.24758950173854832\n",
      "   +5.5395 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   +3.9270 if cp<=0.4724173963069918 & cv>=1.3031113386154176 & pa>=0.17070786356925965\n",
      "--------------\n",
      "   +0.6331 if cp<=0.040608961135149\n",
      "   +3.6553 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -4.4583 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   +3.0345 if pa<=0.14063940346240997\n",
      "   +1.6584 if \n",
      "   +4.0696 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +0.6450 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -0.4256 if cp<=0.05793148428201678 & pav<=0.10098131746053696\n",
      "   +2.3408 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "   +6.1063 if cp>=0.15692393481731415\n",
      "   -5.5685 if pa<=0.17110725343227387\n",
      "   -4.5869 if cp<=0.4724173963069918 & cv>=1.3031113386154176 & pa>=0.17070786356925965 & pav<=-0.07766690254211425\n",
      "Run episode 287 with rewards 122.0\n",
      "============ 288 ===========\n",
      "100 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +2.1788 if pav<=0.2056886851787567\n",
      "   +0.0006 if pav<=0.09953273385763169\n",
      "   -6.7740 if pav>=0.105914668738842\n",
      "   -4.5892 if pav>=0.23533811569213875\n",
      "   +1.4162 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -0.0104 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   -0.2919 if pa>=0.06612473875284196 & pav>=0.3398247003555298\n",
      "   -3.7614 if cp>=0.13051024079322815\n",
      "   +1.6801 if pav<=0.24758950173854832\n",
      "   +4.7259 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   +3.4836 if cp<=0.4724173963069918 & cv>=1.3031113386154176 & pa>=0.17070786356925965\n",
      "   +3.1231 if cp>=0.03198039643466477 & cv>=0.37345741391181947\n",
      "--------------\n",
      "   +3.2807 if cp<=0.040608961135149\n",
      "   -0.8540 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -1.9836 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   -1.1179 if pa<=0.14063940346240997\n",
      "   +2.8321 if \n",
      "   +4.8765 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +0.8152 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -0.9080 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "   +3.3330 if cp>=0.15692393481731415\n",
      "   -5.4425 if pa<=0.17110725343227387\n",
      "   -4.5161 if cp<=0.4724173963069918 & cv>=1.3031113386154176 & pa>=0.17070786356925965 & pav<=-0.07766690254211425\n",
      "   +0.4132 if cp<=0.4015715777873995 & pa<=0.15495550334453584 & pav<=0.15249298810958864\n",
      "Run episode 288 with rewards 100.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 289 ===========\n",
      "49 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1]\n",
      "   +2.3957 if pav<=0.2056886851787567\n",
      "   -8.1489 if pav>=0.105914668738842\n",
      "   -1.9322 if pav>=0.23533811569213875\n",
      "   -1.2879 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +1.4636 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   -0.2586 if pa>=0.06612473875284196 & pav>=0.3398247003555298\n",
      "   -3.1785 if cp>=0.13051024079322815\n",
      "   +1.4287 if pav<=0.24758950173854832\n",
      "   +1.9195 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   +2.7922 if cp<=0.4724173963069918 & cv>=1.3031113386154176 & pa>=0.17070786356925965\n",
      "   +3.5442 if cp>=0.03198039643466477 & cv>=0.37345741391181947\n",
      "   +5.4514 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "--------------\n",
      "   +3.4933 if cp<=0.040608961135149\n",
      "   +1.5873 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -4.1169 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   -0.3468 if pa<=0.14063940346240997\n",
      "   +2.5466 if \n",
      "   +2.6821 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +0.9334 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -4.8614 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "   +3.8633 if cp>=0.15692393481731415\n",
      "   -3.2437 if pa<=0.17110725343227387\n",
      "   -2.9528 if cp<=0.4724173963069918 & cv>=1.3031113386154176 & pa>=0.17070786356925965 & pav<=-0.07766690254211425\n",
      "   -4.8067 if cp<=0.07832173407077793 & cp>=-0.04069655835628509 & cv>=0.21187072694301606 & pav>=0.06272657662630081\n",
      "Run episode 289 with rewards 49.0\n",
      "============ 290 ===========\n",
      "115 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0]\n",
      "   +0.5278 if pav<=0.2056886851787567\n",
      "   -2.8853 if pav>=0.105914668738842\n",
      "   -1.3847 if pav>=0.23533811569213875\n",
      "   +0.4732 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -1.5644 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   +1.1761 if cp>=0.13051024079322815\n",
      "   +1.4688 if pav<=0.24758950173854832\n",
      "   +2.9206 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -0.0000 if cp<=0.4724173963069918 & cv>=1.3031113386154176 & pa>=0.17070786356925965\n",
      "   +1.4047 if cp>=0.03198039643466477 & cv>=0.37345741391181947\n",
      "   +3.3078 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +0.9338 if pa<=0.05473344698548318\n",
      "--------------\n",
      "   +2.0028 if cp<=0.040608961135149\n",
      "   +0.3378 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -1.2317 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   +0.0435 if \n",
      "   +0.5839 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.6600 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -0.5872 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "   -0.0000 if cp>=0.15692393481731415\n",
      "   -1.4323 if pa<=0.17110725343227387\n",
      "   -0.0000 if cp<=0.4724173963069918 & cv>=1.3031113386154176 & pa>=0.17070786356925965 & pav<=-0.07766690254211425\n",
      "   -3.2199 if cp<=0.07832173407077793 & cp>=-0.04069655835628509 & cv>=0.21187072694301606 & pav>=0.06272657662630081\n",
      "   +1.8809 if cp<=-0.007005532272160053 & cv<=0.1447057515382767 & cv>=-0.023631685972213743 & pa>=0.05473344698548318\n",
      "Run episode 290 with rewards 115.0\n",
      "============ 291 ===========\n",
      "88 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1]\n",
      "   +3.2739 if pav<=0.2056886851787567\n",
      "   -6.8049 if pav>=0.105914668738842\n",
      "   -0.9595 if pav>=0.23533811569213875\n",
      "   -1.7391 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.1883 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   -0.0001 if cp>=0.13051024079322815\n",
      "   +0.2406 if pav<=0.24758950173854832\n",
      "   +3.6835 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -2.4464 if cp>=0.03198039643466477 & cv>=0.37345741391181947\n",
      "   +5.8765 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +2.3520 if pa<=0.05473344698548318\n",
      "   -3.6283 if cv<=-0.056503293663263315 & pa<=-0.0020621411968022576 & pa>=-0.01230565458536148 & pav<=0.14950227439403538\n",
      "--------------\n",
      "   -0.1875 if cp<=0.040608961135149\n",
      "   +2.7327 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -1.5790 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   -0.1877 if \n",
      "   +2.2326 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.3408 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   +0.0001 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "   +0.0000 if cp>=0.15692393481731415\n",
      "   -3.6910 if pa<=0.17110725343227387\n",
      "   -2.7738 if cp<=0.07832173407077793 & cp>=-0.04069655835628509 & cv>=0.21187072694301606 & pav>=0.06272657662630081\n",
      "   +2.7537 if cp<=-0.007005532272160053 & cv<=0.1447057515382767 & cv>=-0.023631685972213743 & pa>=0.05473344698548318\n",
      "   +1.9679 if cp>=-0.19503398835659028\n",
      "Run episode 291 with rewards 88.0\n",
      "============ 292 ===========\n",
      "48 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +3.5248 if pav<=0.2056886851787567\n",
      "   -1.8109 if pav>=0.105914668738842\n",
      "   -3.2473 if pav>=0.23533811569213875\n",
      "   -0.3808 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -0.2513 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   -2.2587 if pav<=0.24758950173854832\n",
      "   +2.2015 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -0.5366 if cp>=0.03198039643466477 & cv>=0.37345741391181947\n",
      "   +2.4955 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +1.1511 if pa<=0.05473344698548318\n",
      "   +0.0506 if cv<=-0.056503293663263315 & pa<=-0.0020621411968022576 & pa>=-0.01230565458536148 & pav<=0.14950227439403538\n",
      "   -3.6528 if cp>=-0.045756562054157235 & cv<=-0.04450382739305495 & pav<=0.19287386238574986\n",
      "--------------\n",
      "   +2.1813 if cp<=0.040608961135149\n",
      "   -0.5166 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -0.4798 if cp<=0.15526567697525026 & pa<=0.15440531373023986\n",
      "   -2.0678 if \n",
      "   +0.8854 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.2060 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   +2.3148 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "   -4.4806 if pa<=0.17110725343227387\n",
      "   -2.2184 if cp<=0.07832173407077793 & cp>=-0.04069655835628509 & cv>=0.21187072694301606 & pav>=0.06272657662630081\n",
      "   +2.9646 if cp<=-0.007005532272160053 & cv<=0.1447057515382767 & cv>=-0.023631685972213743 & pa>=0.05473344698548318\n",
      "   +4.6439 if cp>=-0.19503398835659028\n",
      "   +3.6671 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "Run episode 292 with rewards 48.0\n",
      "============ 293 ===========\n",
      "58 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1]\n",
      "   +1.2504 if pav<=0.2056886851787567\n",
      "   -1.2815 if pav>=0.105914668738842\n",
      "   -2.8632 if pav>=0.23533811569213875\n",
      "   -3.1223 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -2.5601 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   +1.5745 if pav<=0.24758950173854832\n",
      "   -0.0072 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   +0.3973 if cp>=0.03198039643466477 & cv>=0.37345741391181947\n",
      "   +2.1962 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +0.0655 if pa<=0.05473344698548318\n",
      "   +0.0000 if cp>=-0.045756562054157235 & cv<=-0.04450382739305495 & pav<=0.19287386238574986\n",
      "   +3.8920 if pav<=0.12216950207948685\n",
      "--------------\n",
      "   +5.8800 if cp<=0.040608961135149\n",
      "   +1.6729 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -0.7731 if \n",
      "   +1.5219 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.0379 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -0.4626 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "   -0.8859 if pa<=0.17110725343227387\n",
      "   +0.0000 if cp<=0.07832173407077793 & cp>=-0.04069655835628509 & cv>=0.21187072694301606 & pav>=0.06272657662630081\n",
      "   +0.0000 if cp<=-0.007005532272160053 & cv<=0.1447057515382767 & cv>=-0.023631685972213743 & pa>=0.05473344698548318\n",
      "   -0.7731 if cp>=-0.19503398835659028\n",
      "   +5.7342 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   -4.4516 if pav<=0.12216950207948685\n",
      "Run episode 293 with rewards 58.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 294 ===========\n",
      "51 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +2.0069 if pav<=0.2056886851787567\n",
      "   -3.2235 if pav>=0.105914668738842\n",
      "   -2.5851 if pav>=0.23533811569213875\n",
      "   -2.0683 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -1.2855 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   +1.2559 if pav<=0.24758950173854832\n",
      "   +1.8936 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   +0.1460 if cp>=0.03198039643466477 & cv>=0.37345741391181947\n",
      "   +1.8663 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +0.5354 if pa<=0.05473344698548318\n",
      "   +1.6929 if pav<=0.12216950207948685\n",
      "   +3.2333 if cv>=0.5134695291519167 & pav<=0.34157841801643374 & pav>=0.22666777968406687\n",
      "--------------\n",
      "   +0.2595 if cp<=0.040608961135149\n",
      "   +2.4874 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +0.4509 if \n",
      "   +2.5556 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.2563 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   +0.0202 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "   -1.8850 if pa<=0.17110725343227387\n",
      "   +0.0000 if cp<=-0.007005532272160053 & cv<=0.1447057515382767 & cv>=-0.023631685972213743 & pa>=0.05473344698548318\n",
      "   +0.4509 if cp>=-0.19503398835659028\n",
      "   +4.9173 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   -2.3390 if pav<=0.12216950207948685\n",
      "   -2.3891 if cp>=0.18069123029708864\n",
      "Run episode 294 with rewards 51.0\n",
      "============ 295 ===========\n",
      "45 actions [0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1]\n",
      "   +1.4894 if pav<=0.2056886851787567\n",
      "   -2.6720 if pav>=0.105914668738842\n",
      "   -0.8456 if pav>=0.23533811569213875\n",
      "   -0.3678 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -0.8747 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   -0.9102 if pav<=0.24758950173854832\n",
      "   +2.5223 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -2.5955 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +0.1508 if pa<=0.05473344698548318\n",
      "   +0.8754 if pav<=0.12216950207948685\n",
      "   +1.9941 if cv>=0.5134695291519167 & pav<=0.34157841801643374 & pav>=0.22666777968406687\n",
      "   +0.6411 if \n",
      "--------------\n",
      "   +1.7173 if cp<=0.040608961135149\n",
      "   +2.7005 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +0.6418 if \n",
      "   +2.4181 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.7602 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   +5.0783 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "   -5.1965 if pa<=0.17110725343227387\n",
      "   +0.6418 if cp>=-0.19503398835659028\n",
      "   +0.7740 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   +0.0397 if pav<=0.12216950207948685\n",
      "   -0.3134 if cp>=0.18069123029708864\n",
      "   -0.6108 if cp<=0.11481974273920059 & pav<=0.08366405963897705\n",
      "Run episode 295 with rewards 45.0\n",
      "============ 296 ===========\n",
      "70 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0]\n",
      "   +0.3272 if pav<=0.2056886851787567\n",
      "   -2.7064 if pav>=0.105914668738842\n",
      "   +0.0204 if pav>=0.23533811569213875\n",
      "   -1.4089 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.3019 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   +0.0765 if pav<=0.24758950173854832\n",
      "   +1.6080 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -2.4464 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +2.1074 if pav<=0.12216950207948685\n",
      "   -1.1526 if cv>=0.5134695291519167 & pav<=0.34157841801643374 & pav>=0.22666777968406687\n",
      "   +0.2020 if \n",
      "   -2.0144 if cp<=0.1334604382514954 & pav>=0.24849416315555584\n",
      "--------------\n",
      "   -0.3305 if cp<=0.040608961135149\n",
      "   +1.3820 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -0.4750 if \n",
      "   +3.4192 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.5616 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   +0.0078 if cp<=0.10656930357217793 & cp>=0.03597051128745081 & pav<=0.2522799372673036 & pav>=0.12129032313823705\n",
      "   -0.1461 if pa<=0.17110725343227387\n",
      "   -0.4750 if cp>=-0.19503398835659028\n",
      "   +0.2584 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   -3.0667 if cp>=0.18069123029708864\n",
      "   -0.4115 if cp<=0.11481974273920059 & pav<=0.08366405963897705\n",
      "   -2.0092 if pav<=0.11052447855472566\n",
      "Run episode 296 with rewards 70.0\n",
      "============ 297 ===========\n",
      "70 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0]\n",
      "   +0.7102 if pav<=0.2056886851787567\n",
      "   -3.5889 if pav>=0.105914668738842\n",
      "   -1.9605 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.2287 if cp<=0.0742868110537529 & pav>=0.005486564245074987\n",
      "   +0.6325 if pav<=0.24758950173854832\n",
      "   +2.1500 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -1.2719 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +2.1381 if pav<=0.12216950207948685\n",
      "   -0.5122 if cv>=0.5134695291519167 & pav<=0.34157841801643374 & pav>=0.22666777968406687\n",
      "   -1.4364 if \n",
      "   -0.3368 if cp<=0.1334604382514954 & pav>=0.24849416315555584\n",
      "   +2.2936 if cv>=0.5466508269309998 & pav>=0.32061181068420413\n",
      "--------------\n",
      "   +0.7928 if cp<=0.040608961135149\n",
      "   +1.8528 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +0.4841 if \n",
      "   +1.9218 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +0.2043 if cp>=0.004493808373808861 & cv>=0.21057194471359253 & pav>=0.18589775264263153\n",
      "   -2.3357 if pa<=0.17110725343227387\n",
      "   +0.4841 if cp>=-0.19503398835659028\n",
      "   +0.8001 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   -0.4045 if cp>=0.18069123029708864\n",
      "   -1.2539 if cp<=0.11481974273920059 & pav<=0.08366405963897705\n",
      "   -1.9681 if pav<=0.11052447855472566\n",
      "   -2.7564 if cv>=0.5466508269309998 & pav>=0.32061181068420413\n",
      "Run episode 297 with rewards 70.0\n",
      "============ 298 ===========\n",
      "73 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +0.8718 if pav<=0.2056886851787567\n",
      "   -4.0463 if pav>=0.105914668738842\n",
      "   -1.2727 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.7163 if pav<=0.24758950173854832\n",
      "   +1.1584 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -0.1746 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +2.4478 if pav<=0.12216950207948685\n",
      "   -0.1860 if cv>=0.5134695291519167 & pav<=0.34157841801643374 & pav>=0.22666777968406687\n",
      "   -0.7212 if \n",
      "   -0.5229 if cp<=0.1334604382514954 & pav>=0.24849416315555584\n",
      "   -0.4201 if cv>=0.5466508269309998 & pav>=0.32061181068420413\n",
      "   -0.0936 if cp>=0.3797151446342468\n",
      "--------------\n",
      "   +0.6568 if cp<=0.040608961135149\n",
      "   +1.5943 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -0.4231 if \n",
      "   +1.4997 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.3236 if pa<=0.17110725343227387\n",
      "   -0.4231 if cp>=-0.19503398835659028\n",
      "   -0.6225 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   -0.0995 if cp>=0.18069123029708864\n",
      "   -0.8221 if cp<=0.11481974273920059 & pav<=0.08366405963897705\n",
      "   -3.0482 if pav<=0.11052447855472566\n",
      "   +0.5165 if cv>=0.5466508269309998 & pav>=0.32061181068420413\n",
      "   -0.8463 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "Run episode 298 with rewards 73.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 299 ===========\n",
      "83 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +0.5677 if pav<=0.2056886851787567\n",
      "   -4.8116 if pav>=0.105914668738842\n",
      "   -1.1973 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.5074 if pav<=0.24758950173854832\n",
      "   +2.1078 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -0.6589 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +0.8828 if pav<=0.12216950207948685\n",
      "   -0.1924 if cv>=0.5134695291519167 & pav<=0.34157841801643374 & pav>=0.22666777968406687\n",
      "   -0.4767 if \n",
      "   -0.5101 if cp<=0.1334604382514954 & pav>=0.24849416315555584\n",
      "   -0.1091 if cv>=0.5466508269309998 & pav>=0.32061181068420413\n",
      "   -2.3077 if cp>=0.04248891696333886 & pav<=0.214916741847992 & pav>=0.07739706933498383\n",
      "--------------\n",
      "   -0.9530 if cp<=0.040608961135149\n",
      "   +1.7361 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -0.1029 if \n",
      "   +1.7514 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +0.2071 if pa<=0.17110725343227387\n",
      "   -0.1029 if cp>=-0.19503398835659028\n",
      "   +1.1425 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   -1.2607 if cp<=0.11481974273920059 & pav<=0.08366405963897705\n",
      "   -2.0124 if pav<=0.11052447855472566\n",
      "   +0.0126 if cv>=0.5466508269309998 & pav>=0.32061181068420413\n",
      "   -0.4619 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +1.6812 if cv>=0.35875887870788575 & pav>=0.07739706933498383\n",
      "Run episode 299 with rewards 83.0\n",
      "============ 300 ===========\n",
      "103 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +0.4831 if pav<=0.2056886851787567\n",
      "   -3.0965 if pav>=0.105914668738842\n",
      "   -2.6925 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -0.0978 if pav<=0.24758950173854832\n",
      "   +0.5050 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   +3.1825 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +0.7063 if pav<=0.12216950207948685\n",
      "   -0.6238 if cv>=0.5134695291519167 & pav<=0.34157841801643374 & pav>=0.22666777968406687\n",
      "   -1.3507 if \n",
      "   -0.7246 if cp<=0.1334604382514954 & pav>=0.24849416315555584\n",
      "   -3.7791 if cp>=0.04248891696333886 & pav<=0.214916741847992 & pav>=0.07739706933498383\n",
      "   +4.0634 if pav<=0.05245797932147981\n",
      "--------------\n",
      "   -6.2726 if cp<=0.040608961135149\n",
      "   +3.1592 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -0.1911 if \n",
      "   +3.1592 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +1.9125 if pa<=0.17110725343227387\n",
      "   -0.1911 if cp>=-0.19503398835659028\n",
      "   +1.6258 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   +4.2079 if cp<=0.11481974273920059 & pav<=0.08366405963897705\n",
      "   -1.8792 if pav<=0.11052447855472566\n",
      "   -1.9197 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +2.8048 if cv>=0.35875887870788575 & pav>=0.07739706933498383\n",
      "   -4.4597 if cp<=0.1072035163640977 & cv>=0.5281909823417664\n",
      "Run episode 300 with rewards 103.0\n",
      "============ 301 ===========\n",
      "80 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +0.5413 if pav<=0.2056886851787567\n",
      "   -3.1215 if pav>=0.105914668738842\n",
      "   -2.2486 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +1.4202 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   +0.7509 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +2.1571 if pav<=0.12216950207948685\n",
      "   -0.0317 if cv>=0.5134695291519167 & pav<=0.34157841801643374 & pav>=0.22666777968406687\n",
      "   -0.9643 if \n",
      "   -0.6995 if cp<=0.1334604382514954 & pav>=0.24849416315555584\n",
      "  -10.1702 if cp>=0.04248891696333886 & pav<=0.214916741847992 & pav>=0.07739706933498383\n",
      "   +0.8545 if pav<=0.05245797932147981\n",
      "   +3.8432 if cv<=0.37169750332832335 & pa<=0.05156339704990387 & pav<=0.15485731363296518\n",
      "--------------\n",
      "   -4.8209 if cp<=0.040608961135149\n",
      "   +2.4943 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +2.6441 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +0.7400 if pa<=0.17110725343227387\n",
      "   +0.5599 if cp>=-0.19503398835659028\n",
      "   +0.3234 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   +0.1513 if cp<=0.11481974273920059 & pav<=0.08366405963897705\n",
      "   -2.2099 if pav<=0.11052447855472566\n",
      "   -5.5244 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +2.2563 if cv>=0.35875887870788575 & pav>=0.07739706933498383\n",
      "   -3.8208 if cp<=0.1072035163640977 & cv>=0.5281909823417664\n",
      "   +5.0332 if pa<=0.07249398231506347 & pa>=0.05156339704990387 & pav<=0.038875851780176204\n",
      "Run episode 301 with rewards 80.0\n",
      "============ 302 ===========\n",
      "82 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +0.6728 if pav<=0.2056886851787567\n",
      "   -2.5601 if pav>=0.105914668738842\n",
      "   -1.7159 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +1.0597 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -1.1795 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +1.3833 if pav<=0.12216950207948685\n",
      "   -1.1592 if \n",
      "   -1.6884 if cp<=0.1334604382514954 & pav>=0.24849416315555584\n",
      "   -1.2919 if cp>=0.04248891696333886 & pav<=0.214916741847992 & pav>=0.07739706933498383\n",
      "   +1.7574 if pav<=0.05245797932147981\n",
      "   +0.2260 if cv<=0.37169750332832335 & pa<=0.05156339704990387 & pav<=0.15485731363296518\n",
      "   +1.8241 if cv>=0.16368211507797242 & pav<=0.06873603016138077\n",
      "--------------\n",
      "   -0.3241 if cp<=0.040608961135149\n",
      "   +1.6652 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.6651 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +0.0746 if pa<=0.17110725343227387\n",
      "   -0.4330 if cp>=-0.19503398835659028\n",
      "   -0.0855 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   -3.0010 if pav<=0.11052447855472566\n",
      "   -0.7090 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +1.0664 if cv>=0.35875887870788575 & pav>=0.07739706933498383\n",
      "   -0.3137 if cp<=0.1072035163640977 & cv>=0.5281909823417664\n",
      "   -0.2002 if pa<=0.07249398231506347 & pa>=0.05156339704990387 & pav<=0.038875851780176204\n",
      "   -0.5696 if pa>=0.033329312503337864 & pav>=-0.0030541154323145674\n",
      "Run episode 302 with rewards 82.0\n",
      "============ 303 ===========\n",
      "67 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +0.4954 if pav<=0.2056886851787567\n",
      "   -5.1273 if pav>=0.105914668738842\n",
      "   -2.1401 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -0.3034 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   +1.4850 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +1.0443 if pav<=0.12216950207948685\n",
      "   -0.1686 if \n",
      "   -0.4603 if cp<=0.1334604382514954 & pav>=0.24849416315555584\n",
      "   +1.5158 if cp>=0.04248891696333886 & pav<=0.214916741847992 & pav>=0.07739706933498383\n",
      "   +2.2033 if pav<=0.05245797932147981\n",
      "   +1.2704 if cv>=0.16368211507797242 & pav<=0.06873603016138077\n",
      "   -2.8491 if cv>=0.2070227563381195 & pav<=0.3095852375030518 & pav>=0.058449974656105026\n",
      "--------------\n",
      "   +0.0195 if cp<=0.040608961135149\n",
      "   +1.5941 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.5403 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.2912 if cp>=-0.19503398835659028\n",
      "   -0.2871 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   -2.7759 if pav<=0.11052447855472566\n",
      "   -0.6242 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   -5.2380 if cv>=0.35875887870788575 & pav>=0.07739706933498383\n",
      "   -3.4857 if cp<=0.1072035163640977 & cv>=0.5281909823417664\n",
      "   -0.1162 if pa<=0.07249398231506347 & pa>=0.05156339704990387 & pav<=0.038875851780176204\n",
      "   +0.8807 if pa>=0.033329312503337864 & pav>=-0.0030541154323145674\n",
      "   +4.8317 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "Run episode 303 with rewards 67.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 304 ===========\n",
      "99 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +1.6408 if pav<=0.2056886851787567\n",
      "   -3.9355 if pav>=0.105914668738842\n",
      "   -1.0312 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -1.2196 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -0.1839 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +2.4210 if pav<=0.12216950207948685\n",
      "   -0.2087 if cp<=0.1334604382514954 & pav>=0.24849416315555584\n",
      "   +0.2272 if cp>=0.04248891696333886 & pav<=0.214916741847992 & pav>=0.07739706933498383\n",
      "   +1.5647 if pav<=0.05245797932147981\n",
      "   +0.9758 if cv>=0.16368211507797242 & pav<=0.06873603016138077\n",
      "   -2.9790 if cv>=0.2070227563381195 & pav<=0.3095852375030518 & pav>=0.058449974656105026\n",
      "   -0.1801 if \n",
      "--------------\n",
      "   +1.0664 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.2273 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.6823 if cp>=-0.19503398835659028\n",
      "   -2.0763 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   -3.0385 if pav<=0.11052447855472566\n",
      "   +0.6116 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   -2.6709 if cv>=0.35875887870788575 & pav>=0.07739706933498383\n",
      "   -0.0000 if cp<=0.1072035163640977 & cv>=0.5281909823417664\n",
      "   -0.0408 if pa<=0.07249398231506347 & pa>=0.05156339704990387 & pav<=0.038875851780176204\n",
      "   -0.4443 if pa>=0.033329312503337864 & pav>=-0.0030541154323145674\n",
      "   +5.2193 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -0.7595 if pav<=0.057992350310087246\n",
      "Run episode 304 with rewards 99.0\n",
      "============ 305 ===========\n",
      "82 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   +0.8135 if pav<=0.2056886851787567\n",
      "   -4.0644 if pav>=0.105914668738842\n",
      "   -1.1730 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +1.2553 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -1.9561 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +1.5956 if pav<=0.12216950207948685\n",
      "   -0.8528 if cp<=0.1334604382514954 & pav>=0.24849416315555584\n",
      "   +4.7712 if cp>=0.04248891696333886 & pav<=0.214916741847992 & pav>=0.07739706933498383\n",
      "   +1.4591 if pav<=0.05245797932147981\n",
      "   +0.5412 if cv>=0.16368211507797242 & pav<=0.06873603016138077\n",
      "   -3.1508 if cv>=0.2070227563381195 & pav<=0.3095852375030518 & pav>=0.058449974656105026\n",
      "   -1.4687 if \n",
      "--------------\n",
      "   +1.8357 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.8023 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.0090 if cp>=-0.19503398835659028\n",
      "   +0.2742 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   -2.3381 if pav<=0.11052447855472566\n",
      "   -0.0259 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   -1.0809 if cv>=0.35875887870788575 & pav>=0.07739706933498383\n",
      "   -0.0349 if pa<=0.07249398231506347 & pa>=0.05156339704990387 & pav<=0.038875851780176204\n",
      "   +0.0111 if pa>=0.033329312503337864 & pav>=-0.0030541154323145674\n",
      "   +2.2583 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -1.4032 if pav<=0.057992350310087246\n",
      "   +3.3382 if cp<=-0.05020776540040965 & cv>=0.3491435647010804 & pav>=0.03444869220256808\n",
      "Run episode 305 with rewards 82.0\n",
      "============ 306 ===========\n",
      "103 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +0.8312 if pav<=0.2056886851787567\n",
      "   -2.5767 if pav>=0.105914668738842\n",
      "   -1.8369 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +1.0794 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -1.8651 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +2.1028 if pav<=0.12216950207948685\n",
      "   -0.6502 if cp<=0.1334604382514954 & pav>=0.24849416315555584\n",
      "   -0.6687 if cp>=0.04248891696333886 & pav<=0.214916741847992 & pav>=0.07739706933498383\n",
      "   +1.2897 if pav<=0.05245797932147981\n",
      "   -4.4464 if cv>=0.2070227563381195 & pav<=0.3095852375030518 & pav>=0.058449974656105026\n",
      "   -0.4738 if \n",
      "   -1.6535 if cp<=0.07111379802227019 & cv>=0.38228065371513364 & pav>=0.05966149047017097\n",
      "--------------\n",
      "   +1.3176 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.3175 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.0952 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   -2.2895 if pav<=0.11052447855472566\n",
      "   +0.1547 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +1.9341 if cv>=0.35875887870788575 & pav>=0.07739706933498383\n",
      "   -0.1928 if pa<=0.07249398231506347 & pa>=0.05156339704990387 & pav<=0.038875851780176204\n",
      "   +0.1458 if pa>=0.033329312503337864 & pav>=-0.0030541154323145674\n",
      "   +5.2662 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -1.0882 if pav<=0.057992350310087246\n",
      "   -0.0000 if cp<=-0.05020776540040965 & cv>=0.3491435647010804 & pav>=0.03444869220256808\n",
      "   -0.9693 if \n",
      "Run episode 306 with rewards 103.0\n",
      "============ 307 ===========\n",
      "81 actions [0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0]\n",
      "   +0.4329 if pav<=0.2056886851787567\n",
      "   -4.5556 if pav>=0.105914668738842\n",
      "   -1.1626 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +1.6073 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -1.6623 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   +0.7918 if pav<=0.12216950207948685\n",
      "   -1.3100 if cp<=0.1334604382514954 & pav>=0.24849416315555584\n",
      "   -0.0001 if cp>=0.04248891696333886 & pav<=0.214916741847992 & pav>=0.07739706933498383\n",
      "   +1.4508 if pav<=0.05245797932147981\n",
      "   -1.6622 if cv>=0.2070227563381195 & pav<=0.3095852375030518 & pav>=0.058449974656105026\n",
      "   -0.0000 if cp<=0.07111379802227019 & cv>=0.38228065371513364 & pav>=0.05966149047017097\n",
      "   -0.0000 if cp>=0.016042666137218504 & cv>=-0.031419594585895536 & pav<=0.2813266634941101 & pav>=0.21118372678756728\n",
      "--------------\n",
      "   +2.1800 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +2.1800 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +0.6194 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   -2.3851 if pav<=0.11052447855472566\n",
      "   +0.3885 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +0.2662 if cv>=0.35875887870788575 & pav>=0.07739706933498383\n",
      "   -0.0941 if pa<=0.07249398231506347 & pa>=0.05156339704990387 & pav<=0.038875851780176204\n",
      "   -0.2719 if pa>=0.033329312503337864 & pav>=-0.0030541154323145674\n",
      "   +1.5029 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -1.4918 if pav<=0.057992350310087246\n",
      "   +0.0612 if \n",
      "   +0.6354 if cp<=0.23969206213951125 & pa>=0.15686645805835725 & pav<=0.21118372678756728\n",
      "Run episode 307 with rewards 81.0\n",
      "============ 308 ===========\n",
      "114 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   -0.2427 if pav<=0.2056886851787567\n",
      "   -2.5448 if pav>=0.105914668738842\n",
      "   -2.1793 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +2.6447 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -1.5462 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   -0.0675 if pav<=0.12216950207948685\n",
      "   -0.5728 if cp<=0.1334604382514954 & pav>=0.24849416315555584\n",
      "   -2.3495 if cp>=0.04248891696333886 & pav<=0.214916741847992 & pav>=0.07739706933498383\n",
      "   +3.1566 if pav<=0.05245797932147981\n",
      "   -1.6367 if cv>=0.2070227563381195 & pav<=0.3095852375030518 & pav>=0.058449974656105026\n",
      "   +0.0000 if cp<=0.07111379802227019 & cv>=0.38228065371513364 & pav>=0.05966149047017097\n",
      "   -1.2851 if cp<=0.5621634125709534 & cv>=0.15257661044597626 & pav<=0.1689499914646149\n",
      "--------------\n",
      "   +0.9601 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +0.9685 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +2.9662 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   -1.3868 if pav<=0.11052447855472566\n",
      "   +0.4418 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +0.0435 if cv>=0.35875887870788575 & pav>=0.07739706933498383\n",
      "   -0.2398 if pa<=0.07249398231506347 & pa>=0.05156339704990387 & pav<=0.038875851780176204\n",
      "   -0.0237 if pa>=0.033329312503337864 & pav>=-0.0030541154323145674\n",
      "   +1.0215 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -2.6782 if pav<=0.057992350310087246\n",
      "   +0.0000 if cp<=0.23969206213951125 & pa>=0.15686645805835725 & pav<=0.21118372678756728\n",
      "   +2.5209 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "Run episode 308 with rewards 114.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 309 ===========\n",
      "152 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   -1.0377 if pav<=0.2056886851787567\n",
      "   -4.5073 if pav>=0.105914668738842\n",
      "   +2.4644 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -0.5221 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -1.0793 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   -0.8293 if pav<=0.12216950207948685\n",
      "   -1.0766 if cp<=0.1334604382514954 & pav>=0.24849416315555584\n",
      "   -0.4832 if cp>=0.04248891696333886 & pav<=0.214916741847992 & pav>=0.07739706933498383\n",
      "   +1.5877 if pav<=0.05245797932147981\n",
      "   -1.9303 if cv>=0.2070227563381195 & pav<=0.3095852375030518 & pav>=0.058449974656105026\n",
      "   -7.3911 if cp<=0.5621634125709534 & cv>=0.15257661044597626 & pav<=0.1689499914646149\n",
      "  +10.1188 if pav<=0.025541749224066743\n",
      "--------------\n",
      "   +2.1502 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +2.1657 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +0.0111 if cp>=-0.045756562054157235 & pav<=0.19287386238574986 & pav>=0.09049114435911179\n",
      "   +1.6362 if pav<=0.11052447855472566\n",
      "   +0.0558 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +0.1221 if cv>=0.35875887870788575 & pav>=0.07739706933498383\n",
      "   -1.1532 if pa<=0.07249398231506347 & pa>=0.05156339704990387 & pav<=0.038875851780176204\n",
      "   +3.8624 if pa>=0.033329312503337864 & pav>=-0.0030541154323145674\n",
      "   +0.2116 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -7.4494 if pav<=0.057992350310087246\n",
      "   -6.6454 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   +6.1947 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "Run episode 309 with rewards 152.0\n",
      "============ 310 ===========\n",
      "240 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0]\n",
      "   -1.1629 if pav<=0.2056886851787567\n",
      "   -6.1175 if pav>=0.105914668738842\n",
      "   -4.5749 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -3.6204 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -0.2456 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   -1.1263 if pav<=0.12216950207948685\n",
      "   -0.2377 if cp<=0.1334604382514954 & pav>=0.24849416315555584\n",
      "   +1.2127 if pav<=0.05245797932147981\n",
      "   -0.2687 if cv>=0.2070227563381195 & pav<=0.3095852375030518 & pav>=0.058449974656105026\n",
      "   -1.7704 if cp<=0.5621634125709534 & cv>=0.15257661044597626 & pav<=0.1689499914646149\n",
      "   +8.2872 if pav<=0.025541749224066743\n",
      "   +5.6834 if cp>=-0.002966956188902256 & cv>=-0.03643708601593971 & pav>=0.0016836747876368824\n",
      "--------------\n",
      "   +1.9887 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.9898 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +1.8907 if pav<=0.11052447855472566\n",
      "   -2.8974 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +0.0174 if cv>=0.35875887870788575 & pav>=0.07739706933498383\n",
      "   -0.6105 if pa<=0.07249398231506347 & pa>=0.05156339704990387 & pav<=0.038875851780176204\n",
      "   +6.6117 if pa>=0.033329312503337864 & pav>=-0.0030541154323145674\n",
      "   +0.0201 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -6.6275 if pav<=0.057992350310087246\n",
      "   -3.2923 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   +4.8157 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   -5.2993 if cp>=-0.002966956188902256 & cv>=-0.03643708601593971 & pa<=0.06944651752710343 & pav<=0.13672460913658144 & pav>=0.0016836747876368824\n",
      "Run episode 310 with rewards 240.0\n",
      "best\n",
      "============ 311 ===========\n",
      "205 actions [0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1]\n",
      "   -3.0794 if pav<=0.2056886851787567\n",
      "   -3.3734 if pav>=0.105914668738842\n",
      "   -5.4732 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -2.7190 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -0.0329 if cp>=-0.04069655835628509 & pa>=0.10482561588287355 & pav<=0.3323177874088287 & pav>=0.06272657662630081\n",
      "   -2.9224 if pav<=0.12216950207948685\n",
      "   +7.1870 if pav<=0.05245797932147981\n",
      "   -0.0474 if cv>=0.2070227563381195 & pav<=0.3095852375030518 & pav>=0.058449974656105026\n",
      "   -1.7402 if cp<=0.5621634125709534 & cv>=0.15257661044597626 & pav<=0.1689499914646149\n",
      "   +6.8190 if pav<=0.025541749224066743\n",
      "   +6.8886 if cp>=-0.002966956188902256 & cv>=-0.03643708601593971 & pav>=0.0016836747876368824\n",
      "   -1.6571 if cp>=-0.2359948605298996 & cv<=0.006593240145593883 & pa>=-0.009066995047032832 & pa>=0.0315625011920929 & pav>=-0.007523675821721533\n",
      "--------------\n",
      "   +1.1962 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.1952 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +1.8411 if pav<=0.11052447855472566\n",
      "   -2.1221 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +0.6233 if pa<=0.07249398231506347 & pa>=0.05156339704990387 & pav<=0.038875851780176204\n",
      "   +5.2698 if pa>=0.033329312503337864 & pav>=-0.0030541154323145674\n",
      "   +0.0142 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -7.1043 if pav<=0.057992350310087246\n",
      "   +0.0138 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   +1.8795 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   +0.0002 if cp>=-0.002966956188902256 & cv>=-0.03643708601593971 & pa<=0.06944651752710343 & pav<=0.13672460913658144 & pav>=0.0016836747876368824\n",
      "   +3.1468 if cv>=-0.18547097742557525 & pa<=0.0315625011920929 & pa>=-0.009066995047032832 & pav>=-0.007523675821721533\n",
      "Run episode 311 with rewards 205.0\n",
      "============ 312 ===========\n",
      "155 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   -6.8759 if pav<=0.2056886851787567\n",
      "   -3.3049 if pav>=0.105914668738842\n",
      "   -3.6796 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -0.7358 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   -2.4574 if pav<=0.12216950207948685\n",
      "   +4.9170 if pav<=0.05245797932147981\n",
      "   -0.6460 if cv>=0.2070227563381195 & pav<=0.3095852375030518 & pav>=0.058449974656105026\n",
      "   -3.8002 if cp<=0.5621634125709534 & cv>=0.15257661044597626 & pav<=0.1689499914646149\n",
      "   +8.2179 if pav<=0.025541749224066743\n",
      "   +5.9012 if cp>=-0.002966956188902256 & cv>=-0.03643708601593971 & pav>=0.0016836747876368824\n",
      "   -0.3387 if cp>=-0.2359948605298996 & cv<=0.006593240145593883 & pa>=-0.009066995047032832 & pa>=0.0315625011920929 & pav>=-0.007523675821721533\n",
      "   +3.1305 if pav<=0.21976910829544072\n",
      "--------------\n",
      "   +0.5765 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +0.6303 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +3.0285 if pav<=0.11052447855472566\n",
      "   -0.8133 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   -0.0376 if pa<=0.07249398231506347 & pa>=0.05156339704990387 & pav<=0.038875851780176204\n",
      "   +5.3027 if pa>=0.033329312503337864 & pav>=-0.0030541154323145674\n",
      "   +0.2151 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -9.9903 if pav<=0.057992350310087246\n",
      "   -2.0227 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   +3.6577 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   +5.3404 if cv>=-0.18547097742557525 & pa<=0.0315625011920929 & pa>=-0.009066995047032832 & pav>=-0.007523675821721533\n",
      "   +2.9106 if cv<=-0.02837289944291115 & pav>=0.21976910829544072\n",
      "Run episode 312 with rewards 155.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 313 ===========\n",
      "94 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   +0.7979 if pav<=0.2056886851787567\n",
      "   -3.4618 if pav>=0.105914668738842\n",
      "   -2.6259 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.9409 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   +0.8358 if pav<=0.12216950207948685\n",
      "   +1.2165 if pav<=0.05245797932147981\n",
      "   -0.0128 if cv>=0.2070227563381195 & pav<=0.3095852375030518 & pav>=0.058449974656105026\n",
      "   -5.9567 if cp<=0.5621634125709534 & cv>=0.15257661044597626 & pav<=0.1689499914646149\n",
      "   +6.6066 if pav<=0.025541749224066743\n",
      "   +0.9722 if cp>=-0.002966956188902256 & cv>=-0.03643708601593971 & pav>=0.0016836747876368824\n",
      "   -0.9640 if pav<=0.21976910829544072\n",
      "   -3.0132 if cp>=1.0629259109497071 & pav<=0.13165188729763044 & pav>=-0.0027277451474219516\n",
      "--------------\n",
      "   +2.6399 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +2.6526 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.2874 if pav<=0.11052447855472566\n",
      "   -0.3459 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +0.9430 if pa>=0.033329312503337864 & pav>=-0.0030541154323145674\n",
      "   +2.2600 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -4.1525 if pav<=0.057992350310087246\n",
      "   -3.6123 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   +1.9422 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   +0.0000 if cv>=-0.18547097742557525 & pa<=0.0315625011920929 & pa>=-0.009066995047032832 & pav>=-0.007523675821721533\n",
      "   +0.3995 if cv<=-0.02837289944291115 & pav>=0.21976910829544072\n",
      "   +4.6881 if cp>=0.0031887820921838333 & cv>=0.0027103481348603967 & pav>=-0.0027277451474219516\n",
      "Run episode 313 with rewards 94.0\n",
      "============ 314 ===========\n",
      "105 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +1.2398 if pav<=0.2056886851787567\n",
      "   -1.1316 if pav>=0.105914668738842\n",
      "   -3.0803 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +1.8119 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   +1.8522 if pav<=0.12216950207948685\n",
      "   -1.5075 if pav<=0.05245797932147981\n",
      "   -2.3704 if cp<=0.5621634125709534 & cv>=0.15257661044597626 & pav<=0.1689499914646149\n",
      "   +3.6975 if pav<=0.025541749224066743\n",
      "   +1.0716 if cp>=-0.002966956188902256 & cv>=-0.03643708601593971 & pav>=0.0016836747876368824\n",
      "   +1.2375 if pav<=0.21976910829544072\n",
      "   +0.0233 if cp>=1.0629259109497071 & pav<=0.13165188729763044 & pav>=-0.0027277451474219516\n",
      "   -6.0851 if cp<=0.8425865888595583 & cp>=0.027989277616143227 & pav<=0.14895098209381105 & pav>=0.028040046989917806\n",
      "--------------\n",
      "   +1.5448 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.5463 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.5599 if pav<=0.11052447855472566\n",
      "   -0.0421 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +0.7044 if pa>=0.033329312503337864 & pav>=-0.0030541154323145674\n",
      "   +2.0923 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -2.7313 if pav<=0.057992350310087246\n",
      "   -0.0902 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   +2.6890 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   +0.6842 if cv<=-0.02837289944291115 & pav>=0.21976910829544072\n",
      "   +0.0202 if cp>=0.0031887820921838333 & cv>=0.0027103481348603967 & pav>=-0.0027277451474219516\n",
      "   -0.9252 if cv<=0.20317110121250154 & pav>=0.028040046989917806\n",
      "Run episode 314 with rewards 105.0\n",
      "============ 315 ===========\n",
      "105 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   +0.8117 if pav<=0.2056886851787567\n",
      "   -3.2908 if pav>=0.105914668738842\n",
      "   -2.7000 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.5333 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   +1.2567 if pav<=0.12216950207948685\n",
      "   +0.8068 if pav<=0.05245797932147981\n",
      "   -1.1720 if cp<=0.5621634125709534 & cv>=0.15257661044597626 & pav<=0.1689499914646149\n",
      "   +1.5485 if pav<=0.025541749224066743\n",
      "   +0.0796 if cp>=-0.002966956188902256 & cv>=-0.03643708601593971 & pav>=0.0016836747876368824\n",
      "   +0.8061 if pav<=0.21976910829544072\n",
      "   -6.0171 if cp<=0.8425865888595583 & cp>=0.027989277616143227 & pav<=0.14895098209381105 & pav>=0.028040046989917806\n",
      "   -0.1419 if pav<=0.0339961975812912\n",
      "--------------\n",
      "   +2.5307 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +2.5311 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.8260 if pav<=0.11052447855472566\n",
      "   -0.4818 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +0.9651 if pa>=0.033329312503337864 & pav>=-0.0030541154323145674\n",
      "   +2.0854 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -2.4619 if pav<=0.057992350310087246\n",
      "   +2.9687 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   +2.4539 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   +0.9732 if cv<=-0.02837289944291115 & pav>=0.21976910829544072\n",
      "   -0.3964 if cv<=0.20317110121250154 & pav>=0.028040046989917806\n",
      "   +0.0357 if pa>=0.08001907318830491 & pav>=0.0339961975812912\n",
      "Run episode 315 with rewards 105.0\n",
      "============ 316 ===========\n",
      "85 actions [0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +0.1637 if pav<=0.2056886851787567\n",
      "   -2.0762 if pav>=0.105914668738842\n",
      "   -2.5960 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -0.1076 if pa<=0.17110725343227387 & pav<=0.09408825337886813\n",
      "   +1.6492 if pav<=0.12216950207948685\n",
      "   +1.0263 if pav<=0.05245797932147981\n",
      "   -1.1841 if cp<=0.5621634125709534 & cv>=0.15257661044597626 & pav<=0.1689499914646149\n",
      "   +2.0647 if pav<=0.025541749224066743\n",
      "   +0.1565 if pav<=0.21976910829544072\n",
      "   -1.6127 if cp<=0.8425865888595583 & cp>=0.027989277616143227 & pav<=0.14895098209381105 & pav>=0.028040046989917806\n",
      "   +2.0647 if pav<=0.0339961975812912\n",
      "   +2.4606 if pa<=0.06488432586193085 & pav<=0.15168161094188692 & pav>=0.03007043376564981\n",
      "--------------\n",
      "   +1.8666 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.8665 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.9830 if pav<=0.11052447855472566\n",
      "   +0.3199 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +0.3099 if pa>=0.033329312503337864 & pav>=-0.0030541154323145674\n",
      "   +3.4200 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -1.9932 if pav<=0.057992350310087246\n",
      "   +1.3656 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   +1.3656 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   +0.6422 if cv<=-0.02837289944291115 & pav>=0.21976910829544072\n",
      "   -1.6644 if cv<=0.20317110121250154 & pav>=0.028040046989917806\n",
      "   +1.7151 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "Run episode 316 with rewards 85.0\n",
      "============ 317 ===========\n",
      "104 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +0.5877 if pav<=0.2056886851787567\n",
      "   -2.7256 if pav>=0.105914668738842\n",
      "   -0.7753 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +2.3007 if pav<=0.12216950207948685\n",
      "   -1.2678 if pav<=0.05245797932147981\n",
      "   +0.0122 if cp<=0.5621634125709534 & cv>=0.15257661044597626 & pav<=0.1689499914646149\n",
      "   +1.0791 if pav<=0.025541749224066743\n",
      "   +0.3309 if pav<=0.21976910829544072\n",
      "   -4.8591 if cp<=0.8425865888595583 & cp>=0.027989277616143227 & pav<=0.14895098209381105 & pav>=0.028040046989917806\n",
      "   +2.8443 if pav<=0.0339961975812912\n",
      "   +0.7252 if pa<=0.06488432586193085 & pav<=0.15168161094188692 & pav>=0.03007043376564981\n",
      "   -1.6083 if pav<=0.04590139463543893\n",
      "--------------\n",
      "   +3.0953 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +3.0969 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.4488 if pav<=0.11052447855472566\n",
      "   +2.8010 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +1.9464 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -0.5102 if pav<=0.057992350310087246\n",
      "   +1.9467 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   +2.4098 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   +0.3235 if cv<=-0.02837289944291115 & pav>=0.21976910829544072\n",
      "   -0.5886 if cv<=0.20317110121250154 & pav>=0.028040046989917806\n",
      "   -0.5886 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -2.0660 if cv>=0.20003361999988556\n",
      "Run episode 317 with rewards 104.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 318 ===========\n",
      "108 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   +0.1595 if pav<=0.2056886851787567\n",
      "   -3.5252 if pav>=0.105914668738842\n",
      "   -1.9431 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.4656 if pav<=0.12216950207948685\n",
      "   +1.8652 if pav<=0.05245797932147981\n",
      "   +2.1348 if pav<=0.025541749224066743\n",
      "   +0.1595 if pav<=0.21976910829544072\n",
      "   -2.7047 if cp<=0.8425865888595583 & cp>=0.027989277616143227 & pav<=0.14895098209381105 & pav>=0.028040046989917806\n",
      "   -1.9364 if pav<=0.0339961975812912\n",
      "   +1.1100 if pa<=0.06488432586193085 & pav<=0.15168161094188692 & pav>=0.03007043376564981\n",
      "   +1.8810 if pav<=0.04590139463543893\n",
      "   +2.9572 if cp<=0.12204652428627018 & cp>=0.03833851218223572 & pav<=0.1577287018299105 & pav>=-0.07046299427747725\n",
      "--------------\n",
      "   +4.7901 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +4.7916 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.0605 if pav<=0.11052447855472566\n",
      "   +1.4734 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +1.8131 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -3.6738 if pav<=0.057992350310087246\n",
      "   +1.8233 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   +2.3339 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   -1.9487 if cv<=0.20317110121250154 & pav>=0.028040046989917806\n",
      "   -1.5487 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   +1.6963 if cv>=0.20003361999988556\n",
      "   -1.8385 if cv>=0.10210001766681695\n",
      "Run episode 318 with rewards 108.0\n",
      "============ 319 ===========\n",
      "96 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1]\n",
      "   -0.0763 if pav<=0.2056886851787567\n",
      "   -1.8207 if pav>=0.105914668738842\n",
      "   -1.3423 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.2287 if pav<=0.12216950207948685\n",
      "   +1.8658 if pav<=0.05245797932147981\n",
      "   +0.3724 if pav<=0.025541749224066743\n",
      "   +0.5761 if cp<=0.8425865888595583 & cp>=0.027989277616143227 & pav<=0.14895098209381105 & pav>=0.028040046989917806\n",
      "   +0.5647 if pav<=0.0339961975812912\n",
      "   +0.6244 if pa<=0.06488432586193085 & pav<=0.15168161094188692 & pav>=0.03007043376564981\n",
      "   +1.8658 if pav<=0.04590139463543893\n",
      "   +0.1977 if cp<=0.12204652428627018 & cp>=0.03833851218223572 & pav<=0.1577287018299105 & pav>=-0.07046299427747725\n",
      "   -2.2559 if cp<=0.08578387796878818 & cp>=-0.010901509039103967 & cp>=-0.041150331497192376 & pav<=0.18613080084323883 & pav>=0.03645755499601367\n",
      "--------------\n",
      "   +3.2085 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +3.2056 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.5464 if cp>=0.13922219276428224 & pav<=0.07770640254020693 & pav>=-0.02710523456335067\n",
      "   +3.7467 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -2.6159 if pav<=0.057992350310087246\n",
      "   +0.8638 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   -0.5686 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   -1.0388 if cv<=0.20317110121250154 & pav>=0.028040046989917806\n",
      "   -1.1212 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   +1.6449 if cv>=0.20003361999988556\n",
      "   -1.4146 if cv>=0.10210001766681695\n",
      "   -1.3292 if cv>=-0.016934332624077793\n",
      "Run episode 319 with rewards 96.0\n",
      "============ 320 ===========\n",
      "121 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -3.5870 if pav>=0.105914668738842\n",
      "   -3.2995 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.5827 if pav<=0.12216950207948685\n",
      "   +2.6466 if pav<=0.05245797932147981\n",
      "   +0.7892 if pav<=0.025541749224066743\n",
      "   -0.4128 if cp<=0.8425865888595583 & cp>=0.027989277616143227 & pav<=0.14895098209381105 & pav>=0.028040046989917806\n",
      "   +0.9156 if pav<=0.0339961975812912\n",
      "   +1.0307 if pa<=0.06488432586193085 & pav<=0.15168161094188692 & pav>=0.03007043376564981\n",
      "   +1.2911 if pav<=0.04590139463543893\n",
      "   -0.0668 if cp<=0.12204652428627018 & cp>=0.03833851218223572 & pav<=0.1577287018299105 & pav>=-0.07046299427747725\n",
      "   -0.3035 if cp<=0.08578387796878818 & cp>=-0.010901509039103967 & cp>=-0.041150331497192376 & pav<=0.18613080084323883 & pav>=0.03645755499601367\n",
      "   -2.5276 if cv>=0.0467057041823864 & cv>=1.314409852027893 & pav<=0.2750905752182007 & pav>=0.16334104537963887\n",
      "--------------\n",
      "   +3.3064 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +3.3062 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +4.0752 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -3.4470 if pav<=0.057992350310087246\n",
      "   +2.5948 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   +1.6279 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   -0.3165 if cv<=0.20317110121250154 & pav>=0.028040046989917806\n",
      "   -0.4274 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   +0.6837 if cv>=0.20003361999988556\n",
      "   +0.6837 if cv>=0.10210001766681695\n",
      "   -1.4803 if cv>=-0.016934332624077793\n",
      "   -0.8718 if pa<=0.06203033775091171\n",
      "Run episode 320 with rewards 121.0\n",
      "============ 321 ===========\n",
      "131 actions [0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0]\n",
      "   -2.3365 if pav>=0.105914668738842\n",
      "   -3.8650 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -0.7313 if pav<=0.12216950207948685\n",
      "   +4.3376 if pav<=0.05245797932147981\n",
      "   +1.0449 if pav<=0.025541749224066743\n",
      "   -3.0752 if cp<=0.8425865888595583 & cp>=0.027989277616143227 & pav<=0.14895098209381105 & pav>=0.028040046989917806\n",
      "   +1.8550 if pav<=0.0339961975812912\n",
      "   +2.6135 if pa<=0.06488432586193085 & pav<=0.15168161094188692 & pav>=0.03007043376564981\n",
      "   -1.2105 if pav<=0.04590139463543893\n",
      "   -0.0014 if cp<=0.08578387796878818 & cp>=-0.010901509039103967 & cp>=-0.041150331497192376 & pav<=0.18613080084323883 & pav>=0.03645755499601367\n",
      "   -0.0002 if cv>=0.0467057041823864 & cv>=1.314409852027893 & pav<=0.2750905752182007 & pav>=0.16334104537963887\n",
      "   +5.5580 if cp<=0.6569451093673706 & cp>=0.155197858810425 & pav<=0.17996464669704437 & pav>=0.03311513736844063\n",
      "--------------\n",
      "   +2.3819 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +2.3819 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +1.4244 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -3.3931 if pav<=0.057992350310087246\n",
      "   +0.5662 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   +6.2721 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   +0.6562 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -0.0855 if cv>=0.20003361999988556\n",
      "   +2.1918 if cv>=0.10210001766681695\n",
      "   -1.8730 if cv>=-0.016934332624077793\n",
      "   -1.7021 if pa<=0.06203033775091171\n",
      "   -5.2125 if cp>=0.155197858810425 & pav>=0.03311513736844063\n",
      "Run episode 321 with rewards 131.0\n",
      "============ 322 ===========\n",
      "104 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1]\n",
      "   -3.5513 if pav>=0.105914668738842\n",
      "   -1.5531 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -2.4235 if pav<=0.12216950207948685\n",
      "   -0.8563 if pav<=0.05245797932147981\n",
      "   +3.1108 if pav<=0.025541749224066743\n",
      "   -1.2998 if cp<=0.8425865888595583 & cp>=0.027989277616143227 & pav<=0.14895098209381105 & pav>=0.028040046989917806\n",
      "   +2.5250 if pav<=0.0339961975812912\n",
      "   +0.2071 if pa<=0.06488432586193085 & pav<=0.15168161094188692 & pav>=0.03007043376564981\n",
      "   +1.0515 if pav<=0.04590139463543893\n",
      "   -1.0844 if cp<=0.08578387796878818 & cp>=-0.010901509039103967 & cp>=-0.041150331497192376 & pav<=0.18613080084323883 & pav>=0.03645755499601367\n",
      "   -0.8625 if cp<=0.6569451093673706 & cp>=0.155197858810425 & pav<=0.17996464669704437 & pav>=0.03311513736844063\n",
      "   -9.5034 if pav<=-0.10898322612047195 & pav>=-0.10898322612047195\n",
      "--------------\n",
      "   +1.6195 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.6201 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +0.0079 if cv>=0.2070227563381195 & pav>=0.058449974656105026\n",
      "   -6.5834 if pav<=0.057992350310087246\n",
      "   +2.3875 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   +5.3865 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   +0.8487 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   +2.4188 if cv>=0.10210001766681695\n",
      "   +1.4701 if cv>=-0.016934332624077793\n",
      "   -0.1522 if pa<=0.06203033775091171\n",
      "   -2.0656 if cp>=0.155197858810425 & pav>=0.03311513736844063\n",
      "  +10.7920 if pav<=-0.10898322612047195 & pav>=-0.10898322612047195\n",
      "Run episode 322 with rewards 104.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 323 ===========\n",
      "33 actions [0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0]\n",
      "   +2.4648 if pav>=0.105914668738842\n",
      "   -3.6809 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.1808 if pav<=0.12216950207948685\n",
      "   +0.5176 if pav<=0.05245797932147981\n",
      "   +3.2941 if pav<=0.025541749224066743\n",
      "   -1.4200 if cp<=0.8425865888595583 & cp>=0.027989277616143227 & pav<=0.14895098209381105 & pav>=0.028040046989917806\n",
      "   +1.8801 if pav<=0.0339961975812912\n",
      "   +0.5176 if pav<=0.04590139463543893\n",
      "   +0.0699 if cp<=0.08578387796878818 & cp>=-0.010901509039103967 & cp>=-0.041150331497192376 & pav<=0.18613080084323883 & pav>=0.03645755499601367\n",
      "   -0.0055 if cp<=0.6569451093673706 & cp>=0.155197858810425 & pav<=0.17996464669704437 & pav>=0.03311513736844063\n",
      "   -0.0000 if pav<=-0.10898322612047195 & pav>=-0.10898322612047195\n",
      "   -2.7659 if pav>=0.6552863717079163\n",
      "--------------\n",
      "   +0.5486 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +0.5614 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -3.3007 if pav<=0.057992350310087246\n",
      "   +0.1117 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   +4.7773 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   +0.7714 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   +0.4283 if cv>=0.10210001766681695\n",
      "   -0.8781 if cv>=-0.016934332624077793\n",
      "   -3.9884 if pa<=0.06203033775091171\n",
      "   +0.3614 if cp>=0.155197858810425 & pav>=0.03311513736844063\n",
      "   -0.0000 if pav<=-0.10898322612047195 & pav>=-0.10898322612047195\n",
      "   +2.7859 if pav>=0.6552863717079163\n",
      "Run episode 323 with rewards 33.0\n",
      "============ 324 ===========\n",
      "37 actions [0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1]\n",
      "   +1.4393 if pav>=0.105914668738842\n",
      "   -2.6854 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +1.9767 if pav<=0.12216950207948685\n",
      "   +0.7276 if pav<=0.05245797932147981\n",
      "   +0.0929 if pav<=0.025541749224066743\n",
      "   +0.0000 if cp<=0.8425865888595583 & cp>=0.027989277616143227 & pav<=0.14895098209381105 & pav>=0.028040046989917806\n",
      "   +0.2026 if pav<=0.0339961975812912\n",
      "   +0.7276 if pav<=0.04590139463543893\n",
      "   +1.9525 if cp<=0.08578387796878818 & cp>=-0.010901509039103967 & cp>=-0.041150331497192376 & pav<=0.18613080084323883 & pav>=0.03645755499601367\n",
      "   +0.0000 if cp<=0.6569451093673706 & cp>=0.155197858810425 & pav<=0.17996464669704437 & pav>=0.03311513736844063\n",
      "   -0.8916 if pav>=0.6552863717079163\n",
      "   -2.9475 if pav>=1.2115373611450195\n",
      "--------------\n",
      "   -1.2228 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +2.0219 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -6.5581 if pav<=0.057992350310087246\n",
      "   +0.0000 if cp>=0.045431170612573624 & pav>=0.04802769422531128\n",
      "   +0.0000 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   -1.1017 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   +0.6238 if cv>=0.10210001766681695\n",
      "   +0.6198 if cv>=-0.016934332624077793\n",
      "   -1.6563 if pa<=0.06203033775091171\n",
      "   +0.0000 if cp>=0.155197858810425 & pav>=0.03311513736844063\n",
      "   +1.7751 if pav>=0.6552863717079163\n",
      "   +2.9577 if pav>=1.2115373611450195\n",
      "Run episode 324 with rewards 37.0\n",
      "============ 325 ===========\n",
      "48 actions [0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -0.0100 if pav>=0.105914668738842\n",
      "   -3.9810 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +5.4957 if pav<=0.12216950207948685\n",
      "   +0.0289 if pav<=0.05245797932147981\n",
      "   +0.0289 if pav<=0.025541749224066743\n",
      "   -4.7058 if cp<=0.8425865888595583 & cp>=0.027989277616143227 & pav<=0.14895098209381105 & pav>=0.028040046989917806\n",
      "   +0.0289 if pav<=0.0339961975812912\n",
      "   +0.0289 if pav<=0.04590139463543893\n",
      "   +1.0155 if cp<=0.08578387796878818 & cp>=-0.010901509039103967 & cp>=-0.041150331497192376 & pav<=0.18613080084323883 & pav>=0.03645755499601367\n",
      "   -4.4199 if pav>=0.6552863717079163\n",
      "   -0.0000 if pav>=1.2115373611450195\n",
      "   +1.3276 if \n",
      "--------------\n",
      "   +2.6693 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +2.7041 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.1526 if pav<=0.057992350310087246\n",
      "   +2.2078 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   -2.7748 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   +0.3210 if cv>=0.10210001766681695\n",
      "   -1.1647 if cv>=-0.016934332624077793\n",
      "   -4.4484 if pa<=0.06203033775091171\n",
      "   -0.2097 if cp>=0.155197858810425 & pav>=0.03311513736844063\n",
      "   +5.1511 if pav>=0.6552863717079163\n",
      "   -0.0000 if pav>=1.2115373611450195\n",
      "   -4.3362 if cp<=0.0026425935328006746 & cv<=0.18690054714679719 & cv<=0.5602268218994141 & pav<=0.17806383967399597\n",
      "Run episode 325 with rewards 48.0\n",
      "============ 326 ===========\n",
      "32 actions [0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +0.4115 if pav>=0.105914668738842\n",
      "   -4.7448 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +3.9310 if pav<=0.12216950207948685\n",
      "   +0.6428 if pav<=0.05245797932147981\n",
      "   +0.0158 if pav<=0.025541749224066743\n",
      "   +0.4402 if cp<=0.8425865888595583 & cp>=0.027989277616143227 & pav<=0.14895098209381105 & pav>=0.028040046989917806\n",
      "   +0.6428 if pav<=0.0339961975812912\n",
      "   +0.6428 if pav<=0.04590139463543893\n",
      "   +3.3772 if cp<=0.08578387796878818 & cp>=-0.010901509039103967 & cp>=-0.041150331497192376 & pav<=0.18613080084323883 & pav>=0.03645755499601367\n",
      "   -3.3852 if pav>=0.6552863717079163\n",
      "   +1.7381 if \n",
      "   -0.4798 if pav<=0.1663991153240204\n",
      "--------------\n",
      "   +1.6917 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +3.5685 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -3.5532 if pav<=0.057992350310087246\n",
      "   +2.5927 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   -3.4783 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   +0.3684 if cv>=0.10210001766681695\n",
      "   -0.5093 if cv>=-0.016934332624077793\n",
      "   -4.5952 if pa<=0.06203033775091171\n",
      "   +0.6128 if cp>=0.155197858810425 & pav>=0.03311513736844063\n",
      "   +4.0631 if pav>=0.6552863717079163\n",
      "   -1.0185 if cp<=0.0026425935328006746 & cv<=0.18690054714679719 & cv<=0.5602268218994141 & pav<=0.17806383967399597\n",
      "   -2.5858 if cp>=0.020245856419205687 & cv>=0.38944605588912967 & pav>=-0.0028841398656368096\n",
      "Run episode 326 with rewards 32.0\n",
      "============ 327 ===========\n",
      "29 actions [0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1]\n",
      "   +0.8178 if pav>=0.105914668738842\n",
      "   -3.3251 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +2.4350 if pav<=0.12216950207948685\n",
      "   +0.0342 if pav<=0.05245797932147981\n",
      "   -0.0000 if cp<=0.8425865888595583 & cp>=0.027989277616143227 & pav<=0.14895098209381105 & pav>=0.028040046989917806\n",
      "   +0.0342 if pav<=0.0339961975812912\n",
      "   +0.0342 if pav<=0.04590139463543893\n",
      "   -0.0636 if cp<=0.08578387796878818 & cp>=-0.010901509039103967 & cp>=-0.041150331497192376 & pav<=0.18613080084323883 & pav>=0.03645755499601367\n",
      "   -1.0654 if pav>=0.6552863717079163\n",
      "   +3.2528 if \n",
      "   +0.3467 if pav<=0.1663991153240204\n",
      "   -3.4933 if cp>=-0.04796577394008635 & pa<=0.07924526929855347\n",
      "--------------\n",
      "   +1.7401 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.6784 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.4990 if pav<=0.057992350310087246\n",
      "   -0.0000 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   -2.3356 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -1.6594 if cv>=-0.016934332624077793\n",
      "   -2.7610 if pa<=0.06203033775091171\n",
      "   -0.0000 if cp>=0.155197858810425 & pav>=0.03311513736844063\n",
      "   +2.6413 if pav>=0.6552863717079163\n",
      "   -0.1016 if cp<=0.0026425935328006746 & cv<=0.18690054714679719 & cv<=0.5602268218994141 & pav<=0.17806383967399597\n",
      "   -0.5812 if cp>=0.020245856419205687 & cv>=0.38944605588912967 & pav>=-0.0028841398656368096\n",
      "   -4.6948 if cp<=-0.04796577394008635 & cv<=-0.3538319706916809\n",
      "Run episode 327 with rewards 29.0\n",
      "============ 328 ===========\n",
      "33 actions [0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.4900 if pav>=0.105914668738842\n",
      "   -0.4858 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +1.4185 if pav<=0.12216950207948685\n",
      "   +0.5135 if pav<=0.05245797932147981\n",
      "   +0.3826 if pav<=0.0339961975812912\n",
      "   +0.5135 if pav<=0.04590139463543893\n",
      "   +2.4180 if cp<=0.08578387796878818 & cp>=-0.010901509039103967 & cp>=-0.041150331497192376 & pav<=0.18613080084323883 & pav>=0.03645755499601367\n",
      "   -3.7525 if pav>=0.6552863717079163\n",
      "   +1.9085 if \n",
      "   -0.9510 if pav<=0.1663991153240204\n",
      "   +2.0608 if cp>=-0.04796577394008635 & pa<=0.07924526929855347\n",
      "   -2.5912 if cp>=-0.0263704601675272 & pav>=0.24786307215690617\n",
      "--------------\n",
      "   +2.0048 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +2.0048 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.2880 if pav<=0.057992350310087246\n",
      "   -0.0000 if cp>=0.0517803356051445 & pav>=0.025541749224066743\n",
      "   -3.0425 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   +0.3159 if cv>=-0.016934332624077793\n",
      "   -3.2626 if pa<=0.06203033775091171\n",
      "   +4.4709 if pav>=0.6552863717079163\n",
      "   +1.7583 if cp<=0.0026425935328006746 & cv<=0.18690054714679719 & cv<=0.5602268218994141 & pav<=0.17806383967399597\n",
      "   -0.0000 if cp>=0.020245856419205687 & cv>=0.38944605588912967 & pav>=-0.0028841398656368096\n",
      "   -0.0000 if cp<=-0.04796577394008635 & cv<=-0.3538319706916809\n",
      "   -2.4437 if pav<=0.3732421875000001 & pav>=0.07938803136348728\n",
      "Run episode 328 with rewards 33.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 329 ===========\n",
      "27 actions [0, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1]\n",
      "   +1.0430 if pav>=0.105914668738842\n",
      "   -0.9330 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +1.2182 if pav<=0.12216950207948685\n",
      "   +1.0223 if pav<=0.05245797932147981\n",
      "   +1.0223 if pav<=0.04590139463543893\n",
      "   -0.0000 if cp<=0.08578387796878818 & cp>=-0.010901509039103967 & cp>=-0.041150331497192376 & pav<=0.18613080084323883 & pav>=0.03645755499601367\n",
      "   -3.1639 if pav>=0.6552863717079163\n",
      "   +2.0653 if \n",
      "   -0.2729 if pav<=0.1663991153240204\n",
      "   +0.3633 if cp>=-0.04796577394008635 & pa<=0.07924526929855347\n",
      "   +0.1379 if cp>=-0.0263704601675272 & pav>=0.24786307215690617\n",
      "   -2.0281 if pav>=0.2556222677230835\n",
      "--------------\n",
      "   +2.1220 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +2.4235 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -4.4521 if pav<=0.057992350310087246\n",
      "   -0.1315 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   +2.1549 if cv>=-0.016934332624077793\n",
      "   -4.8769 if pa<=0.06203033775091171\n",
      "   +4.0579 if pav>=0.6552863717079163\n",
      "   +2.6622 if cp<=0.0026425935328006746 & cv<=0.18690054714679719 & cv<=0.5602268218994141 & pav<=0.17806383967399597\n",
      "   +0.0000 if cp>=0.020245856419205687 & cv>=0.38944605588912967 & pav>=-0.0028841398656368096\n",
      "   -1.1817 if cp<=-0.04796577394008635 & cv<=-0.3538319706916809\n",
      "   -4.0031 if pav<=0.3732421875000001 & pav>=0.07938803136348728\n",
      "   +3.8427 if cp<=-0.09116368442773819 & cv>=-0.03606502041220665 & pav>=0.2556222677230835\n",
      "Run episode 329 with rewards 27.0\n",
      "============ 330 ===========\n",
      "26 actions [0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1]\n",
      "   +0.3008 if pav>=0.105914668738842\n",
      "   -1.1676 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.6418 if pav<=0.12216950207948685\n",
      "   +0.6485 if pav<=0.05245797932147981\n",
      "   +0.6485 if pav<=0.04590139463543893\n",
      "   -2.3306 if pav>=0.6552863717079163\n",
      "   +0.9426 if \n",
      "   +2.4242 if pav<=0.1663991153240204\n",
      "   +0.3727 if cp>=-0.04796577394008635 & pa<=0.07924526929855347\n",
      "   -0.0000 if cp>=-0.0263704601675272 & pav>=0.24786307215690617\n",
      "   +3.0847 if pav>=0.2556222677230835\n",
      "   -2.0042 if cp>=-0.08425067514181137 & cv<=-0.0232416495680809\n",
      "--------------\n",
      "   +1.3456 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.3456 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.2733 if pav<=0.057992350310087246\n",
      "   +0.0610 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   +5.5388 if cv>=-0.016934332624077793\n",
      "   -3.9001 if pa<=0.06203033775091171\n",
      "   +2.5806 if pav>=0.6552863717079163\n",
      "   +0.6055 if cp<=0.0026425935328006746 & cv<=0.18690054714679719 & cv<=0.5602268218994141 & pav<=0.17806383967399597\n",
      "   -1.4075 if cp<=-0.04796577394008635 & cv<=-0.3538319706916809\n",
      "   -4.1357 if pav<=0.3732421875000001 & pav>=0.07938803136348728\n",
      "   -0.0000 if cp<=-0.09116368442773819 & cv>=-0.03606502041220665 & pav>=0.2556222677230835\n",
      "   -2.6239 if cv>=0.08992091417312645\n",
      "Run episode 330 with rewards 26.0\n",
      "============ 331 ===========\n",
      "16 actions [0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1]\n",
      "   +0.6229 if pav>=0.105914668738842\n",
      "   -1.5561 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +1.5136 if pav<=0.12216950207948685\n",
      "   +1.5136 if pav<=0.05245797932147981\n",
      "   +1.5136 if pav<=0.04590139463543893\n",
      "   -2.8310 if pav>=0.6552863717079163\n",
      "   +2.1365 if \n",
      "   -1.2731 if pav<=0.1663991153240204\n",
      "   -0.4537 if cp>=-0.04796577394008635 & pa<=0.07924526929855347\n",
      "   +3.4616 if pav>=0.2556222677230835\n",
      "   -4.4698 if cp>=-0.08425067514181137 & cv<=-0.0232416495680809\n",
      "   +0.0178 if cv>=0.5272350907325745\n",
      "--------------\n",
      "   +2.1345 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +2.1345 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.2069 if pav<=0.057992350310087246\n",
      "   -1.9147 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -0.0820 if cv>=-0.016934332624077793\n",
      "   -2.1079 if pa<=0.06203033775091171\n",
      "   +3.0144 if pav>=0.6552863717079163\n",
      "   +3.9817 if cp<=0.0026425935328006746 & cv<=0.18690054714679719 & cv<=0.5602268218994141 & pav<=0.17806383967399597\n",
      "   +0.0000 if cp<=-0.04796577394008635 & cv<=-0.3538319706916809\n",
      "   -4.3608 if pav<=0.3732421875000001 & pav>=0.07938803136348728\n",
      "   -0.0820 if cv>=0.08992091417312645\n",
      "   +2.3619 if cp<=-0.019469626247882843 & pav>=0.6358610391616821\n",
      "Run episode 331 with rewards 16.0\n",
      "============ 332 ===========\n",
      "10 actions [0, 0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +1.3211 if pav>=0.105914668738842\n",
      "   +2.4382 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.5244 if pav<=0.12216950207948685\n",
      "   +0.5244 if pav<=0.05245797932147981\n",
      "   +0.5244 if pav<=0.04590139463543893\n",
      "   +0.3171 if pav>=0.6552863717079163\n",
      "   +1.8455 if \n",
      "   +0.5244 if pav<=0.1663991153240204\n",
      "   +0.0288 if cp>=-0.04796577394008635 & pa<=0.07924526929855347\n",
      "   +1.3068 if pav>=0.2556222677230835\n",
      "   -1.4321 if cp>=-0.08425067514181137 & cv<=-0.0232416495680809\n",
      "   -2.9148 if cp<=-0.12234996259212494 & cp>=-0.1445789784193039 & pav<=0.6008314490318298\n",
      "--------------\n",
      "   +1.3767 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.3767 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.0382 if pav<=0.057992350310087246\n",
      "   -3.3676 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -1.0709 if cv>=-0.016934332624077793\n",
      "   -0.4344 if pa<=0.06203033775091171\n",
      "   +0.6007 if pav>=0.6552863717079163\n",
      "   -0.0382 if cp<=0.0026425935328006746 & cv<=0.18690054714679719 & cv<=0.5602268218994141 & pav<=0.17806383967399597\n",
      "   -1.6882 if pav<=0.3732421875000001 & pav>=0.07938803136348728\n",
      "   -0.0000 if cv>=0.08992091417312645\n",
      "   +0.6007 if cp<=-0.019469626247882843 & pav>=0.6358610391616821\n",
      "   +1.3294 if pav>=0.7336528301239016\n",
      "Run episode 332 with rewards 10.0\n",
      "============ 333 ===========\n",
      "26 actions [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   +0.9167 if pav>=0.105914668738842\n",
      "  -15.0581 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +2.7548 if pav<=0.12216950207948685\n",
      "   +2.7548 if pav<=0.05245797932147981\n",
      "   +2.7548 if pav<=0.04590139463543893\n",
      "   -8.7484 if pav>=0.6552863717079163\n",
      "   +3.6715 if \n",
      "   +2.7548 if pav<=0.1663991153240204\n",
      "   -3.3059 if pav>=0.2556222677230835\n",
      "   +8.6281 if cp>=-0.08425067514181137 & cv<=-0.0232416495680809\n",
      "   +0.3483 if cp<=-0.12234996259212494 & cp>=-0.1445789784193039 & pav<=0.6008314490318298\n",
      "   +1.0000 if cp<=-0.017811225354671476\n",
      "--------------\n",
      "   -0.4620 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -0.4620 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.1671 if pav<=0.057992350310087246\n",
      "   -0.4803 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -0.1671 if cv>=-0.016934332624077793\n",
      "   -0.6525 if pa<=0.06203033775091171\n",
      "   -0.0515 if pav>=0.6552863717079163\n",
      "   +0.0000 if cp<=0.0026425935328006746 & cv<=0.18690054714679719 & cv<=0.5602268218994141 & pav<=0.17806383967399597\n",
      "   -0.3156 if pav<=0.3732421875000001 & pav>=0.07938803136348728\n",
      "   +0.0327 if cp<=-0.019469626247882843 & pav>=0.6358610391616821\n",
      "   -0.0515 if pav>=0.7336528301239016\n",
      "   +0.0047 if pa>=0.16336405277252197\n",
      "Run episode 333 with rewards 26.0\n",
      "============ 334 ===========\n",
      "11 actions [0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1]\n",
      "   -0.3694 if pav>=0.105914668738842\n",
      "   -6.1981 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.5135 if pav<=0.12216950207948685\n",
      "   +1.1476 if pav<=0.05245797932147981\n",
      "   +1.1476 if pav<=0.04590139463543893\n",
      "   -0.5105 if pav>=0.6552863717079163\n",
      "   +0.1441 if \n",
      "   +0.5135 if pav<=0.1663991153240204\n",
      "   +0.0032 if pav>=0.2556222677230835\n",
      "   +1.7390 if cp>=-0.08425067514181137 & cv<=-0.0232416495680809\n",
      "   +0.1211 if cp<=-0.017811225354671476\n",
      "   +0.5492 if cv<=-0.020909873768687248\n",
      "--------------\n",
      "   -0.4288 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -0.4288 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +1.3322 if pav<=0.057992350310087246\n",
      "   -0.4299 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   +1.3919 if cv>=-0.016934332624077793\n",
      "   -0.4322 if pa<=0.06203033775091171\n",
      "   -0.4295 if pav>=0.6552863717079163\n",
      "   +0.0063 if pav<=0.3732421875000001 & pav>=0.07938803136348728\n",
      "   -0.4295 if cp<=-0.019469626247882843 & pav>=0.6358610391616821\n",
      "   -0.4295 if pav>=0.7336528301239016\n",
      "   +1.3921 if pa>=0.16336405277252197\n",
      "   -0.3702 if cp<=-0.036720238626003265\n",
      "Run episode 334 with rewards 11.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 335 ===========\n",
      "9 actions [0, 0, 0, 0, 0, 0, 0, 0, 0]\n",
      "   +2.3619 if pav>=0.105914668738842\n",
      "   +7.7458 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.9207 if pav<=0.12216950207948685\n",
      "   +1.5105 if pav<=0.05245797932147981\n",
      "   +1.5105 if pav<=0.04590139463543893\n",
      "   +2.4615 if pav>=0.6552863717079163\n",
      "   +2.5954 if \n",
      "   +0.9207 if pav<=0.1663991153240204\n",
      "   +2.3828 if cp>=-0.08425067514181137 & cv<=-0.0232416495680809\n",
      "   +2.0934 if cp<=-0.017811225354671476\n",
      "   +2.5292 if cv<=-0.020909873768687248\n",
      "   +1.0000 if cv<=-1.1675808429718018\n",
      "--------------\n",
      "   -3.1052 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   -3.1052 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -3.7489 if pav<=0.057992350310087246\n",
      "   -1.8982 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -3.9148 if cv>=-0.016934332624077793\n",
      "   -0.8524 if pa<=0.06203033775091171\n",
      "   -2.9495 if pav>=0.6552863717079163\n",
      "   -3.5042 if cp<=-0.019469626247882843 & pav>=0.6358610391616821\n",
      "   -2.9495 if pav>=0.7336528301239016\n",
      "   -4.1350 if pa>=0.16336405277252197\n",
      "   -3.3395 if cp<=-0.036720238626003265\n",
      "   +1.0000 if cp>=0.020417679101228724\n",
      "Run episode 335 with rewards 9.0\n",
      "============ 336 ===========\n",
      "94 actions [0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1]\n",
      "   +0.0037 if pav>=0.105914668738842\n",
      "   -0.0000 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   +0.0040 if pav<=0.05245797932147981\n",
      "   +0.0040 if pav<=0.04590139463543893\n",
      "   -0.0000 if pav>=0.6552863717079163\n",
      "   +0.0077 if \n",
      "   +0.0040 if pav<=0.1663991153240204\n",
      "   +0.0037 if cp>=-0.08425067514181137 & cv<=-0.0232416495680809\n",
      "   -0.0000 if cp<=-0.017811225354671476\n",
      "   +0.0037 if cv<=-0.020909873768687248\n",
      "   -0.0000 if cv<=-1.1675808429718018\n",
      "   +0.0077 if cp>=-0.049787537753581995\n",
      "--------------\n",
      "   +3.9680 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +3.9680 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -6.0065 if pav<=0.057992350310087246\n",
      "   -7.3258 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -5.9471 if cv>=-0.016934332624077793\n",
      "   +6.6740 if pav>=0.6552863717079163\n",
      "   +6.8725 if cp<=-0.019469626247882843 & pav>=0.6358610391616821\n",
      "   +6.6740 if pav>=0.7336528301239016\n",
      "  +11.2534 if pa>=0.16336405277252197\n",
      "  +11.8148 if cp<=-0.036720238626003265\n",
      "   +0.3578 if cp>=0.020417679101228724\n",
      "   +1.0000 if pa>=0.20305509865283966\n",
      "Run episode 336 with rewards 94.0\n",
      "============ 337 ===========\n",
      "54 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1]\n",
      "   +2.0508 if pav>=0.105914668738842\n",
      "   -0.2680 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -1.1723 if pav<=0.05245797932147981\n",
      "   -1.1723 if pav<=0.04590139463543893\n",
      "   -3.1580 if \n",
      "   +3.4575 if pav<=0.1663991153240204\n",
      "   -1.0680 if cp>=-0.08425067514181137 & cv<=-0.0232416495680809\n",
      "   +0.4025 if cp<=-0.017811225354671476\n",
      "   -1.0680 if cv<=-0.020909873768687248\n",
      "   +0.0000 if cv<=-1.1675808429718018\n",
      "   +1.0554 if cp>=-0.049787537753581995\n",
      "   +1.4545 if cp<=0.5995281219482423\n",
      "--------------\n",
      "   +1.5560 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +3.9549 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.5738 if pav<=0.057992350310087246\n",
      "   -3.6589 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -4.9541 if cv>=-0.016934332624077793\n",
      "   +7.3025 if pav>=0.6552863717079163\n",
      "   +0.0255 if cp<=-0.019469626247882843 & pav>=0.6358610391616821\n",
      "   +0.5009 if pav>=0.7336528301239016\n",
      "   +7.6489 if pa>=0.16336405277252197\n",
      "   +6.0375 if cp<=-0.036720238626003265\n",
      "   +0.6835 if pa>=0.20305509865283966\n",
      "   -5.3810 if cp>=-0.013850249908864498 & pa<=0.05273257568478584\n",
      "Run episode 337 with rewards 54.0\n",
      "============ 338 ===========\n",
      "41 actions [1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0]\n",
      "   -3.4442 if pav>=0.105914668738842\n",
      "   +0.0000 if pa>=0.06150407791137695 & pav>=0.0003513446099532305\n",
      "   -1.6336 if pav<=0.05245797932147981\n",
      "   -1.6336 if pav<=0.04590139463543893\n",
      "   +0.1062 if \n",
      "   +3.5128 if pav<=0.1663991153240204\n",
      "   +1.7397 if cp>=-0.08425067514181137 & cv<=-0.0232416495680809\n",
      "   +0.1059 if cp<=-0.017811225354671476\n",
      "   -3.2697 if cv<=-0.020909873768687248\n",
      "   +2.2085 if cp>=-0.049787537753581995\n",
      "   +0.1060 if cp<=0.5995281219482423\n",
      "   -5.0570 if pa>=-0.012810707092285156\n",
      "--------------\n",
      "   +3.4075 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +3.4075 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.7486 if pav<=0.057992350310087246\n",
      "   -2.0129 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -4.1373 if cv>=-0.016934332624077793\n",
      "   -0.0000 if pav>=0.6552863717079163\n",
      "   -0.0000 if pav>=0.7336528301239016\n",
      "   -0.0000 if pa>=0.16336405277252197\n",
      "   +2.5818 if cp<=-0.036720238626003265\n",
      "   -0.0000 if pa>=0.20305509865283966\n",
      "   -0.0000 if cp>=-0.013850249908864498 & pa<=0.05273257568478584\n",
      "   +5.1083 if pa>=-0.012810707092285156\n",
      "Run episode 338 with rewards 41.0\n",
      "============ 339 ===========\n",
      "59 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1]\n",
      "   -3.1485 if pav>=0.105914668738842\n",
      "   +0.7785 if pav<=0.05245797932147981\n",
      "   +0.7759 if pav<=0.04590139463543893\n",
      "   -1.6813 if \n",
      "   +1.2249 if pav<=0.1663991153240204\n",
      "   +1.0469 if cp>=-0.08425067514181137 & cv<=-0.0232416495680809\n",
      "   -0.2027 if cp<=-0.017811225354671476\n",
      "   -0.1227 if cv<=-0.020909873768687248\n",
      "   +3.1116 if cp>=-0.049787537753581995\n",
      "   -1.6813 if cp<=0.5995281219482423\n",
      "   -6.4259 if pa>=-0.012810707092285156\n",
      "   +5.0370 if cp>=0.069877527654171 & cv<=-0.3840923011302948 & pa<=-0.10324875265359879 & pav<=0.16621984541416168 & pav>=-0.024124905467033355\n",
      "--------------\n",
      "   +3.4445 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +2.8177 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.0960 if pav<=0.057992350310087246\n",
      "   -1.5988 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   +0.1007 if cv>=-0.016934332624077793\n",
      "   +0.0000 if pav>=0.6552863717079163\n",
      "   +0.0000 if pa>=0.16336405277252197\n",
      "   +2.0757 if cp<=-0.036720238626003265\n",
      "   +0.0000 if pa>=0.20305509865283966\n",
      "   -1.1692 if cp>=-0.013850249908864498 & pa<=0.05273257568478584\n",
      "   +5.1665 if pa>=-0.012810707092285156\n",
      "   +3.1807 if cp>=0.10926582664251328 & cv>=-0.3840923011302948 & pav>=-0.024124905467033355\n",
      "Run episode 339 with rewards 59.0\n",
      "============ 340 ===========\n",
      "75 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0]\n",
      "   -4.2094 if pav>=0.105914668738842\n",
      "   +0.0375 if pav<=0.05245797932147981\n",
      "   +0.0375 if pav<=0.04590139463543893\n",
      "   -0.2911 if \n",
      "   +1.1903 if pav<=0.1663991153240204\n",
      "   +0.3611 if cp>=-0.08425067514181137 & cv<=-0.0232416495680809\n",
      "   -0.5382 if cp<=-0.017811225354671476\n",
      "   +1.5128 if cp>=-0.049787537753581995\n",
      "   -0.2911 if cp<=0.5995281219482423\n",
      "   -4.4687 if pa>=-0.012810707092285156\n",
      "   +0.0000 if cp>=0.069877527654171 & cv<=-0.3840923011302948 & pa<=-0.10324875265359879 & pav<=0.16621984541416168 & pav>=-0.024124905467033355\n",
      "   +2.1094 if pa>=-0.0184244766831398\n",
      "--------------\n",
      "   +3.4681 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +3.4681 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.6330 if pav<=0.057992350310087246\n",
      "   -2.0270 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -2.1613 if cv>=-0.016934332624077793\n",
      "   -0.0000 if pav>=0.6552863717079163\n",
      "   -0.0000 if pa>=0.16336405277252197\n",
      "   +2.1538 if cp<=-0.036720238626003265\n",
      "   -0.7488 if cp>=-0.013850249908864498 & pa<=0.05273257568478584\n",
      "   +2.3082 if pa>=-0.012810707092285156\n",
      "   -0.0000 if cp>=0.10926582664251328 & cv>=-0.3840923011302948 & pav>=-0.024124905467033355\n",
      "   -4.1669 if cv>=-0.038128226250410076 & pa<=-0.03187356479465961 & pa>=-0.05336616933345794 & pav<=-0.005363373120780937\n",
      "Run episode 340 with rewards 75.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 341 ===========\n",
      "64 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0]\n",
      "   -0.7647 if pav>=0.105914668738842\n",
      "   +1.3370 if pav<=0.05245797932147981\n",
      "   +1.3370 if pav<=0.04590139463543893\n",
      "   -0.6374 if \n",
      "   -0.1130 if pav<=0.1663991153240204\n",
      "   -1.4871 if cp>=-0.08425067514181137 & cv<=-0.0232416495680809\n",
      "   -0.6372 if cp<=-0.017811225354671476\n",
      "   -2.2777 if cp>=-0.049787537753581995\n",
      "   -0.6374 if cp<=0.5995281219482423\n",
      "   +0.5270 if pa>=-0.012810707092285156\n",
      "   -0.6615 if pa>=-0.0184244766831398\n",
      "   +3.6221 if cp>=-0.09509782195091246\n",
      "--------------\n",
      "   +4.5897 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +4.5897 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -5.5235 if pav<=0.057992350310087246\n",
      "   -4.8173 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -7.4419 if cv>=-0.016934332624077793\n",
      "   +0.0000 if pa>=0.16336405277252197\n",
      "   +8.9190 if cp<=-0.036720238626003265\n",
      "   +0.0000 if cp>=-0.013850249908864498 & pa<=0.05273257568478584\n",
      "   +1.7558 if pa>=-0.012810707092285156\n",
      "   +0.0000 if cp>=0.10926582664251328 & cv>=-0.3840923011302948 & pav>=-0.024124905467033355\n",
      "   -0.0950 if cv>=-0.038128226250410076 & pa<=-0.03187356479465961 & pa>=-0.05336616933345794 & pav<=-0.005363373120780937\n",
      "   -3.5617 if pa<=-0.024554470181465147\n",
      "Run episode 341 with rewards 64.0\n",
      "============ 342 ===========\n",
      "38 actions [1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1]\n",
      "   -2.5401 if pav>=0.105914668738842\n",
      "   -1.7826 if pav<=0.05245797932147981\n",
      "   -1.7826 if pav<=0.04590139463543893\n",
      "   -0.3373 if \n",
      "   -0.0519 if cp>=-0.08425067514181137 & cv<=-0.0232416495680809\n",
      "   -0.8399 if cp<=-0.017811225354671476\n",
      "   -0.3373 if cp>=-0.049787537753581995\n",
      "   -0.3373 if cp<=0.5995281219482423\n",
      "   -0.3780 if pa>=-0.012810707092285156\n",
      "   -0.3373 if pa>=-0.0184244766831398\n",
      "   -0.3373 if cp>=-0.09509782195091246\n",
      "   +4.9419 if cp<=-0.0008626096241641661 & cv>=-0.031332161650061606 & pav<=0.2735911250114441\n",
      "--------------\n",
      "   +2.4206 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +6.1575 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.7179 if pav<=0.057992350310087246\n",
      "   -7.5567 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -4.9227 if cv>=-0.016934332624077793\n",
      "   +3.2545 if cp<=-0.036720238626003265\n",
      "   +1.0910 if cp>=-0.013850249908864498 & pa<=0.05273257568478584\n",
      "   +1.7465 if pa>=-0.012810707092285156\n",
      "   +5.5697 if cp>=0.10926582664251328 & cv>=-0.3840923011302948 & pav>=-0.024124905467033355\n",
      "   +0.0000 if cv>=-0.038128226250410076 & pa<=-0.03187356479465961 & pa>=-0.05336616933345794 & pav<=-0.005363373120780937\n",
      "   +0.0003 if pa<=-0.024554470181465147\n",
      "   +3.3268 if cp<=-0.027232754603028295 & cv<=0.3430480003356934 & cv>=0.16532536149024965 & pa<=0.08026138395071031 & pa>=0.05639499574899674\n",
      "Run episode 342 with rewards 38.0\n",
      "============ 343 ===========\n",
      "47 actions [0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0]\n",
      "   -1.4109 if pav>=0.105914668738842\n",
      "   -0.9311 if pav<=0.05245797932147981\n",
      "   -0.9311 if pav<=0.04590139463543893\n",
      "   -0.2906 if \n",
      "   +0.0000 if cp<=-0.017811225354671476\n",
      "   -0.2906 if cp>=-0.049787537753581995\n",
      "   -0.2906 if cp<=0.5995281219482423\n",
      "   -2.3112 if pa>=-0.012810707092285156\n",
      "   -2.3112 if pa>=-0.0184244766831398\n",
      "   -0.2906 if cp>=-0.09509782195091246\n",
      "   +0.0000 if cp<=-0.0008626096241641661 & cv>=-0.031332161650061606 & pav<=0.2735911250114441\n",
      "   +3.8358 if cp<=0.044039408117532736 & pav<=0.04885842204093936\n",
      "--------------\n",
      "   +3.1676 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +3.1676 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.7254 if pav<=0.057992350310087246\n",
      "   -2.6968 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -1.9297 if cv>=-0.016934332624077793\n",
      "   +0.0000 if cp<=-0.036720238626003265\n",
      "   +0.9489 if cp>=-0.013850249908864498 & pa<=0.05273257568478584\n",
      "   +2.0307 if pa>=-0.012810707092285156\n",
      "   +4.4994 if cp>=0.10926582664251328 & cv>=-0.3840923011302948 & pav>=-0.024124905467033355\n",
      "   -3.7072 if pa<=-0.024554470181465147\n",
      "   +0.0000 if cp<=-0.027232754603028295 & cv<=0.3430480003356934 & cv>=0.16532536149024965 & pa<=0.08026138395071031 & pa>=0.05639499574899674\n",
      "   -4.0611 if cp<=0.044039408117532736\n",
      "Run episode 343 with rewards 47.0\n",
      "============ 344 ===========\n",
      "96 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1]\n",
      "   -3.3967 if pav>=0.105914668738842\n",
      "   -2.1350 if pav<=0.05245797932147981\n",
      "   -2.1350 if pav<=0.04590139463543893\n",
      "   -0.3969 if \n",
      "   -0.3969 if cp>=-0.049787537753581995\n",
      "   -0.3969 if cp<=0.5995281219482423\n",
      "   -0.2255 if pa>=-0.012810707092285156\n",
      "   -0.7420 if pa>=-0.0184244766831398\n",
      "   -0.3969 if cp>=-0.09509782195091246\n",
      "   +0.0000 if cp<=-0.0008626096241641661 & cv>=-0.031332161650061606 & pav<=0.2735911250114441\n",
      "   +2.8817 if cp<=0.044039408117532736 & pav<=0.04885842204093936\n",
      "   +0.8841 if pa>=0.06627633720636368\n",
      "--------------\n",
      "   +4.0310 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +4.0310 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +0.2321 if pav<=0.057992350310087246\n",
      "   -2.9723 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -2.0649 if cv>=-0.016934332624077793\n",
      "   +0.7081 if cp>=-0.013850249908864498 & pa<=0.05273257568478584\n",
      "   -0.7664 if pa>=-0.012810707092285156\n",
      "   -0.0001 if cp>=0.10926582664251328 & cv>=-0.3840923011302948 & pav>=-0.024124905467033355\n",
      "   -1.2759 if pa<=-0.024554470181465147\n",
      "   -0.0000 if cp<=-0.027232754603028295 & cv<=0.3430480003356934 & cv>=0.16532536149024965 & pa<=0.08026138395071031 & pa>=0.05639499574899674\n",
      "   -3.7160 if cp<=0.044039408117532736\n",
      "   -1.2256 if pa>=0.06627633720636368\n",
      "Run episode 344 with rewards 96.0\n",
      "============ 345 ===========\n",
      "145 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1]\n",
      "   -2.5543 if pav>=0.105914668738842\n",
      "   +0.9141 if pav<=0.05245797932147981\n",
      "   +0.9141 if pav<=0.04590139463543893\n",
      "   -1.0216 if \n",
      "   +2.7932 if cp>=-0.049787537753581995\n",
      "   -1.0216 if cp<=0.5995281219482423\n",
      "   -1.2131 if pa>=-0.012810707092285156\n",
      "   -0.3432 if pa>=-0.0184244766831398\n",
      "   -3.3773 if cp>=-0.09509782195091246\n",
      "   +0.9139 if cp<=0.044039408117532736 & pav<=0.04885842204093936\n",
      "   +1.8735 if pa>=0.06627633720636368\n",
      "   +3.5328 if cv>=-0.18048720061779022 & pa<=-0.004059776198118925\n",
      "--------------\n",
      "   +2.1396 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +4.0397 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -3.6432 if pav<=0.057992350310087246\n",
      "   -2.3790 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -4.3473 if cv>=-0.016934332624077793\n",
      "   -0.0001 if cp>=-0.013850249908864498 & pa<=0.05273257568478584\n",
      "   -0.4845 if pa>=-0.012810707092285156\n",
      "   -0.0000 if cp>=0.10926582664251328 & cv>=-0.3840923011302948 & pav>=-0.024124905467033355\n",
      "   -0.2397 if pa<=-0.024554470181465147\n",
      "   -1.0856 if cp<=0.044039408117532736\n",
      "   -0.5126 if pa>=0.06627633720636368\n",
      "   +5.2513 if cp>=-0.08059857785701752 & cv<=0.014681009575724603 & pa>=-0.004059776198118925 & pav<=-0.07986588776111603\n",
      "Run episode 345 with rewards 145.0\n",
      "============ 346 ===========\n",
      "126 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -1.7943 if pav>=0.105914668738842\n",
      "   +1.6187 if pav<=0.05245797932147981\n",
      "   +1.6090 if pav<=0.04590139463543893\n",
      "   +0.3404 if \n",
      "   -1.3763 if cp>=-0.049787537753581995\n",
      "   +0.3404 if cp<=0.5995281219482423\n",
      "   -3.8173 if pa>=-0.012810707092285156\n",
      "   -3.5179 if cp>=-0.09509782195091246\n",
      "   +1.6092 if cp<=0.044039408117532736 & pav<=0.04885842204093936\n",
      "   +1.3865 if pa>=0.06627633720636368\n",
      "   +6.0837 if cv>=-0.18048720061779022 & pa<=-0.004059776198118925\n",
      "   -1.0833 if pa>=-0.0010778869735077012\n",
      "--------------\n",
      "   +4.1262 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +4.2740 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.5606 if pav<=0.057992350310087246\n",
      "   -2.6087 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -4.7104 if cv>=-0.016934332624077793\n",
      "   -2.1958 if cp>=-0.013850249908864498 & pa<=0.05273257568478584\n",
      "   +2.6337 if pa>=-0.012810707092285156\n",
      "   +0.7040 if pa<=-0.024554470181465147\n",
      "   -3.6324 if cp<=0.044039408117532736\n",
      "   -2.2614 if pa>=0.06627633720636368\n",
      "   +4.6534 if cp>=-0.08059857785701752 & cv<=0.014681009575724603 & pa>=-0.004059776198118925 & pav<=-0.07986588776111603\n",
      "   +4.9849 if cp<=-0.019790080562233924 & cp>=-0.05575457662343977 & cv<=0.008943953551352026 & pa>=-0.0010778869735077012\n",
      "Run episode 346 with rewards 126.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 347 ===========\n",
      "108 actions [0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1]\n",
      "   -3.3312 if pav>=0.105914668738842\n",
      "   +1.4980 if pav<=0.05245797932147981\n",
      "   +1.4954 if pav<=0.04590139463543893\n",
      "   -1.4291 if cp>=-0.049787537753581995\n",
      "   +4.4878 if cp<=0.5995281219482423\n",
      "   -0.7923 if pa>=-0.012810707092285156\n",
      "   -1.4287 if cp>=-0.09509782195091246\n",
      "   +1.8880 if cp<=0.044039408117532736 & pav<=0.04885842204093936\n",
      "   -3.8593 if pa>=0.06627633720636368\n",
      "   +0.0336 if cv>=-0.18048720061779022 & pa<=-0.004059776198118925\n",
      "   -0.7556 if pa>=-0.0010778869735077012\n",
      "   -4.1905 if cv<=1.090015172958374 & pav>=-0.1139802634716034\n",
      "--------------\n",
      "   +4.2676 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +4.2704 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -3.3302 if pav<=0.057992350310087246\n",
      "   -4.1315 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -2.6063 if cv>=-0.016934332624077793\n",
      "   -0.3539 if cp>=-0.013850249908864498 & pa<=0.05273257568478584\n",
      "   -1.8135 if pa>=-0.012810707092285156\n",
      "   -4.8169 if cp<=0.044039408117532736\n",
      "   +1.6628 if pa>=0.06627633720636368\n",
      "   +0.0000 if cp>=-0.08059857785701752 & cv<=0.014681009575724603 & pa>=-0.004059776198118925 & pav<=-0.07986588776111603\n",
      "   +0.0000 if cp<=-0.019790080562233924 & cp>=-0.05575457662343977 & cv<=0.008943953551352026 & pa>=-0.0010778869735077012\n",
      "   +4.3773 if pa>=0.16891589760780334\n",
      "Run episode 347 with rewards 108.0\n",
      "============ 348 ===========\n",
      "115 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1]\n",
      "   -0.8383 if pav>=0.105914668738842\n",
      "   -1.5409 if pav<=0.05245797932147981\n",
      "   +7.1653 if pav<=0.04590139463543893\n",
      "   -1.5869 if cp>=-0.049787537753581995\n",
      "   +2.8832 if cp<=0.5995281219482423\n",
      "   -1.5869 if pa>=-0.012810707092285156\n",
      "   -1.5869 if cp>=-0.09509782195091246\n",
      "   +0.1207 if cp<=0.044039408117532736 & pav<=0.04885842204093936\n",
      "   -3.1504 if pa>=0.06627633720636368\n",
      "   -1.5869 if pa>=-0.0010778869735077012\n",
      "   -5.6614 if cv<=1.090015172958374 & pav>=-0.1139802634716034\n",
      "   +4.7163 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "--------------\n",
      "   +3.9273 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +2.1892 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -3.1073 if pav<=0.057992350310087246\n",
      "   -3.7571 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -2.7481 if cv>=-0.016934332624077793\n",
      "   +0.6980 if cp>=-0.013850249908864498 & pa<=0.05273257568478584\n",
      "   -0.3982 if pa>=-0.012810707092285156\n",
      "   -4.1619 if cp<=0.044039408117532736\n",
      "   -0.4309 if pa>=0.06627633720636368\n",
      "   +0.0000 if cp<=-0.019790080562233924 & cp>=-0.05575457662343977 & cv<=0.008943953551352026 & pa>=-0.0010778869735077012\n",
      "   +4.0309 if pa>=0.16891589760780334\n",
      "   +5.7470 if cv<=0.7265483379364014 & pa>=0.1111291527748108 & pav>=-0.13545677959918975\n",
      "Run episode 348 with rewards 115.0\n",
      "============ 349 ===========\n",
      "108 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0]\n",
      "   -2.1424 if pav>=0.105914668738842\n",
      "   +2.3407 if pav<=0.05245797932147981\n",
      "   +3.1401 if pav<=0.04590139463543893\n",
      "   -1.8395 if cp>=-0.049787537753581995\n",
      "   +0.9891 if cp<=0.5995281219482423\n",
      "   -1.8395 if pa>=-0.012810707092285156\n",
      "   -1.8395 if cp>=-0.09509782195091246\n",
      "   -1.7227 if pa>=0.06627633720636368\n",
      "   -1.8395 if pa>=-0.0010778869735077012\n",
      "   -1.2592 if cv<=1.090015172958374 & pav>=-0.1139802634716034\n",
      "   +4.0669 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -1.7824 if cv<=1.8233052253723145\n",
      "--------------\n",
      "   +2.8953 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +2.8963 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -3.5223 if pav<=0.057992350310087246\n",
      "   -3.9010 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -1.0382 if cv>=-0.016934332624077793\n",
      "   -0.4089 if cp>=-0.013850249908864498 & pa<=0.05273257568478584\n",
      "   -0.3342 if pa>=-0.012810707092285156\n",
      "   -4.0064 if cp<=0.044039408117532736\n",
      "   -1.7849 if pa>=0.06627633720636368\n",
      "   +4.4264 if pa>=0.16891589760780334\n",
      "   +0.0656 if cv<=0.7265483379364014 & pa>=0.1111291527748108 & pav>=-0.13545677959918975\n",
      "   +8.3523 if cp<=0.6332397222518922 & cv<=1.2735252141952516 & pa>=0.1352175295352936\n",
      "Run episode 349 with rewards 108.0\n",
      "============ 350 ===========\n",
      "112 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1]\n",
      "   -3.4567 if pav>=0.105914668738842\n",
      "   +1.0689 if pav<=0.05245797932147981\n",
      "   +1.0688 if pav<=0.04590139463543893\n",
      "   -1.0887 if cp>=-0.049787537753581995\n",
      "   -1.0887 if pa>=-0.012810707092285156\n",
      "   -1.0887 if cp>=-0.09509782195091246\n",
      "   -0.9453 if pa>=0.06627633720636368\n",
      "   -1.0887 if pa>=-0.0010778869735077012\n",
      "   +0.8672 if cv<=1.090015172958374 & pav>=-0.1139802634716034\n",
      "   +4.4619 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -1.3649 if cv<=1.8233052253723145\n",
      "   -2.0272 if pav>=0.0027710466645658313\n",
      "--------------\n",
      "   +2.3674 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +2.3752 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.8830 if pav<=0.057992350310087246\n",
      "   -0.9205 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -2.3796 if cv>=-0.016934332624077793\n",
      "   +0.1039 if cp>=-0.013850249908864498 & pa<=0.05273257568478584\n",
      "   -2.1138 if pa>=-0.012810707092285156\n",
      "   -5.1221 if cp<=0.044039408117532736\n",
      "   -1.2050 if pa>=0.06627633720636368\n",
      "   +5.3528 if pa>=0.16891589760780334\n",
      "   +6.3394 if cp<=0.6332397222518922 & cv<=1.2735252141952516 & pa>=0.1352175295352936\n",
      "   +5.8988 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "Run episode 350 with rewards 112.0\n",
      "============ 351 ===========\n",
      "85 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   -5.8370 if pav>=0.105914668738842\n",
      "   -0.7973 if pav<=0.05245797932147981\n",
      "   -1.6252 if pav<=0.04590139463543893\n",
      "   +1.9528 if cp>=-0.049787537753581995\n",
      "   +1.9528 if pa>=-0.012810707092285156\n",
      "   +1.9528 if cp>=-0.09509782195091246\n",
      "   -5.9065 if pa>=0.06627633720636368\n",
      "   +1.9528 if pa>=-0.0010778869735077012\n",
      "   +4.3967 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -1.9365 if cv<=1.8233052253723145\n",
      "   -4.3275 if pav>=0.0027710466645658313\n",
      "   -2.1797 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "--------------\n",
      "   +1.0702 if cp<=0.09485256969928751 & pav>=0.105914668738842\n",
      "   +1.0704 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -3.8709 if pav<=0.057992350310087246\n",
      "   -1.3085 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -6.1718 if cv>=-0.016934332624077793\n",
      "   -3.8309 if pa>=-0.012810707092285156\n",
      "   -5.4019 if cp<=0.044039408117532736\n",
      "   +3.7472 if pa>=0.06627633720636368\n",
      "   +5.3242 if pa>=0.16891589760780334\n",
      "   +8.2101 if cp<=0.6332397222518922 & cv<=1.2735252141952516 & pa>=0.1352175295352936\n",
      "   +2.4560 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "   +4.3476 if cp<=0.16845353841781624\n",
      "Run episode 351 with rewards 85.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 352 ===========\n",
      "100 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -4.5990 if pav>=0.105914668738842\n",
      "   +1.4835 if pav<=0.04590139463543893\n",
      "   +0.7393 if cp>=-0.049787537753581995\n",
      "   +0.7393 if pa>=-0.012810707092285156\n",
      "   +0.7393 if cp>=-0.09509782195091246\n",
      "   -6.1077 if pa>=0.06627633720636368\n",
      "   +0.7393 if pa>=-0.0010778869735077012\n",
      "   +4.0864 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +2.3884 if cv<=1.8233052253723145\n",
      "   -3.7449 if pav>=0.0027710466645658313\n",
      "   -4.1544 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   -0.9847 if cv<=0.5537882566452026\n",
      "--------------\n",
      "   -0.3908 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -6.1511 if pav<=0.057992350310087246\n",
      "   -2.9921 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -7.2937 if cv>=-0.016934332624077793\n",
      "   -0.1338 if pa>=-0.012810707092285156\n",
      "   -4.3147 if cp<=0.044039408117532736\n",
      "   +2.6415 if pa>=0.06627633720636368\n",
      "   -0.0549 if pa>=0.16891589760780334\n",
      "   +7.1067 if cp<=0.6332397222518922 & cv<=1.2735252141952516 & pa>=0.1352175295352936\n",
      "   -1.7141 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "   +3.8688 if cp<=0.16845353841781624\n",
      "   +2.0402 if cv<=0.5537882566452026 & pav>=-0.06207260489463806\n",
      "Run episode 352 with rewards 100.0\n",
      "============ 353 ===========\n",
      "113 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -5.0529 if pav>=0.105914668738842\n",
      "   +0.8180 if pav<=0.04590139463543893\n",
      "   +1.6881 if cp>=-0.049787537753581995\n",
      "   +1.6881 if pa>=-0.012810707092285156\n",
      "   -2.6720 if pa>=0.06627633720636368\n",
      "   +1.6881 if pa>=-0.0010778869735077012\n",
      "   +6.7251 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +2.0902 if cv<=1.8233052253723145\n",
      "   -6.6822 if pav>=0.0027710466645658313\n",
      "   -3.4844 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   -0.7696 if cv<=0.5537882566452026\n",
      "   -2.6564 if cv>=0.12479247599840164\n",
      "--------------\n",
      "   +3.4619 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -5.2594 if pav<=0.057992350310087246\n",
      "   -3.3919 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -1.9955 if cv>=-0.016934332624077793\n",
      "   -0.6776 if pa>=-0.012810707092285156\n",
      "   -3.3984 if cp<=0.044039408117532736\n",
      "   -1.9872 if pa>=0.06627633720636368\n",
      "   +1.9978 if cp<=0.6332397222518922 & cv<=1.2735252141952516 & pa>=0.1352175295352936\n",
      "   +3.8696 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "   +2.3483 if cp<=0.16845353841781624\n",
      "   +2.5171 if cv<=0.5537882566452026 & pav>=-0.06207260489463806\n",
      "   -2.4985 if cv<=0.4235154509544375\n",
      "Run episode 353 with rewards 113.0\n",
      "origin 302.56631675514944 new 31724.76295977612 not updated\n",
      "============ 354 ===========\n",
      "141 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -5.0529 if pav>=0.105914668738842\n",
      "   +0.8180 if pav<=0.04590139463543893\n",
      "   +1.6881 if cp>=-0.049787537753581995\n",
      "   +1.6881 if pa>=-0.012810707092285156\n",
      "   -2.6720 if pa>=0.06627633720636368\n",
      "   +1.6881 if pa>=-0.0010778869735077012\n",
      "   +6.7251 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +2.0902 if cv<=1.8233052253723145\n",
      "   -6.6822 if pav>=0.0027710466645658313\n",
      "   -3.4844 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   -0.7696 if cv<=0.5537882566452026\n",
      "   -2.6564 if cv>=0.12479247599840164\n",
      "--------------\n",
      "   +2.1102 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -7.2245 if pav<=0.057992350310087246\n",
      "   -4.4940 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -1.7469 if cv>=-0.016934332624077793\n",
      "   -3.2970 if cp<=0.044039408117532736\n",
      "   -1.6610 if pa>=0.06627633720636368\n",
      "   +0.0444 if cp<=0.6332397222518922 & cv<=1.2735252141952516 & pa>=0.1352175295352936\n",
      "   +5.6895 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "   +2.3564 if cp<=0.16845353841781624\n",
      "   -3.1102 if cv<=0.5537882566452026 & pav>=-0.06207260489463806\n",
      "   +4.3265 if cv<=0.4235154509544375\n",
      "   +3.4690 if cp>=-0.041911496222019194 & pa>=0.062811429053545\n",
      "Run episode 354 with rewards 141.0\n",
      "============ 355 ===========\n",
      "86 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1]\n",
      "   -5.4732 if pav>=0.105914668738842\n",
      "   +0.5828 if pav<=0.04590139463543893\n",
      "   +0.8473 if cp>=-0.049787537753581995\n",
      "   +0.2529 if pa>=-0.012810707092285156\n",
      "   -1.7080 if pa>=0.06627633720636368\n",
      "   -0.1861 if pa>=-0.0010778869735077012\n",
      "   +5.6647 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +4.7273 if cv<=1.8233052253723145\n",
      "   -6.6777 if pav>=0.0027710466645658313\n",
      "   -2.2545 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   -1.6812 if cv>=0.12479247599840164\n",
      "   -1.6615 if pav<=0.03712228685617447\n",
      "--------------\n",
      "   +3.7244 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -3.4823 if pav<=0.057992350310087246\n",
      "   +0.4838 if pa<=0.098355832695961 & pav>=0.03007043376564981\n",
      "   -1.7895 if cv>=-0.016934332624077793\n",
      "   -0.9377 if cp<=0.044039408117532736\n",
      "   -1.5189 if pa>=0.06627633720636368\n",
      "   +5.0019 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "   -1.1304 if cp<=0.16845353841781624\n",
      "   -2.4647 if cv<=0.5537882566452026 & pav>=-0.06207260489463806\n",
      "   -0.7519 if cv<=0.4235154509544375\n",
      "   +0.8278 if cp>=-0.041911496222019194 & pa>=0.062811429053545\n",
      "   -2.5215 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "Run episode 355 with rewards 86.0\n",
      "============ 356 ===========\n",
      "73 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1]\n",
      "   -6.6784 if pav>=0.105914668738842\n",
      "   +0.1250 if pav<=0.04590139463543893\n",
      "   +3.3426 if cp>=-0.049787537753581995\n",
      "   +3.3444 if pa>=-0.012810707092285156\n",
      "   -0.0275 if pa>=0.06627633720636368\n",
      "   +3.5253 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -6.0374 if cv<=1.8233052253723145\n",
      "   -2.0630 if pav>=0.0027710466645658313\n",
      "   -4.8076 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   +0.1840 if cv>=0.12479247599840164\n",
      "   +0.9553 if pav<=0.03712228685617447\n",
      "   +1.1176 if cp>=0.007020970340818167\n",
      "--------------\n",
      "   +2.8126 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.6942 if pav<=0.057992350310087246\n",
      "   -2.2071 if cv>=-0.016934332624077793\n",
      "   -1.5713 if cp<=0.044039408117532736\n",
      "   -1.2607 if pa>=0.06627633720636368\n",
      "   +4.4522 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "   -0.5065 if cp<=0.16845353841781624\n",
      "   -0.5008 if cv<=0.5537882566452026 & pav>=-0.06207260489463806\n",
      "   -1.4934 if cv<=0.4235154509544375\n",
      "   -1.2607 if cp>=-0.041911496222019194 & pa>=0.062811429053545\n",
      "   -1.4934 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   +1.8231 if cv<=0.3260839581489563\n",
      "Run episode 356 with rewards 73.0\n",
      "============ 357 ===========\n",
      "99 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   -7.7548 if pav>=0.105914668738842\n",
      "   -0.1138 if pav<=0.04590139463543893\n",
      "   -1.3179 if cp>=-0.049787537753581995\n",
      "   -1.3179 if pa>=-0.012810707092285156\n",
      "   +2.5545 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -1.3147 if cv<=1.8233052253723145\n",
      "   -2.2861 if pav>=0.0027710466645658313\n",
      "   +3.9115 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   -1.3952 if cv>=0.12479247599840164\n",
      "   +4.9882 if pav<=0.03712228685617447\n",
      "   -1.3206 if cp>=0.007020970340818167\n",
      "   +1.6016 if cp>=0.39807631969451907\n",
      "--------------\n",
      "   +1.4658 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -5.9961 if pav<=0.057992350310087246\n",
      "   -1.0605 if cv>=-0.016934332624077793\n",
      "   -1.1625 if cp<=0.044039408117532736\n",
      "   +0.3634 if pa>=0.06627633720636368\n",
      "   +1.1080 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "   -1.7242 if cp<=0.16845353841781624\n",
      "   -0.9864 if cv<=0.4235154509544375\n",
      "   +0.3634 if cp>=-0.041911496222019194 & pa>=0.062811429053545\n",
      "   -0.9864 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   -0.9973 if cv<=0.3260839581489563\n",
      "   +0.4107 if pav<=0.05521502792835236\n",
      "Run episode 357 with rewards 99.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 358 ===========\n",
      "76 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1]\n",
      "   -3.9291 if pav>=0.105914668738842\n",
      "   -0.4198 if cp>=-0.049787537753581995\n",
      "   +0.0953 if pa>=-0.012810707092285156\n",
      "   +1.4288 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.5616 if cv<=1.8233052253723145\n",
      "   -1.3127 if pav>=0.0027710466645658313\n",
      "   -0.7696 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   -3.5131 if cv>=0.12479247599840164\n",
      "   +2.7081 if pav<=0.03712228685617447\n",
      "   +1.2760 if cp>=0.007020970340818167\n",
      "   +0.0019 if cp>=0.39807631969451907\n",
      "   -4.3845 if pa<=0.04466329440474512\n",
      "--------------\n",
      "   +1.1816 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.2857 if pav<=0.057992350310087246\n",
      "   +0.2699 if cv>=-0.016934332624077793\n",
      "   +0.2662 if cp<=0.044039408117532736\n",
      "   -1.7404 if pa>=0.06627633720636368\n",
      "   +1.4094 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "   -0.5437 if cp<=0.16845353841781624\n",
      "   -0.8186 if cv<=0.4235154509544375\n",
      "   -0.8728 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   -0.8039 if cv<=0.3260839581489563\n",
      "   -2.2857 if pav<=0.05521502792835236\n",
      "   -4.6738 if cp<=-0.12717827260494233 & cv>=-0.23145818412303926 & pav>=0.2674963116645813\n",
      "Run episode 358 with rewards 76.0\n",
      "============ 359 ===========\n",
      "67 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -3.4972 if pav>=0.105914668738842\n",
      "   +0.3125 if cp>=-0.049787537753581995\n",
      "   +2.6761 if pa>=-0.012810707092285156\n",
      "   +1.8703 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.7904 if cv<=1.8233052253723145\n",
      "   -2.3181 if pav>=0.0027710466645658313\n",
      "   -1.6801 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   +0.0026 if cv>=0.12479247599840164\n",
      "   +3.4969 if pav<=0.03712228685617447\n",
      "   +0.0000 if cp>=0.007020970340818167\n",
      "   -3.0329 if pa<=0.04466329440474512\n",
      "   +4.2877 if pav<=0.05537177994847298 & pav>=0.05537177994847298\n",
      "--------------\n",
      "   +1.0917 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -6.0263 if pav<=0.057992350310087246\n",
      "   -0.1502 if cv>=-0.016934332624077793\n",
      "   +0.0052 if pa>=0.06627633720636368\n",
      "   -0.1129 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "   -0.1261 if cp<=0.16845353841781624\n",
      "   -0.1261 if cv<=0.4235154509544375\n",
      "   -3.7206 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   -0.1261 if cv<=0.3260839581489563\n",
      "   -0.8030 if pav<=0.05521502792835236\n",
      "   -5.8228 if cp<=-0.12717827260494233 & cv>=-0.23145818412303926 & pav>=0.2674963116645813\n",
      "   +1.3351 if pav<=0.26598480343818665 & pav>=0.05537177994847298\n",
      "Run episode 359 with rewards 67.0\n",
      "============ 360 ===========\n",
      "61 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0]\n",
      "   -2.9640 if pav>=0.105914668738842\n",
      "   -0.7569 if cp>=-0.049787537753581995\n",
      "   -0.7569 if pa>=-0.012810707092285156\n",
      "   +5.1815 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.7569 if cv<=1.8233052253723145\n",
      "   -1.0068 if pav>=0.0027710466645658313\n",
      "   -1.5112 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   +3.6257 if cv>=0.12479247599840164\n",
      "   +0.3659 if pav<=0.03712228685617447\n",
      "   -0.6681 if pa<=0.04466329440474512\n",
      "   +0.0000 if pav<=0.05537177994847298 & pav>=0.05537177994847298\n",
      "   -2.6333 if cp>=0.02586027272045614 & pa<=0.10521500110626221\n",
      "--------------\n",
      "   +3.5767 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.0261 if pav<=0.057992350310087246\n",
      "   -3.3503 if cv>=-0.016934332624077793\n",
      "   +1.8766 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "   +0.9654 if cp<=0.16845353841781624\n",
      "   -2.3829 if cv<=0.4235154509544375\n",
      "   -3.7804 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   +0.1754 if cv<=0.3260839581489563\n",
      "   -1.0261 if pav<=0.05521502792835236\n",
      "   -0.0000 if cp<=-0.12717827260494233 & cv>=-0.23145818412303926 & pav>=0.2674963116645813\n",
      "   +3.5781 if pav<=0.26598480343818665 & pav>=0.05537177994847298\n",
      "   +2.9821 if cp>=0.02586027272045614 & pa<=0.10521500110626221\n",
      "Run episode 360 with rewards 61.0\n",
      "============ 361 ===========\n",
      "69 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0]\n",
      "   -4.3267 if pav>=0.105914668738842\n",
      "   -0.7642 if cp>=-0.049787537753581995\n",
      "   -0.7642 if pa>=-0.012810707092285156\n",
      "   +3.3050 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.7642 if cv<=1.8233052253723145\n",
      "   -0.8932 if pav>=0.0027710466645658313\n",
      "   -0.7652 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   +4.3837 if cv>=0.12479247599840164\n",
      "   +0.2785 if pav<=0.03712228685617447\n",
      "   +0.4915 if pa<=0.04466329440474512\n",
      "   -1.2353 if cp>=0.02586027272045614 & pa<=0.10521500110626221\n",
      "   -3.9104 if cp<=0.12354667484760284 & cv<=0.20852182805538177 & pa>=0.0888475999236107 & pav>=0.3512481451034546\n",
      "--------------\n",
      "   +4.2957 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.1001 if pav<=0.057992350310087246\n",
      "   -1.4820 if cv>=-0.016934332624077793\n",
      "   -0.3374 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "   -0.7724 if cp<=0.16845353841781624\n",
      "   -2.8167 if cv<=0.4235154509544375\n",
      "   -3.7446 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   +2.8706 if cv<=0.3260839581489563\n",
      "   -1.1001 if pav<=0.05521502792835236\n",
      "   +1.7152 if pav<=0.26598480343818665 & pav>=0.05537177994847298\n",
      "   +0.2851 if cp>=0.02586027272045614 & pa<=0.10521500110626221\n",
      "   +7.7019 if cp>=0.25718066096305847\n",
      "Run episode 361 with rewards 69.0\n",
      "============ 362 ===========\n",
      "53 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1]\n",
      "   -4.1499 if pav>=0.105914668738842\n",
      "   +1.2053 if cp>=-0.049787537753581995\n",
      "   +0.0886 if pa>=-0.012810707092285156\n",
      "   +1.9704 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.4033 if cv<=1.8233052253723145\n",
      "   -0.8240 if pav>=0.0027710466645658313\n",
      "   -0.5273 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   +1.1245 if cv>=0.12479247599840164\n",
      "   -1.1957 if pa<=0.04466329440474512\n",
      "   +0.0000 if cp>=0.02586027272045614 & pa<=0.10521500110626221\n",
      "   -1.9504 if cp<=0.12354667484760284 & cv<=0.20852182805538177 & pa>=0.0888475999236107 & pav>=0.3512481451034546\n",
      "   -7.8558 if cp>=0.1524742841720581\n",
      "--------------\n",
      "   +3.2179 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.0534 if pav<=0.057992350310087246\n",
      "   -1.3305 if cv>=-0.016934332624077793\n",
      "   -0.4900 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "   -0.4379 if cp<=0.16845353841781624\n",
      "   -2.4703 if cv<=0.4235154509544375\n",
      "   -4.0744 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   +4.0138 if cv<=0.3260839581489563\n",
      "   -1.0530 if pav<=0.05521502792835236\n",
      "   +1.3188 if pav<=0.26598480343818665 & pav>=0.05537177994847298\n",
      "   +0.0000 if cp>=0.25718066096305847\n",
      "   +7.8631 if cp>=0.1524742841720581\n",
      "Run episode 362 with rewards 53.0\n",
      "============ 363 ===========\n",
      "61 actions [0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1]\n",
      "   -4.0463 if pav>=0.105914668738842\n",
      "   -0.0660 if cp>=-0.049787537753581995\n",
      "   -0.0658 if pa>=-0.012810707092285156\n",
      "   +0.9885 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.0659 if cv<=1.8233052253723145\n",
      "   -0.4489 if pav>=0.0027710466645658313\n",
      "   -0.1125 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   +1.7608 if cv>=0.12479247599840164\n",
      "   +6.9711 if pa<=0.04466329440474512\n",
      "   -2.0463 if cp<=0.12354667484760284 & cv<=0.20852182805538177 & pa>=0.0888475999236107 & pav>=0.3512481451034546\n",
      "   +0.0014 if cp>=0.1524742841720581\n",
      "   -6.3589 if pa<=0.03756512999534607\n",
      "--------------\n",
      "   +1.9986 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.4951 if pav<=0.057992350310087246\n",
      "   +3.3887 if cv>=-0.016934332624077793\n",
      "   -0.7854 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "   -6.0610 if cp<=0.16845353841781624\n",
      "   -0.2747 if cv<=0.4235154509544375\n",
      "   -4.4627 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   +4.6981 if cv<=0.3260839581489563\n",
      "   -1.4951 if pav<=0.05521502792835236\n",
      "   +0.8308 if pav<=0.26598480343818665 & pav>=0.05537177994847298\n",
      "   -0.0020 if cp>=0.1524742841720581\n",
      "   +3.4278 if cv<=0.0031123566441237935 & pa<=0.03756512999534607 & pav<=0.3553890585899353\n",
      "Run episode 363 with rewards 61.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 364 ===========\n",
      "51 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1]\n",
      "   -3.3729 if pav>=0.105914668738842\n",
      "   -0.4005 if cp>=-0.049787537753581995\n",
      "   -6.1492 if pa>=-0.012810707092285156\n",
      "   +2.4937 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +2.6067 if cv<=1.8233052253723145\n",
      "   -0.6587 if pav>=0.0027710466645658313\n",
      "   +1.8830 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   +3.1782 if cv>=0.12479247599840164\n",
      "   +4.4563 if pa<=0.04466329440474512\n",
      "   -2.2838 if cp<=0.12354667484760284 & cv<=0.20852182805538177 & pa>=0.0888475999236107 & pav>=0.3512481451034546\n",
      "   -4.5817 if pa<=0.03756512999534607\n",
      "   -3.9998 if cp>=-0.007110046688467264 & cv<=-0.24353250861167908 & pav<=0.32135266065597534\n",
      "--------------\n",
      "   +2.5287 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -2.9263 if pav<=0.057992350310087246\n",
      "   +4.9722 if cv>=-0.016934332624077793\n",
      "   -0.6643 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "   -2.1453 if cp<=0.16845353841781624\n",
      "   +0.1035 if cv<=0.4235154509544375\n",
      "   -1.3250 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   +0.1036 if cv<=0.3260839581489563\n",
      "   -2.9264 if pav<=0.05521502792835236\n",
      "   -5.1611 if pav<=0.26598480343818665 & pav>=0.05537177994847298\n",
      "   +3.2802 if cv<=0.0031123566441237935 & pa<=0.03756512999534607 & pav<=0.3553890585899353\n",
      "   +4.7720 if cp<=-0.007110046688467264 & cv<=-0.055950652807950974 & pav<=0.2393984496593476\n",
      "Run episode 364 with rewards 51.0\n",
      "============ 365 ===========\n",
      "69 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -1.4792 if pav>=0.105914668738842\n",
      "   -0.4490 if pa>=-0.012810707092285156\n",
      "   +0.9270 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.4490 if cv<=1.8233052253723145\n",
      "   -0.9548 if pav>=0.0027710466645658313\n",
      "   -0.4677 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   +5.9044 if cv>=0.12479247599840164\n",
      "   +0.4202 if pa<=0.04466329440474512\n",
      "   -0.0258 if cp<=0.12354667484760284 & cv<=0.20852182805538177 & pa>=0.0888475999236107 & pav>=0.3512481451034546\n",
      "   +0.4530 if pa<=0.03756512999534607\n",
      "   +0.0000 if cp>=-0.007110046688467264 & cv<=-0.24353250861167908 & pav<=0.32135266065597534\n",
      "   -4.7888 if pav>=0.10900827497243881\n",
      "--------------\n",
      "   +2.5813 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.5127 if pav<=0.057992350310087246\n",
      "   -2.0260 if cv>=-0.016934332624077793\n",
      "   -0.0047 if cp<=0.708822238445282 & pa>=0.12988671362400056 & pav<=0.11138861924409868 & pav>=0.0027710466645658313\n",
      "   -3.2711 if cp<=0.16845353841781624\n",
      "   +0.5221 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   +0.7552 if cv<=0.3260839581489563\n",
      "   -1.5020 if pav<=0.05521502792835236\n",
      "   -3.4937 if pav<=0.26598480343818665 & pav>=0.05537177994847298\n",
      "   -0.6306 if cv<=0.0031123566441237935 & pa<=0.03756512999534607 & pav<=0.3553890585899353\n",
      "   +0.1669 if cp<=-0.007110046688467264 & cv<=-0.055950652807950974 & pav<=0.2393984496593476\n",
      "   +4.4705 if pav>=0.10900827497243881\n",
      "Run episode 365 with rewards 69.0\n",
      "============ 366 ===========\n",
      "68 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -2.1997 if pav>=0.105914668738842\n",
      "   -0.3624 if pa>=-0.012810707092285156\n",
      "   +1.4625 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.2966 if cv<=1.8233052253723145\n",
      "   -0.9015 if pav>=0.0027710466645658313\n",
      "   -0.6294 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   +0.0081 if cv>=0.12479247599840164\n",
      "   +0.5923 if pa<=0.04466329440474512\n",
      "   -0.0048 if cp<=0.12354667484760284 & cv<=0.20852182805538177 & pa>=0.0888475999236107 & pav>=0.3512481451034546\n",
      "   +0.5121 if pa<=0.03756512999534607\n",
      "   -2.1997 if pav>=0.10900827497243881\n",
      "   +3.7211 if cp>=0.11819447576999667 & cv>=0.4006619215011597 & pav<=0.24460948705673222\n",
      "--------------\n",
      "   +4.2600 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.5013 if pav<=0.057992350310087246\n",
      "   +0.9667 if cv>=-0.016934332624077793\n",
      "   -2.4290 if cp<=0.16845353841781624\n",
      "   -2.9213 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   +1.7689 if cv<=0.3260839581489563\n",
      "   -0.5013 if pav<=0.05521502792835236\n",
      "   +0.7300 if pav<=0.26598480343818665 & pav>=0.05537177994847298\n",
      "   +0.0058 if cv<=0.0031123566441237935 & pa<=0.03756512999534607 & pav<=0.3553890585899353\n",
      "   +0.0000 if cp<=-0.007110046688467264 & cv<=-0.055950652807950974 & pav<=0.2393984496593476\n",
      "   +3.5126 if pav>=0.10900827497243881\n",
      "   -4.3977 if pav<=0.24460948705673222\n",
      "Run episode 366 with rewards 68.0\n",
      "============ 367 ===========\n",
      "64 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   -3.8449 if pav>=0.105914668738842\n",
      "   -0.6232 if pa>=-0.012810707092285156\n",
      "   +0.8122 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.6232 if cv<=1.8233052253723145\n",
      "   -1.0157 if pav>=0.0027710466645658313\n",
      "   -0.7705 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   +1.6979 if cv>=0.12479247599840164\n",
      "   +0.1298 if pa<=0.04466329440474512\n",
      "   +0.0891 if pa<=0.03756512999534607\n",
      "   -1.1698 if pav>=0.10900827497243881\n",
      "   +0.4283 if cp>=0.11819447576999667 & cv>=0.4006619215011597 & pav<=0.24460948705673222\n",
      "   +1.2662 if pav<=0.08516121953725816\n",
      "--------------\n",
      "   +3.9102 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.1111 if pav<=0.057992350310087246\n",
      "   -1.3265 if cv>=-0.016934332624077793\n",
      "   -3.0251 if cp<=0.16845353841781624\n",
      "   -0.9409 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   +0.3236 if cv<=0.3260839581489563\n",
      "   -1.1111 if pav<=0.05521502792835236\n",
      "   +0.2169 if pav<=0.26598480343818665 & pav>=0.05537177994847298\n",
      "   -0.0059 if cv<=0.0031123566441237935 & pa<=0.03756512999534607 & pav<=0.3553890585899353\n",
      "   +3.8281 if pav>=0.10900827497243881\n",
      "   -0.9174 if pav<=0.24460948705673222\n",
      "   -0.3915 if \n",
      "Run episode 367 with rewards 64.0\n",
      "============ 368 ===========\n",
      "86 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0]\n",
      "   -3.1522 if pav>=0.105914668738842\n",
      "   +0.3326 if pa>=-0.012810707092285156\n",
      "   +0.7432 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +0.3326 if cv<=1.8233052253723145\n",
      "   -0.8780 if pav>=0.0027710466645658313\n",
      "   -0.1599 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   +0.0750 if cv>=0.12479247599840164\n",
      "   +0.2005 if pa<=0.04466329440474512\n",
      "   -3.1522 if pav>=0.10900827497243881\n",
      "   +0.0107 if cp>=0.11819447576999667 & cv>=0.4006619215011597 & pav<=0.24460948705673222\n",
      "   +0.0106 if pav<=0.08516121953725816\n",
      "   -4.7470 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "--------------\n",
      "   +1.8785 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.4001 if pav<=0.057992350310087246\n",
      "   -0.7315 if cv>=-0.016934332624077793\n",
      "   -1.0781 if cp<=0.16845353841781624\n",
      "   -0.9327 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   -1.4571 if cv<=0.3260839581489563\n",
      "   -0.8657 if pav<=0.05521502792835236\n",
      "   -0.2497 if pav<=0.26598480343818665 & pav>=0.05537177994847298\n",
      "   +3.5867 if pav>=0.10900827497243881\n",
      "   -1.1155 if pav<=0.24460948705673222\n",
      "   -0.6760 if \n",
      "   +5.5654 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "Run episode 368 with rewards 86.0\n",
      "============ 369 ===========\n",
      "66 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   -1.1051 if pav>=0.105914668738842\n",
      "   -6.3737 if pa>=-0.012810707092285156\n",
      "   +1.0284 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +8.4319 if cv<=1.8233052253723145\n",
      "   -4.0545 if pav>=0.0027710466645658313\n",
      "   +3.9214 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   -1.7881 if cv>=0.12479247599840164\n",
      "   -0.3854 if pa<=0.04466329440474512\n",
      "   -6.1491 if pav>=0.10900827497243881\n",
      "   -0.9827 if cp>=0.11819447576999667 & cv>=0.4006619215011597 & pav<=0.24460948705673222\n",
      "   -7.2961 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -5.6154 if cp>=1.1471941471099854\n",
      "--------------\n",
      "   +0.1950 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +1.5304 if pav<=0.057992350310087246\n",
      "   -1.3738 if cv>=-0.016934332624077793\n",
      "   -0.1091 if cp<=0.16845353841781624\n",
      "   -1.6123 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   -1.3554 if cv<=0.3260839581489563\n",
      "   +1.8700 if pav<=0.05521502792835236\n",
      "   +5.2457 if pav>=0.10900827497243881\n",
      "   -1.8987 if pav<=0.24460948705673222\n",
      "   -0.8350 if \n",
      "   +4.8611 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -3.8095 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "Run episode 369 with rewards 66.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 370 ===========\n",
      "72 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -1.3876 if pav>=0.105914668738842\n",
      "   -0.4657 if pa>=-0.012810707092285156\n",
      "   +1.0995 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.4657 if cv<=1.8233052253723145\n",
      "   +0.3233 if pav>=0.0027710466645658313\n",
      "   -0.2527 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   +1.2018 if cv>=0.12479247599840164\n",
      "   -4.9716 if pav>=0.10900827497243881\n",
      "   +1.0159 if cp>=0.11819447576999667 & cv>=0.4006619215011597 & pav<=0.24460948705673222\n",
      "   -3.6959 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -0.0000 if cp>=1.1471941471099854\n",
      "   -0.7484 if cp<=-0.0013292874209582806 & cv>=0.0400342233479023 & pa<=0.10849975049495697 & pav>=0.07690320163965225\n",
      "--------------\n",
      "   +0.7906 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   +0.0925 if pav<=0.057992350310087246\n",
      "   -1.5160 if cv>=-0.016934332624077793\n",
      "   -0.2795 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   -0.1917 if cv<=0.3260839581489563\n",
      "   +0.0925 if pav<=0.05521502792835236\n",
      "   +4.0416 if pav>=0.10900827497243881\n",
      "   -2.1705 if pav<=0.24460948705673222\n",
      "   -1.3770 if \n",
      "   +4.4233 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +0.2632 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +0.8991 if cv<=0.0400342233479023 & pav<=0.1957546621561051\n",
      "Run episode 370 with rewards 72.0\n",
      "============ 371 ===========\n",
      "80 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -3.3214 if pav>=0.105914668738842\n",
      "   +0.0661 if pa>=-0.012810707092285156\n",
      "   +1.6574 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +0.0661 if cv<=1.8233052253723145\n",
      "   -0.4585 if pav>=0.0027710466645658313\n",
      "   -0.0632 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   -0.1336 if cv>=0.12479247599840164\n",
      "   -3.3214 if pav>=0.10900827497243881\n",
      "   -0.4980 if cp>=0.11819447576999667 & cv>=0.4006619215011597 & pav<=0.24460948705673222\n",
      "   -4.3016 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +0.0000 if cp<=-0.0013292874209582806 & cv>=0.0400342233479023 & pa<=0.10849975049495697 & pav>=0.07690320163965225\n",
      "   +0.9588 if pav<=0.19076273441314703\n",
      "--------------\n",
      "   +1.6617 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.7385 if cv>=-0.016934332624077793\n",
      "   -1.7647 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   -0.3677 if cv<=0.3260839581489563\n",
      "   -0.9040 if pav<=0.05521502792835236\n",
      "   +3.0599 if pav>=0.10900827497243881\n",
      "   -1.0728 if pav<=0.24460948705673222\n",
      "   -0.5881 if \n",
      "   +5.0798 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -0.8975 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -0.7210 if cv<=0.0400342233479023 & pav<=0.1957546621561051\n",
      "   +0.2439 if cp<=0.20320429205894483 & cv<=0.7048550724983216 & pa>=0.12489480674266816 & pav<=0.0674781307578087\n",
      "Run episode 371 with rewards 80.0\n",
      "============ 372 ===========\n",
      "122 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -3.1465 if pav>=0.105914668738842\n",
      "   -0.3297 if pa>=-0.012810707092285156\n",
      "   +1.1707 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.3297 if cv<=1.8233052253723145\n",
      "   -0.3032 if pav>=0.0027710466645658313\n",
      "   +1.4441 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   +0.3298 if cv>=0.12479247599840164\n",
      "   -3.1465 if pav>=0.10900827497243881\n",
      "   +0.1918 if cp>=0.11819447576999667 & cv>=0.4006619215011597 & pav<=0.24460948705673222\n",
      "   -2.8793 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +0.7259 if pav<=0.19076273441314703\n",
      "   -1.2686 if pav>=0.06502775698900223\n",
      "--------------\n",
      "   +1.4871 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.0647 if cv>=-0.016934332624077793\n",
      "   -0.2816 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   -0.2353 if cv<=0.3260839581489563\n",
      "   -1.1439 if pav<=0.05521502792835236\n",
      "   +2.6089 if pav>=0.10900827497243881\n",
      "   -1.3024 if pav<=0.24460948705673222\n",
      "   -0.9634 if \n",
      "   +3.8962 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -0.4116 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -0.2903 if cv<=0.0400342233479023 & pav<=0.1957546621561051\n",
      "   +0.0000 if cv<=0.4604156851768503 & pa>=0.12231172174215317\n",
      "Run episode 372 with rewards 122.0\n",
      "============ 373 ===========\n",
      "134 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -6.0797 if pav>=0.105914668738842\n",
      "   +0.0016 if pa>=-0.012810707092285156\n",
      "   +2.3357 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +0.1541 if cv<=1.8233052253723145\n",
      "   +0.0052 if pav>=0.0027710466645658313\n",
      "   +0.4693 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   -0.6659 if cv>=0.12479247599840164\n",
      "   -1.3332 if pav>=0.10900827497243881\n",
      "   -5.8470 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +0.8786 if pav<=0.19076273441314703\n",
      "   -0.8345 if pav>=0.06502775698900223\n",
      "   +0.9984 if cp<=-0.08552553206682202 & pa<=0.13353570103645324 & pa>=0.11306430697441101 & pav<=0.20473399758338928 & pav>=0.04095418825745583\n",
      "--------------\n",
      "   +2.0468 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.5028 if cv>=-0.016934332624077793\n",
      "   -1.9603 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   -1.1925 if cv<=0.3260839581489563\n",
      "   -1.8972 if pav<=0.05521502792835236\n",
      "   +2.7657 if pav>=0.10900827497243881\n",
      "   -0.6084 if pav<=0.24460948705673222\n",
      "   +0.0726 if \n",
      "   +6.4021 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -1.0908 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -0.6967 if cv<=0.0400342233479023 & pav<=0.1957546621561051\n",
      "   -1.9135 if cp>=0.2969962120056155 & pa<=0.13353570103645324 & pav<=0.20473399758338928 & pav>=0.04095418825745583\n",
      "Run episode 373 with rewards 134.0\n",
      "============ 374 ===========\n",
      "74 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -3.6253 if pav>=0.105914668738842\n",
      "   +1.8199 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +0.4611 if cv<=1.8233052253723145\n",
      "   +0.1527 if pav>=0.0027710466645658313\n",
      "   +0.3954 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   +0.6820 if cv>=0.12479247599840164\n",
      "   -3.2610 if pav>=0.10900827497243881\n",
      "   -4.7451 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +0.9770 if pav<=0.19076273441314703\n",
      "   -1.5903 if pav>=0.06502775698900223\n",
      "   -0.5083 if cp<=-0.08552553206682202 & pa<=0.13353570103645324 & pa>=0.11306430697441101 & pav<=0.20473399758338928 & pav>=0.04095418825745583\n",
      "   +1.2972 if pa>=0.11800199002027512 & pav<=0.15993459522724154 & pav>=0.054659725725650796\n",
      "--------------\n",
      "   +1.7078 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.4588 if cv>=-0.016934332624077793\n",
      "   -0.3747 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   -0.2407 if cv<=0.3260839581489563\n",
      "   -1.5504 if pav<=0.05521502792835236\n",
      "   +2.7912 if pav>=0.10900827497243881\n",
      "   -2.0596 if pav<=0.24460948705673222\n",
      "   +5.0401 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -0.4387 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -0.6736 if cv<=0.0400342233479023 & pav<=0.1957546621561051\n",
      "   -0.1008 if cp>=0.2969962120056155 & pa<=0.13353570103645324 & pav<=0.20473399758338928 & pav>=0.04095418825745583\n",
      "   -0.3730 if pav>=0.054659725725650796\n",
      "Run episode 374 with rewards 74.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 375 ===========\n",
      "116 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -3.3283 if pav>=0.105914668738842\n",
      "   +1.9096 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.3557 if cv<=1.8233052253723145\n",
      "   +0.1584 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   -0.0654 if cv>=0.12479247599840164\n",
      "   -3.3283 if pav>=0.10900827497243881\n",
      "   -3.9211 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +0.4498 if pav<=0.19076273441314703\n",
      "   -0.1605 if pav>=0.06502775698900223\n",
      "   +0.0000 if cp<=-0.08552553206682202 & pa<=0.13353570103645324 & pa>=0.11306430697441101 & pav<=0.20473399758338928 & pav>=0.04095418825745583\n",
      "   +0.5000 if pa>=0.11800199002027512 & pav<=0.15993459522724154 & pav>=0.054659725725650796\n",
      "   -0.3731 if pa>=0.1251595512032509 & pav<=0.19145653843879704\n",
      "--------------\n",
      "   +0.6700 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -0.7544 if cv>=-0.016934332624077793\n",
      "   -0.4320 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   -0.9337 if cv<=0.3260839581489563\n",
      "   -0.4594 if pav<=0.05521502792835236\n",
      "   +2.6664 if pav>=0.10900827497243881\n",
      "   -1.0311 if pav<=0.24460948705673222\n",
      "   +4.1427 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -0.5286 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +0.3006 if cv<=0.0400342233479023 & pav<=0.1957546621561051\n",
      "   -0.1808 if pav>=0.054659725725650796\n",
      "   -0.0612 if cp<=0.10756503641605386 & cv>=0.5931915283203125\n",
      "Run episode 375 with rewards 116.0\n",
      "============ 376 ===========\n",
      "112 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1]\n",
      "   -4.2018 if pav>=0.105914668738842\n",
      "   +1.4688 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +2.6329 if cv<=1.8233052253723145\n",
      "   -0.0602 if cp<=0.5970404863357547 & pav>=-0.09791276156902312\n",
      "   -0.0891 if cv>=0.12479247599840164\n",
      "   -4.2018 if pav>=0.10900827497243881\n",
      "   -4.4822 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +0.7007 if pav<=0.19076273441314703\n",
      "   -0.7966 if pav>=0.06502775698900223\n",
      "   +2.7927 if pa>=0.11800199002027512 & pav<=0.15993459522724154 & pav>=0.054659725725650796\n",
      "   -1.9115 if pa>=0.1251595512032509 & pav<=0.19145653843879704\n",
      "   -6.7098 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "--------------\n",
      "   +1.6814 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.2068 if cv>=-0.016934332624077793\n",
      "   -0.5601 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   -0.2139 if cv<=0.3260839581489563\n",
      "   +0.1628 if pav<=0.05521502792835236\n",
      "   +3.4751 if pav>=0.10900827497243881\n",
      "   -1.6863 if pav<=0.24460948705673222\n",
      "   +5.4032 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -2.5532 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -0.2207 if cv<=0.0400342233479023 & pav<=0.1957546621561051\n",
      "   -1.2711 if pav>=0.054659725725650796\n",
      "   +5.6893 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "Run episode 376 with rewards 112.0\n",
      "============ 377 ===========\n",
      "109 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1]\n",
      "   -2.2721 if pav>=0.105914668738842\n",
      "   +0.6971 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -1.5700 if cv<=1.8233052253723145\n",
      "   +0.8615 if cv>=0.12479247599840164\n",
      "   -5.0307 if pav>=0.10900827497243881\n",
      "   -3.7689 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +1.7466 if pav<=0.19076273441314703\n",
      "   -2.2344 if pav>=0.06502775698900223\n",
      "   +0.6176 if pa>=0.11800199002027512 & pav<=0.15993459522724154 & pav>=0.054659725725650796\n",
      "   -3.7985 if pa>=0.1251595512032509 & pav<=0.19145653843879704\n",
      "   -2.2969 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +2.8497 if pav>=-0.08378964513540267\n",
      "--------------\n",
      "   +1.8247 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.4243 if cv>=-0.016934332624077793\n",
      "   -2.6183 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   +0.9669 if cv<=0.3260839581489563\n",
      "   +3.4161 if pav>=0.10900827497243881\n",
      "   -1.7629 if pav<=0.24460948705673222\n",
      "   +4.4614 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -4.8226 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +0.2627 if cv<=0.0400342233479023 & pav<=0.1957546621561051\n",
      "   +0.2975 if pav>=0.054659725725650796\n",
      "   +3.8209 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +4.6403 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "Run episode 377 with rewards 109.0\n",
      "============ 378 ===========\n",
      "111 actions [0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0]\n",
      "   -3.7308 if pav>=0.105914668738842\n",
      "   +1.9306 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -2.2338 if cv<=1.8233052253723145\n",
      "   +0.3402 if cv>=0.12479247599840164\n",
      "   -3.7308 if pav>=0.10900827497243881\n",
      "   -4.5244 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +0.9684 if pav<=0.19076273441314703\n",
      "   -0.0155 if pav>=0.06502775698900223\n",
      "   +0.2671 if pa>=0.1251595512032509 & pav<=0.19145653843879704\n",
      "   -4.8266 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +2.4959 if pav>=-0.08378964513540267\n",
      "   +5.9499 if cp>=0.3205459237098694 & pa<=0.10980533361434937 & pav<=-0.09898474514484405 & pav<=0.15547152757644667\n",
      "--------------\n",
      "   +1.1441 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.4526 if cv>=-0.016934332624077793\n",
      "   -1.1780 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   +0.6510 if cv<=0.3260839581489563\n",
      "   +4.6617 if pav>=0.10900827497243881\n",
      "   -1.7806 if pav<=0.24460948705673222\n",
      "   +4.8250 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -8.0321 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -1.7844 if pav>=0.054659725725650796\n",
      "   +5.8289 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +6.4291 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   -5.7625 if cv>=1.4777229070663453 & pa<=0.10980533361434937 & pav<=-0.09898474514484405\n",
      "Run episode 378 with rewards 111.0\n",
      "============ 379 ===========\n",
      "113 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   -2.4398 if pav>=0.105914668738842\n",
      "   +6.1332 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -1.8481 if cv<=1.8233052253723145\n",
      "   +0.7906 if cv>=0.12479247599840164\n",
      "   -4.6287 if pav>=0.10900827497243881\n",
      "   -4.3672 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +1.1917 if pav<=0.19076273441314703\n",
      "   -0.8019 if pa>=0.1251595512032509 & pav<=0.19145653843879704\n",
      "   -3.9950 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +0.6746 if pav>=-0.08378964513540267\n",
      "   +2.0145 if cp>=0.3205459237098694 & pa<=0.10980533361434937 & pav<=-0.09898474514484405 & pav<=0.15547152757644667\n",
      "   +0.5725 if cv<=1.3502146005630513 & cv>=0.7791854739189148 & pav<=-0.08436589688062668\n",
      "--------------\n",
      "   +1.0638 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.0931 if cv>=-0.016934332624077793\n",
      "   -0.7547 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   +4.4762 if pav>=0.10900827497243881\n",
      "   -1.5650 if pav<=0.24460948705673222\n",
      "   +4.9330 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -8.2031 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -1.2538 if pav>=0.054659725725650796\n",
      "   +4.9118 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +5.7587 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   -0.4466 if cv>=1.4777229070663453 & pa<=0.10980533361434937 & pav<=-0.09898474514484405\n",
      "   -3.9211 if cv>=1.3502146005630513 & pa<=0.11173352599143982 & pav<=0.040461666882038116\n",
      "Run episode 379 with rewards 113.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 380 ===========\n",
      "121 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0]\n",
      "   -1.9293 if pav>=0.105914668738842\n",
      "   +2.3601 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.1936 if cv<=1.8233052253723145\n",
      "   +0.2651 if cv>=0.12479247599840164\n",
      "   -4.7229 if pav>=0.10900827497243881\n",
      "   -4.4994 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +0.6464 if pav<=0.19076273441314703\n",
      "   -0.4139 if pa>=0.1251595512032509 & pav<=0.19145653843879704\n",
      "   -5.4092 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +0.5781 if pav>=-0.08378964513540267\n",
      "   +2.5483 if cp>=0.3205459237098694 & pa<=0.10980533361434937 & pav<=-0.09898474514484405 & pav<=0.15547152757644667\n",
      "   +5.3884 if cp<=0.745016467571259 & cv>=1.4511004209518432 & pa<=0.12289265841245656 & pa>=0.11167643517255783\n",
      "--------------\n",
      "   +1.2661 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.1423 if cv>=-0.016934332624077793\n",
      "   -0.1673 if cv<=0.5127084851264954 & pa<=0.13488030433654788\n",
      "   +3.7943 if pav>=0.10900827497243881\n",
      "   -1.6038 if pav<=0.24460948705673222\n",
      "   +4.2444 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -8.4459 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -1.7119 if pav>=0.054659725725650796\n",
      "   +5.1720 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +6.5122 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   -6.0377 if cv>=1.3502146005630513 & pa<=0.11173352599143982 & pav<=0.040461666882038116\n",
      "   -6.4483 if cp<=0.745016467571259 & cv>=1.4511004209518432 & pa<=0.12289265841245656 & pa>=0.11167643517255783\n",
      "Run episode 380 with rewards 121.0\n",
      "============ 381 ===========\n",
      "164 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0]\n",
      "   -2.2210 if pav>=0.105914668738842\n",
      "   +3.3338 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.2854 if cv>=0.12479247599840164\n",
      "   -4.5977 if pav>=0.10900827497243881\n",
      "   -5.3059 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +1.1597 if pav<=0.19076273441314703\n",
      "   +0.0270 if pa>=0.1251595512032509 & pav<=0.19145653843879704\n",
      "   -5.1117 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   -0.3756 if pav>=-0.08378964513540267\n",
      "   +1.2322 if cp>=0.3205459237098694 & pa<=0.10980533361434937 & pav<=-0.09898474514484405 & pav<=0.15547152757644667\n",
      "   +1.5801 if cp<=0.745016467571259 & cv>=1.4511004209518432 & pa<=0.12289265841245656 & pa>=0.11167643517255783\n",
      "   -1.1840 if pav<=-0.08588805049657822 & pav>=-0.08588805049657822\n",
      "--------------\n",
      "   +0.2562 if cv<=0.379887717962265 & pav>=0.10571803748607639\n",
      "   -1.2956 if cv>=-0.016934332624077793\n",
      "   +4.5141 if pav>=0.10900827497243881\n",
      "   -1.8358 if pav<=0.24460948705673222\n",
      "   +4.6101 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -7.4037 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -0.8324 if pav>=0.054659725725650796\n",
      "   +4.1590 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +6.8934 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   -4.7865 if cv>=1.3502146005630513 & pa<=0.11173352599143982 & pav<=0.040461666882038116\n",
      "   -2.0766 if cp<=0.745016467571259 & cv>=1.4511004209518432 & pa<=0.12289265841245656 & pa>=0.11167643517255783\n",
      "   -1.1152 if cp>=-0.022614924237132072 & cv<=1.4442379474639893 & pa>=0.11248297244310379 & pav<=-0.08588805049657822\n",
      "Run episode 381 with rewards 164.0\n",
      "============ 382 ===========\n",
      "119 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0]\n",
      "   -1.7153 if pav>=0.105914668738842\n",
      "   +2.9479 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -2.1412 if cv>=0.12479247599840164\n",
      "   -5.7881 if pav>=0.10900827497243881\n",
      "   -5.3407 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +3.1614 if pav<=0.19076273441314703\n",
      "   -5.1307 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +0.1614 if pav>=-0.08378964513540267\n",
      "   -2.0506 if cp>=0.3205459237098694 & pa<=0.10980533361434937 & pav<=-0.09898474514484405 & pav<=0.15547152757644667\n",
      "   +0.0000 if cp<=0.745016467571259 & cv>=1.4511004209518432 & pa<=0.12289265841245656 & pa>=0.11167643517255783\n",
      "   +0.0000 if pav<=-0.08588805049657822 & pav>=-0.08588805049657822\n",
      "   +5.5172 if cp<=1.0446686029434207 & pa>=0.13487319946289061 & pav<=0.15826416909694677 & pav>=0.029663847386837014\n",
      "--------------\n",
      "   +0.2131 if cv>=-0.016934332624077793\n",
      "   +6.0186 if pav>=0.10900827497243881\n",
      "   -2.2393 if pav<=0.24460948705673222\n",
      "   +5.0480 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -7.0299 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +1.3374 if pav>=0.054659725725650796\n",
      "   +4.1994 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +4.4138 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   -0.6314 if cv>=1.3502146005630513 & pa<=0.11173352599143982 & pav<=0.040461666882038116\n",
      "   -0.0001 if cp<=0.745016467571259 & cv>=1.4511004209518432 & pa<=0.12289265841245656 & pa>=0.11167643517255783\n",
      "   +0.2749 if cp>=-0.022614924237132072 & cv<=1.4442379474639893 & pa>=0.11248297244310379 & pav<=-0.08588805049657822\n",
      "   -4.7154 if pav>=0.029663847386837014\n",
      "Run episode 382 with rewards 119.0\n",
      "============ 383 ===========\n",
      "89 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   -3.0128 if pav>=0.105914668738842\n",
      "   +1.7249 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.4994 if cv>=0.12479247599840164\n",
      "   -3.0128 if pav>=0.10900827497243881\n",
      "   -4.1971 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +0.5448 if pav<=0.19076273441314703\n",
      "   -4.4656 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   -0.4739 if pav>=-0.08378964513540267\n",
      "   -0.8439 if cp>=0.3205459237098694 & pa<=0.10980533361434937 & pav<=-0.09898474514484405 & pav<=0.15547152757644667\n",
      "   -1.2546 if cp<=0.745016467571259 & cv>=1.4511004209518432 & pa<=0.12289265841245656 & pa>=0.11167643517255783\n",
      "   +0.4750 if cp<=1.0446686029434207 & pa>=0.13487319946289061 & pav<=0.15826416909694677 & pav>=0.029663847386837014\n",
      "   +0.6965 if pa<=0.08706619292497636 & pav>=-0.4346310496330261\n",
      "--------------\n",
      "   -0.8066 if cv>=-0.016934332624077793\n",
      "   +3.5669 if pav>=0.10900827497243881\n",
      "   -0.9155 if pav<=0.24460948705673222\n",
      "   +3.6694 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -7.8763 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -0.5415 if pav>=0.054659725725650796\n",
      "   +3.7845 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +6.0954 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   -0.8510 if cv>=1.3502146005630513 & pa<=0.11173352599143982 & pav<=0.040461666882038116\n",
      "   +0.1538 if cp>=-0.022614924237132072 & cv<=1.4442379474639893 & pa>=0.11248297244310379 & pav<=-0.08588805049657822\n",
      "   -0.5896 if pav>=0.029663847386837014\n",
      "   -3.8093 if cp>=0.9493266582489016 & pa>=-0.012121891044080256 & pav<=-0.04674722999334333\n",
      "Run episode 383 with rewards 89.0\n",
      "============ 384 ===========\n",
      "123 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   -1.7034 if pav>=0.105914668738842\n",
      "   +0.5740 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -6.1180 if cv>=0.12479247599840164\n",
      "   -1.7034 if pav>=0.10900827497243881\n",
      "   -4.9434 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +3.8702 if pav<=0.19076273441314703\n",
      "   -4.3513 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   -0.5732 if cp>=0.3205459237098694 & pa<=0.10980533361434937 & pav<=-0.09898474514484405 & pav<=0.15547152757644667\n",
      "   -0.9906 if cp<=0.745016467571259 & cv>=1.4511004209518432 & pa<=0.12289265841245656 & pa>=0.11167643517255783\n",
      "   -0.1640 if cp<=1.0446686029434207 & pa>=0.13487319946289061 & pav<=0.15826416909694677 & pav>=0.029663847386837014\n",
      "   +0.1556 if pa<=0.08706619292497636 & pav>=-0.4346310496330261\n",
      "   +3.4777 if cv>=0.1838614135980606 & pav<=0.043705208599567516\n",
      "--------------\n",
      "   -2.2776 if cv>=-0.016934332624077793\n",
      "   -0.2093 if pav>=0.10900827497243881\n",
      "   -2.5932 if pav<=0.24460948705673222\n",
      "   +4.6983 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -7.5879 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +2.4112 if pav>=0.054659725725650796\n",
      "   +4.1601 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +7.4026 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   +0.6109 if cv>=1.3502146005630513 & pa<=0.11173352599143982 & pav<=0.040461666882038116\n",
      "   -2.4812 if pav>=0.029663847386837014\n",
      "   -5.0304 if cp>=0.9493266582489016 & pa>=-0.012121891044080256 & pav<=-0.04674722999334333\n",
      "   +4.2123 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "Run episode 384 with rewards 123.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 385 ===========\n",
      "133 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1]\n",
      "   -1.3088 if pav>=0.105914668738842\n",
      "   +1.8830 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -7.7924 if cv>=0.12479247599840164\n",
      "   -1.3088 if pav>=0.10900827497243881\n",
      "   -5.2747 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +5.9701 if pav<=0.19076273441314703\n",
      "   -5.4991 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +0.3122 if cp>=0.3205459237098694 & pa<=0.10980533361434937 & pav<=-0.09898474514484405 & pav<=0.15547152757644667\n",
      "   -2.1813 if cp<=0.745016467571259 & cv>=1.4511004209518432 & pa<=0.12289265841245656 & pa>=0.11167643517255783\n",
      "   +0.0116 if cp<=1.0446686029434207 & pa>=0.13487319946289061 & pav<=0.15826416909694677 & pav>=0.029663847386837014\n",
      "   +2.5687 if cv>=0.1838614135980606 & pav<=0.043705208599567516\n",
      "   -2.7278 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "--------------\n",
      "   -5.2757 if cv>=-0.016934332624077793\n",
      "   -2.8255 if pav<=0.24460948705673222\n",
      "   +6.2053 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -6.4354 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +0.2899 if pav>=0.054659725725650796\n",
      "   +6.4800 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +8.6234 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   +2.0833 if cv>=1.3502146005630513 & pa<=0.11173352599143982 & pav<=0.040461666882038116\n",
      "   +1.0603 if pav>=0.029663847386837014\n",
      "   -6.2012 if cp>=0.9493266582489016 & pa>=-0.012121891044080256 & pav<=-0.04674722999334333\n",
      "   +6.0523 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +4.6956 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "Run episode 385 with rewards 133.0\n",
      "============ 386 ===========\n",
      "116 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0]\n",
      "   +1.3902 if pav>=0.105914668738842\n",
      "   +5.1817 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "  -13.7768 if cv>=0.12479247599840164\n",
      "   +1.3902 if pav>=0.10900827497243881\n",
      "   -4.6054 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +8.0184 if pav<=0.19076273441314703\n",
      "   -4.1414 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +1.3769 if cp>=0.3205459237098694 & pa<=0.10980533361434937 & pav<=-0.09898474514484405 & pav<=0.15547152757644667\n",
      "   +0.0000 if cp<=0.745016467571259 & cv>=1.4511004209518432 & pa<=0.12289265841245656 & pa>=0.11167643517255783\n",
      "   +6.2775 if cv>=0.1838614135980606 & pav<=0.043705208599567516\n",
      "   -5.2166 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -2.6875 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "--------------\n",
      "   -3.8355 if cv>=-0.016934332624077793\n",
      "   -4.4986 if pav<=0.24460948705673222\n",
      "   +4.3917 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -5.0778 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +3.9293 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +8.9731 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   +1.0937 if cv>=1.3502146005630513 & pa<=0.11173352599143982 & pav<=0.040461666882038116\n",
      "   +1.9229 if pav>=0.029663847386837014\n",
      "   -5.6875 if cp>=0.9493266582489016 & pa>=-0.012121891044080256 & pav<=-0.04674722999334333\n",
      "   +4.5608 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +4.1964 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   +8.1009 if cp<=0.5347496747970586 & cv<=1.7820865869522107 & cv>=0.02982740998268128 & cv>=0.5832018971443177 & pa<=0.12812677323818208 & pa>=0.1197730839252472 & pav<=0.16816720962524423 & pav>=0.015858380310237417\n",
      "Run episode 386 with rewards 116.0\n",
      "============ 387 ===========\n",
      "121 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1]\n",
      "   -0.5416 if pav>=0.105914668738842\n",
      "   +5.6827 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -8.1164 if cv>=0.12479247599840164\n",
      "   -0.5416 if pav>=0.10900827497243881\n",
      "   -5.6390 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   +2.4122 if pav<=0.19076273441314703\n",
      "   -0.0000 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +0.1463 if cp>=0.3205459237098694 & pa<=0.10980533361434937 & pav<=-0.09898474514484405 & pav<=0.15547152757644667\n",
      "   +7.2399 if cv>=0.1838614135980606 & pav<=0.043705208599567516\n",
      "   +1.1767 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -3.6124 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   -1.6245 if cp<=-0.023718906566500664\n",
      "--------------\n",
      "   -1.2776 if cv>=-0.016934332624077793\n",
      "   -1.3979 if pav<=0.24460948705673222\n",
      "   +4.6305 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -4.2693 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +0.0000 if cp<=0.8853330612182617 & pa>=0.14282040297985077\n",
      "   +2.4841 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   -0.1226 if pav>=0.029663847386837014\n",
      "   -1.9539 if cp>=0.9493266582489016 & pa>=-0.012121891044080256 & pav<=-0.04674722999334333\n",
      "   +4.3463 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +3.1483 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   +0.0053 if cp<=0.5347496747970586 & cv<=1.7820865869522107 & cv>=0.02982740998268128 & cv>=0.5832018971443177 & pa<=0.12812677323818208 & pa>=0.1197730839252472 & pav<=0.16816720962524423 & pav>=0.015858380310237417\n",
      "   +5.0027 if cp>=0.20222710072994232 & cp>=0.6786766052246097 & cv<=1.833206295967102 & pa<=0.1263148933649063 & pa>=0.1074947640299797 & pav<=0.006816068198531866\n",
      "Run episode 387 with rewards 121.0\n",
      "============ 388 ===========\n",
      "45 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0]\n",
      "   -2.9833 if pav>=0.105914668738842\n",
      "   +0.8424 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -3.0115 if cv>=0.12479247599840164\n",
      "   -2.9833 if pav>=0.10900827497243881\n",
      "   +0.0002 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -3.6812 if pav<=0.19076273441314703\n",
      "   +0.0000 if cp>=0.3205459237098694 & pa<=0.10980533361434937 & pav<=-0.09898474514484405 & pav<=0.15547152757644667\n",
      "   +8.8360 if cv>=0.1838614135980606 & pav<=0.043705208599567516\n",
      "   +2.2892 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -0.5077 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   +2.3327 if cp<=-0.023718906566500664\n",
      "   -5.5512 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "--------------\n",
      "   -7.5465 if cv>=-0.016934332624077793\n",
      "   +5.3443 if pav<=0.24460948705673222\n",
      "   +0.0002 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -4.2527 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -1.2243 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   +2.5635 if pav>=0.029663847386837014\n",
      "   -1.5898 if cp>=0.9493266582489016 & pa>=-0.012121891044080256 & pav<=-0.04674722999334333\n",
      "   +5.1893 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +5.4713 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   -1.4651 if cp<=0.5347496747970586 & cv<=1.7820865869522107 & cv>=0.02982740998268128 & cv>=0.5832018971443177 & pa<=0.12812677323818208 & pa>=0.1197730839252472 & pav<=0.16816720962524423 & pav>=0.015858380310237417\n",
      "   +0.0002 if cp>=0.20222710072994232 & cp>=0.6786766052246097 & cv<=1.833206295967102 & pa<=0.1263148933649063 & pa>=0.1074947640299797 & pav<=0.006816068198531866\n",
      "   +3.7668 if pav<=0.2759992480278015 & pav>=0.2759992480278015\n",
      "Run episode 388 with rewards 45.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 389 ===========\n",
      "94 actions [1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1]\n",
      "   -0.9338 if pav>=0.105914668738842\n",
      "   +1.0506 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +0.0000 if cv>=0.12479247599840164\n",
      "   -0.9255 if pav>=0.10900827497243881\n",
      "   +0.0000 if cp<=0.19321814179420477 & pa>=0.1284493774175644\n",
      "   -2.6037 if pav<=0.19076273441314703\n",
      "   +0.0000 if cv>=0.1838614135980606 & pav<=0.043705208599567516\n",
      "   +0.5838 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +0.0121 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   +2.1046 if cp<=-0.023718906566500664\n",
      "   -0.9249 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -2.1562 if cp>=-0.013146681524813174 & pa<=-0.060607252269983286\n",
      "--------------\n",
      "   -8.1840 if cv>=-0.016934332624077793\n",
      "   +0.9219 if pav<=0.24460948705673222\n",
      "   -0.4408 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -0.4408 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   +2.7411 if pav>=0.029663847386837014\n",
      "   +0.0000 if cp>=0.9493266582489016 & pa>=-0.012121891044080256 & pav<=-0.04674722999334333\n",
      "   +0.0000 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +0.0000 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   +0.0000 if cp<=0.5347496747970586 & cv<=1.7820865869522107 & cv>=0.02982740998268128 & cv>=0.5832018971443177 & pa<=0.12812677323818208 & pa>=0.1197730839252472 & pav<=0.16816720962524423 & pav>=0.015858380310237417\n",
      "   +0.0000 if cp>=0.20222710072994232 & cp>=0.6786766052246097 & cv<=1.833206295967102 & pa<=0.1263148933649063 & pa>=0.1074947640299797 & pav<=0.006816068198531866\n",
      "   +0.0000 if pav<=0.2759992480278015 & pav>=0.2759992480278015\n",
      "   -2.9375 if cp<=-0.02678089067339897 & cv>=-0.18006837964057923 & pav>=-0.39145669937133787\n",
      "Run episode 389 with rewards 94.0\n",
      "============ 390 ===========\n",
      "70 actions [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1]\n",
      "   -2.2108 if pav>=0.105914668738842\n",
      "   +1.2270 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +1.0183 if cv>=0.12479247599840164\n",
      "   -2.2108 if pav>=0.10900827497243881\n",
      "   -2.1879 if pav<=0.19076273441314703\n",
      "   -0.0000 if cv>=0.1838614135980606 & pav<=0.043705208599567516\n",
      "   +2.5760 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -2.4371 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   +3.0161 if cp<=-0.023718906566500664\n",
      "   -2.1283 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -0.0004 if cp>=-0.013146681524813174 & pa<=-0.060607252269983286\n",
      "   -3.2143 if pa>=-0.0015114990528672934\n",
      "--------------\n",
      "   -7.5525 if cv>=-0.016934332624077793\n",
      "   -2.9047 if pav<=0.24460948705673222\n",
      "   -2.7117 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +5.1349 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   +4.5370 if pav>=0.029663847386837014\n",
      "   +0.0000 if cp>=0.9493266582489016 & pa>=-0.012121891044080256 & pav<=-0.04674722999334333\n",
      "   +0.0000 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +0.0000 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   +0.0000 if cp<=0.5347496747970586 & cv<=1.7820865869522107 & cv>=0.02982740998268128 & cv>=0.5832018971443177 & pa<=0.12812677323818208 & pa>=0.1197730839252472 & pav<=0.16816720962524423 & pav>=0.015858380310237417\n",
      "   +0.0000 if pav<=0.2759992480278015 & pav>=0.2759992480278015\n",
      "   -0.1233 if cp<=-0.02678089067339897 & cv>=-0.18006837964057923 & pav>=-0.39145669937133787\n",
      "   +3.5101 if pa>=-0.0015114990528672934\n",
      "Run episode 390 with rewards 70.0\n",
      "============ 391 ===========\n",
      "141 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0]\n",
      "   -0.8115 if pav>=0.105914668738842\n",
      "   +4.0846 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +4.0645 if cv>=0.12479247599840164\n",
      "   -0.8115 if pav>=0.10900827497243881\n",
      "   -3.1372 if pav<=0.19076273441314703\n",
      "   +4.9015 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -2.3560 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   -0.0005 if cp<=-0.023718906566500664\n",
      "   -0.7563 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   +1.9302 if cp>=-0.013146681524813174 & pa<=-0.060607252269983286\n",
      "   -1.3842 if pa>=-0.0015114990528672934\n",
      "   -3.9586 if pav>=-0.21564951241016386\n",
      "--------------\n",
      "   -5.8218 if cv>=-0.016934332624077793\n",
      "   +0.7811 if pav<=0.24460948705673222\n",
      "   -6.3390 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +4.8442 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   +2.5822 if pav>=0.029663847386837014\n",
      "   +0.0000 if cp>=0.9493266582489016 & pa>=-0.012121891044080256 & pav<=-0.04674722999334333\n",
      "   +0.0000 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +0.0000 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   +0.0000 if pav<=0.2759992480278015 & pav>=0.2759992480278015\n",
      "   +0.0001 if cp<=-0.02678089067339897 & cv>=-0.18006837964057923 & pav>=-0.39145669937133787\n",
      "   +2.0834 if pa>=-0.0015114990528672934\n",
      "   -4.9377 if pa>=0.0015057497192174246 & pav<=-0.21564951241016386\n",
      "Run episode 391 with rewards 141.0\n",
      "============ 392 ===========\n",
      "133 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0]\n",
      "   -2.5244 if pav>=0.105914668738842\n",
      "   +5.8707 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +4.6779 if cv>=0.12479247599840164\n",
      "   -2.5244 if pav>=0.10900827497243881\n",
      "   -2.5588 if pav<=0.19076273441314703\n",
      "  +10.2768 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -3.3219 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   -0.3499 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -0.0001 if cp>=-0.013146681524813174 & pa<=-0.060607252269983286\n",
      "   -5.6949 if pa>=-0.0015114990528672934\n",
      "   -4.7207 if pav>=-0.21564951241016386\n",
      "   +2.8786 if cp>=0.023021183907985687\n",
      "--------------\n",
      "   -2.9781 if cv>=-0.016934332624077793\n",
      "   -6.0756 if pav<=0.24460948705673222\n",
      "   -7.1376 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +4.3161 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   -0.6738 if pav>=0.029663847386837014\n",
      "   +1.1919 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +1.2595 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   +0.0000 if pav<=0.2759992480278015 & pav>=0.2759992480278015\n",
      "   +0.8899 if cp<=-0.02678089067339897 & cv>=-0.18006837964057923 & pav>=-0.39145669937133787\n",
      "   +7.5349 if pa>=-0.0015114990528672934\n",
      "   -5.6880 if pa>=0.0015057497192174246 & pav<=-0.21564951241016386\n",
      "   +4.1949 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "Run episode 392 with rewards 133.0\n",
      "============ 393 ===========\n",
      "147 actions [0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0]\n",
      "   -2.1744 if pav>=0.105914668738842\n",
      "   +5.9552 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +1.1483 if cv>=0.12479247599840164\n",
      "   -0.8174 if pav>=0.10900827497243881\n",
      "   +1.3567 if pav<=0.19076273441314703\n",
      "   +7.5054 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -1.5737 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   +2.0921 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -2.4073 if pa>=-0.0015114990528672934\n",
      "   -9.0925 if pav>=-0.21564951241016386\n",
      "   +1.2533 if cp>=0.023021183907985687\n",
      "   +5.9758 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "--------------\n",
      "   +0.7404 if cv>=-0.016934332624077793\n",
      "   -5.1675 if pav<=0.24460948705673222\n",
      "   -6.1037 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +4.7030 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   -1.9672 if pav>=0.029663847386837014\n",
      "   +1.0337 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +6.5179 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   -1.5135 if cp<=-0.02678089067339897 & cv>=-0.18006837964057923 & pav>=-0.39145669937133787\n",
      "   +2.8531 if pa>=-0.0015114990528672934\n",
      "   -8.5692 if pa>=0.0015057497192174246 & pav<=-0.21564951241016386\n",
      "   +7.4850 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   -3.6886 if cp<=0.7091557383537297 & pa>=0.10148679614067078 & pav<=0.04774465858936311 & pav>=-0.08200356811285017\n",
      "Run episode 393 with rewards 147.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 394 ===========\n",
      "127 actions [0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0]\n",
      "   -8.0055 if pav>=0.105914668738842\n",
      "   +1.2256 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.1708 if cv>=0.12479247599840164\n",
      "   +5.1415 if pav<=0.19076273441314703\n",
      "   +8.9418 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +2.3196 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   +3.7105 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -7.0756 if pa>=-0.0015114990528672934\n",
      "   -8.5109 if pav>=-0.21564951241016386\n",
      "   +4.5286 if cp>=0.023021183907985687\n",
      "   +6.4342 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   -2.7909 if pav>=0.06305743753910065\n",
      "--------------\n",
      "   -3.9805 if pav<=0.24460948705673222\n",
      "   -7.7897 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +2.0323 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   -2.7983 if pav>=0.029663847386837014\n",
      "   +0.6551 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +0.6533 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   -0.1229 if cp<=-0.02678089067339897 & cv>=-0.18006837964057923 & pav>=-0.39145669937133787\n",
      "   +5.9211 if pa>=-0.0015114990528672934\n",
      "   -7.5479 if pa>=0.0015057497192174246 & pav<=-0.21564951241016386\n",
      "   +6.9372 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +0.0002 if cp<=0.7091557383537297 & pa>=0.10148679614067078 & pav<=0.04774465858936311 & pav>=-0.08200356811285017\n",
      "   +3.0849 if pav>=0.5656260251998901\n",
      "Run episode 394 with rewards 127.0\n",
      "origin 396.0336346016046 new 37289.562728290046 not updated\n",
      "============ 395 ===========\n",
      "127 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1]\n",
      "   -8.0055 if pav>=0.105914668738842\n",
      "   +1.2256 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.1708 if cv>=0.12479247599840164\n",
      "   +5.1415 if pav<=0.19076273441314703\n",
      "   +8.9418 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +2.3196 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   +3.7105 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -7.0756 if pa>=-0.0015114990528672934\n",
      "   -8.5109 if pav>=-0.21564951241016386\n",
      "   +4.5286 if cp>=0.023021183907985687\n",
      "   +6.4342 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   -2.7909 if pav>=0.06305743753910065\n",
      "--------------\n",
      "   -3.0768 if pav<=0.24460948705673222\n",
      "   -5.6527 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +0.4582 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   -2.2358 if pav>=0.029663847386837014\n",
      "   -0.1177 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +0.5722 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   +2.0439 if cp<=-0.02678089067339897 & cv>=-0.18006837964057923 & pav>=-0.39145669937133787\n",
      "   +3.4966 if pa>=-0.0015114990528672934\n",
      "   -4.1757 if pa>=0.0015057497192174246 & pav<=-0.21564951241016386\n",
      "   +6.5637 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +0.0006 if pav>=0.5656260251998901\n",
      "   +2.8206 if pa>=0.11967067420482635\n",
      "Run episode 395 with rewards 127.0\n",
      "origin 715.6769847675962 new 37094.45300645659 not updated\n",
      "============ 396 ===========\n",
      "118 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1]\n",
      "   -8.0055 if pav>=0.105914668738842\n",
      "   +1.2256 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.1708 if cv>=0.12479247599840164\n",
      "   +5.1415 if pav<=0.19076273441314703\n",
      "   +8.9418 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +2.3196 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   +3.7105 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -7.0756 if pa>=-0.0015114990528672934\n",
      "   -8.5109 if pav>=-0.21564951241016386\n",
      "   +4.5286 if cp>=0.023021183907985687\n",
      "   +6.4342 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   -2.7909 if pav>=0.06305743753910065\n",
      "--------------\n",
      "   -0.5863 if pav<=0.24460948705673222\n",
      "   -3.6639 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -3.6340 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   -7.1022 if pav>=0.029663847386837014\n",
      "   +1.7318 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +1.9339 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   +0.0007 if cp<=-0.02678089067339897 & cv>=-0.18006837964057923 & pav>=-0.39145669937133787\n",
      "   +1.4825 if pa>=-0.0015114990528672934\n",
      "   -3.1534 if pa>=0.0015057497192174246 & pav<=-0.21564951241016386\n",
      "   +6.2437 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +1.2345 if pa>=0.11967067420482635\n",
      "   +3.4248 if pav>=-0.09002201110124577\n",
      "Run episode 396 with rewards 118.0\n",
      "origin 423.80895784980726 new 33016.981666203894 not updated\n",
      "============ 397 ===========\n",
      "129 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1]\n",
      "   -8.0055 if pav>=0.105914668738842\n",
      "   +1.2256 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.1708 if cv>=0.12479247599840164\n",
      "   +5.1415 if pav<=0.19076273441314703\n",
      "   +8.9418 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +2.3196 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   +3.7105 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -7.0756 if pa>=-0.0015114990528672934\n",
      "   -8.5109 if pav>=-0.21564951241016386\n",
      "   +4.5286 if cp>=0.023021183907985687\n",
      "   +6.4342 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   -2.7909 if pav>=0.06305743753910065\n",
      "--------------\n",
      "   -9.5305 if pav<=0.24460948705673222\n",
      "   -3.4657 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -1.9557 if cv<=1.834164834022522 & pav<=0.046417894959449826\n",
      "   -7.1423 if pav>=0.029663847386837014\n",
      "   +2.4024 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +2.2300 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   +8.9630 if pa>=-0.0015114990528672934\n",
      "   -5.9888 if pa>=0.0015057497192174246 & pav<=-0.21564951241016386\n",
      "  +10.6384 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +3.5720 if pa>=0.11967067420482635\n",
      "   +2.2128 if pav>=-0.09002201110124577\n",
      "   -2.4486 if cp>=2.3851780891418457\n",
      "Run episode 397 with rewards 129.0\n",
      "origin 359.5794250744684 new 38175.70147817509 not updated\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 398 ===========\n",
      "152 actions [0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1]\n",
      "   -8.0055 if pav>=0.105914668738842\n",
      "   +1.2256 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.1708 if cv>=0.12479247599840164\n",
      "   +5.1415 if pav<=0.19076273441314703\n",
      "   +8.9418 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +2.3196 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   +3.7105 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -7.0756 if pa>=-0.0015114990528672934\n",
      "   -8.5109 if pav>=-0.21564951241016386\n",
      "   +4.5286 if cp>=0.023021183907985687\n",
      "   +6.4342 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   -2.7909 if pav>=0.06305743753910065\n",
      "--------------\n",
      "   -8.2331 if pav<=0.24460948705673222\n",
      "   -4.3095 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -6.3395 if pav>=0.029663847386837014\n",
      "   +3.8309 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +2.6540 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   +5.7669 if pa>=-0.0015114990528672934\n",
      "   -1.9653 if pa>=0.0015057497192174246 & pav<=-0.21564951241016386\n",
      "   +7.4883 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   -0.0005 if pa>=0.11967067420482635\n",
      "   +2.3989 if pav>=-0.09002201110124577\n",
      "   -0.0139 if cp>=2.3851780891418457\n",
      "   +4.3855 if pa>=0.11334770917892456\n",
      "Run episode 398 with rewards 152.0\n",
      "origin 1136.1650125969225 new 49318.8836695642 not updated\n",
      "============ 399 ===========\n",
      "151 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1]\n",
      "   -8.0055 if pav>=0.105914668738842\n",
      "   +1.2256 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.1708 if cv>=0.12479247599840164\n",
      "   +5.1415 if pav<=0.19076273441314703\n",
      "   +8.9418 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +2.3196 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   +3.7105 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -7.0756 if pa>=-0.0015114990528672934\n",
      "   -8.5109 if pav>=-0.21564951241016386\n",
      "   +4.5286 if cp>=0.023021183907985687\n",
      "   +6.4342 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   -2.7909 if pav>=0.06305743753910065\n",
      "--------------\n",
      "   -8.5301 if pav<=0.24460948705673222\n",
      "   -7.4665 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -9.0452 if pav>=0.029663847386837014\n",
      "   +6.0448 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +1.4270 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   +6.7993 if pa>=-0.0015114990528672934\n",
      "   -2.2591 if pa>=0.0015057497192174246 & pav<=-0.21564951241016386\n",
      "   +6.9455 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +6.0705 if pav>=-0.09002201110124577\n",
      "   -0.0000 if cp>=2.3851780891418457\n",
      "   -0.0017 if pa>=0.11334770917892456\n",
      "   +6.4078 if pa>=0.10990279912948608\n",
      "Run episode 399 with rewards 151.0\n",
      "origin 469.6621616208148 new 48797.32721354565 not updated\n",
      "============ 400 ===========\n",
      "133 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1]\n",
      "   -8.0055 if pav>=0.105914668738842\n",
      "   +1.2256 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.1708 if cv>=0.12479247599840164\n",
      "   +5.1415 if pav<=0.19076273441314703\n",
      "   +8.9418 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +2.3196 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   +3.7105 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -7.0756 if pa>=-0.0015114990528672934\n",
      "   -8.5109 if pav>=-0.21564951241016386\n",
      "   +4.5286 if cp>=0.023021183907985687\n",
      "   +6.4342 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   -2.7909 if pav>=0.06305743753910065\n",
      "--------------\n",
      "   -6.7571 if pav<=0.24460948705673222\n",
      "   -4.7785 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -2.5493 if pav>=0.029663847386837014\n",
      "   +7.9325 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +3.0303 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   +2.5429 if pa>=-0.0015114990528672934\n",
      "   -2.1346 if pa>=0.0015057497192174246 & pav<=-0.21564951241016386\n",
      "   +7.0859 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +3.5736 if pav>=-0.09002201110124577\n",
      "   -1.6293 if pa>=0.11334770917892456\n",
      "   +6.2218 if pa>=0.10990279912948608\n",
      "   -1.8269 if pav>=0.04778921976685526\n",
      "Run episode 400 with rewards 133.0\n",
      "origin 810.54543286134 new 39705.11493242681 not updated\n",
      "============ 401 ===========\n",
      "129 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1]\n",
      "   -8.0055 if pav>=0.105914668738842\n",
      "   +1.2256 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   -0.1708 if cv>=0.12479247599840164\n",
      "   +5.1415 if pav<=0.19076273441314703\n",
      "   +8.9418 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +2.3196 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   +3.7105 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -7.0756 if pa>=-0.0015114990528672934\n",
      "   -8.5109 if pav>=-0.21564951241016386\n",
      "   +4.5286 if cp>=0.023021183907985687\n",
      "   +6.4342 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   -2.7909 if pav>=0.06305743753910065\n",
      "--------------\n",
      "   -9.0464 if pav<=0.24460948705673222\n",
      "   -9.0478 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -3.0253 if pav>=0.029663847386837014\n",
      "  +10.0537 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   -0.0003 if cv<=1.772495174407959 & cv>=1.4093816995620727 & pa>=0.05492815300822258 & pav<=0.1386557340621949 & pav>=-0.14960525333881372\n",
      "   +6.0429 if pa>=-0.0015114990528672934\n",
      "   -1.4641 if pa>=0.0015057497192174246 & pav<=-0.21564951241016386\n",
      "   +9.0373 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +8.1184 if pav>=-0.09002201110124577\n",
      "   -0.0005 if pa>=0.10990279912948608\n",
      "   -5.5024 if pav>=0.04778921976685526\n",
      "   +5.0017 if pa>=0.1086120456457138\n",
      "Run episode 401 with rewards 129.0\n",
      "============ 402 ===========\n",
      "149 actions [0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0]\n",
      "   -3.3410 if pav>=0.105914668738842\n",
      "   +4.9496 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +4.3936 if pav<=0.19076273441314703\n",
      "   +4.4230 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +0.3713 if cv<=1.3126796245574952 & pav>=-0.11675076782703399\n",
      "   +3.4217 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -2.5514 if pa>=-0.0015114990528672934\n",
      "   -9.2234 if pav>=-0.21564951241016386\n",
      "   -1.3478 if cp>=0.023021183907985687\n",
      "   +5.2907 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   -1.8200 if pav>=0.06305743753910065\n",
      "   +5.2112 if pa>=0.11328637599945068\n",
      "--------------\n",
      "   -6.8486 if pav<=0.24460948705673222\n",
      "   -8.3750 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -4.5118 if pav>=0.029663847386837014\n",
      "   +8.7488 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +2.9795 if pa>=-0.0015114990528672934\n",
      "   -1.0231 if pa>=0.0015057497192174246 & pav<=-0.21564951241016386\n",
      "   +9.0423 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +9.1267 if pav>=-0.09002201110124577\n",
      "   +4.4558 if pa>=0.10990279912948608\n",
      "   -4.8249 if pav>=0.04778921976685526\n",
      "   +4.4573 if pa>=0.1086120456457138\n",
      "   -6.1230 if pa>=0.11328637599945068\n",
      "Run episode 402 with rewards 149.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 403 ===========\n",
      "149 actions [0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   -3.5052 if pav>=0.105914668738842\n",
      "   +3.7595 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +5.1751 if pav<=0.19076273441314703\n",
      "   +4.9028 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +5.6956 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -2.2948 if pa>=-0.0015114990528672934\n",
      "   -9.3520 if pav>=-0.21564951241016386\n",
      "   -3.5310 if cp>=0.023021183907985687\n",
      "   +5.9051 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   -2.2847 if pav>=0.06305743753910065\n",
      "   -0.0001 if pa>=0.11328637599945068\n",
      "   +4.0653 if cp>=0.09292074441909794 & cv<=1.453850269317627 & pa<=0.09489486813545227 & pa>=0.08252426087856293 & pav<=0.05076145231723788\n",
      "--------------\n",
      "   -6.5138 if pav<=0.24460948705673222\n",
      "   -9.5027 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -2.7904 if pav>=0.029663847386837014\n",
      "   +8.3826 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +4.1689 if pa>=-0.0015114990528672934\n",
      "   +6.9616 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +9.9116 if pav>=-0.09002201110124577\n",
      "   +4.1607 if pa>=0.10990279912948608\n",
      "   -8.7116 if pav>=0.04778921976685526\n",
      "   +4.1477 if pa>=0.1086120456457138\n",
      "   +0.0015 if pa>=0.11328637599945068\n",
      "   -2.4931 if cp<=1.5362601757049563 & cp>=0.09292074441909794 & cv<=1.453850269317627 & pa<=0.09489486813545227 & pa>=0.08252426087856293 & pav<=0.05076145231723788\n",
      "Run episode 403 with rewards 149.0\n",
      "============ 404 ===========\n",
      "153 actions [0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0]\n",
      "   -7.0050 if pav>=0.105914668738842\n",
      "   +3.2848 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +3.4548 if pav<=0.19076273441314703\n",
      "   +8.0398 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +4.7000 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -4.2220 if pa>=-0.0015114990528672934\n",
      "   -7.8739 if pav>=-0.21564951241016386\n",
      "   -2.0248 if cp>=0.023021183907985687\n",
      "   +7.0231 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   -0.7572 if pav>=0.06305743753910065\n",
      "   +3.2954 if cp>=0.09292074441909794 & cv<=1.453850269317627 & pa<=0.09489486813545227 & pa>=0.08252426087856293 & pav<=0.05076145231723788\n",
      "   +3.5721 if cv>=0.671009647846222 & pa>=0.05027810782194139 & pav<=0.0647647328674794\n",
      "--------------\n",
      "   -6.6853 if pav<=0.24460948705673222\n",
      "   -9.8648 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -3.8219 if pav>=0.029663847386837014\n",
      "   +8.5280 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +7.3005 if pa>=-0.0015114990528672934\n",
      "   +5.8977 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +9.5180 if pav>=-0.09002201110124577\n",
      "   +0.0008 if pa>=0.10990279912948608\n",
      "   -6.8425 if pav>=0.04778921976685526\n",
      "   +0.0008 if pa>=0.1086120456457138\n",
      "   -3.9186 if cp<=1.5362601757049563 & cp>=0.09292074441909794 & cv<=1.453850269317627 & pa<=0.09489486813545227 & pa>=0.08252426087856293 & pav<=0.05076145231723788\n",
      "   -2.6422 if cp<=1.5557722806930545 & pa>=-0.03226159438490868\n",
      "Run episode 404 with rewards 153.0\n",
      "============ 405 ===========\n",
      "157 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0]\n",
      "   -6.4444 if pav>=0.105914668738842\n",
      "   +2.8196 if pa<=0.1111291527748108 & pav<=0.10654703080654145 & pav>=-0.13545677959918975\n",
      "   +7.4735 if pav<=0.19076273441314703\n",
      "   +7.9987 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +5.2798 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -7.4598 if pa>=-0.0015114990528672934\n",
      "   -8.2717 if pav>=-0.21564951241016386\n",
      "   -4.3390 if cp>=0.023021183907985687\n",
      "   +5.1897 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   +3.8076 if cp>=0.09292074441909794 & cv<=1.453850269317627 & pa<=0.09489486813545227 & pa>=0.08252426087856293 & pav<=0.05076145231723788\n",
      "   +4.8178 if cv>=0.671009647846222 & pa>=0.05027810782194139 & pav<=0.0647647328674794\n",
      "   -6.0228 if pav>=0.803054690361023\n",
      "--------------\n",
      "   -8.0646 if pav<=0.24460948705673222\n",
      "  -10.3225 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -1.7138 if pav>=0.029663847386837014\n",
      "   +7.3610 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "  +11.2950 if pa>=-0.0015114990528672934\n",
      "   +8.1854 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +9.6262 if pav>=-0.09002201110124577\n",
      "   +0.0001 if pa>=0.10990279912948608\n",
      "   -8.4226 if pav>=0.04778921976685526\n",
      "   -3.6683 if cp<=1.5362601757049563 & cp>=0.09292074441909794 & cv<=1.453850269317627 & pa<=0.09489486813545227 & pa>=0.08252426087856293 & pav<=0.05076145231723788\n",
      "   -4.7031 if cp<=1.5557722806930545 & pa>=-0.03226159438490868\n",
      "   +5.9935 if pav>=0.803054690361023\n",
      "Run episode 405 with rewards 157.0\n",
      "============ 406 ===========\n",
      "304 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1]\n",
      "   -8.3999 if pav>=0.105914668738842\n",
      "   +7.2736 if pav<=0.19076273441314703\n",
      "  +10.0935 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +2.0638 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "  -11.8196 if pa>=-0.0015114990528672934\n",
      "   -5.0463 if pav>=-0.21564951241016386\n",
      "   -2.8754 if cp>=0.023021183907985687\n",
      "   +3.6344 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   +5.8078 if cp>=0.09292074441909794 & cv<=1.453850269317627 & pa<=0.09489486813545227 & pa>=0.08252426087856293 & pav<=0.05076145231723788\n",
      "   +5.8597 if cv>=0.671009647846222 & pa>=0.05027810782194139 & pav<=0.0647647328674794\n",
      "   +0.0001 if pav>=0.803054690361023\n",
      "   +5.0756 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "--------------\n",
      "  -10.4860 if pav<=0.24460948705673222\n",
      "   -9.5894 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +0.5387 if pav>=0.029663847386837014\n",
      "   +4.2090 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +4.6803 if pa>=-0.0015114990528672934\n",
      "   +6.2330 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +9.3311 if pav>=-0.09002201110124577\n",
      "   -6.4117 if pav>=0.04778921976685526\n",
      "   -4.7325 if cp<=1.5362601757049563 & cp>=0.09292074441909794 & cv<=1.453850269317627 & pa<=0.09489486813545227 & pa>=0.08252426087856293 & pav<=0.05076145231723788\n",
      "   +4.6648 if cp<=1.5557722806930545 & pa>=-0.03226159438490868\n",
      "   +0.0009 if pav>=0.803054690361023\n",
      "   -7.3725 if cp<=0.9816968679428103 & cv<=0.7277598142623901 & cv>=0.19991366863250734 & pa>=0.07209430336952209 & pav<=0.2290336310863496 & pav>=0.05907522141933444\n",
      "Run episode 406 with rewards 304.0\n",
      "best\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 407 ===========\n",
      "500 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "  -10.2426 if pav>=0.105914668738842\n",
      "   +5.8898 if pav<=0.19076273441314703\n",
      "   +8.4507 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +3.7135 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -9.0246 if pa>=-0.0015114990528672934\n",
      "   -4.4810 if pav>=-0.21564951241016386\n",
      "   -1.7379 if cp>=0.023021183907985687\n",
      "   +3.5039 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   +5.9431 if cp>=0.09292074441909794 & cv<=1.453850269317627 & pa<=0.09489486813545227 & pa>=0.08252426087856293 & pav<=0.05076145231723788\n",
      "   +2.9131 if cv>=0.671009647846222 & pa>=0.05027810782194139 & pav<=0.0647647328674794\n",
      "   +5.9901 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "   -2.3097 if cp>=0.08793166130781174 & cv<=0.7264650344848633 & cv>=-0.36476999521255493 & cv>=0.17411399781703957 & pav<=0.09162152707576755 & pav>=-0.1439988523721695\n",
      "--------------\n",
      "  -11.5635 if pav<=0.24460948705673222\n",
      "  -11.4557 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +0.7955 if pav>=0.029663847386837014\n",
      "   +6.5933 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +5.3029 if pa>=-0.0015114990528672934\n",
      "   +9.1419 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "  +10.5379 if pav>=-0.09002201110124577\n",
      "   -6.3694 if pav>=0.04778921976685526\n",
      "   -4.9192 if cp<=1.5362601757049563 & cp>=0.09292074441909794 & cv<=1.453850269317627 & pa<=0.09489486813545227 & pa>=0.08252426087856293 & pav<=0.05076145231723788\n",
      "   +5.3298 if cp<=1.5557722806930545 & pa>=-0.03226159438490868\n",
      "   -9.2491 if cp<=0.9816968679428103 & cv<=0.7277598142623901 & cv>=0.19991366863250734 & pa>=0.07209430336952209 & pav<=0.2290336310863496 & pav>=0.05907522141933444\n",
      "   -5.2248 if cp<=0.08793166130781174 & pa>=0.06844294667243958 & pav<=-0.017319971695542336 & pav>=-0.1439988523721695\n",
      "Run episode 407 with rewards 500.0\n",
      "best\n",
      "============ 408 ===========\n",
      "500 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0]\n",
      "  -13.0397 if pav>=0.105914668738842\n",
      "   +3.4251 if pav<=0.19076273441314703\n",
      "   +9.8099 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +6.2786 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -8.7793 if pa>=-0.0015114990528672934\n",
      "   -3.3649 if pav>=-0.21564951241016386\n",
      "   +3.4399 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   +2.0927 if cp>=0.09292074441909794 & cv<=1.453850269317627 & pa<=0.09489486813545227 & pa>=0.08252426087856293 & pav<=0.05076145231723788\n",
      "   +4.3832 if cv>=0.671009647846222 & pa>=0.05027810782194139 & pav<=0.0647647328674794\n",
      "   +4.0432 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "   -4.4565 if cp>=0.08793166130781174 & cv<=0.7264650344848633 & cv>=-0.36476999521255493 & cv>=0.17411399781703957 & pav<=0.09162152707576755 & pav>=-0.1439988523721695\n",
      "   +4.3321 if cp>=2.296234130859375\n",
      "--------------\n",
      "  -10.0450 if pav<=0.24460948705673222\n",
      "  -12.2032 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +6.7089 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +5.2893 if pa>=-0.0015114990528672934\n",
      "   +9.2197 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +9.6335 if pav>=-0.09002201110124577\n",
      "   -5.8346 if pav>=0.04778921976685526\n",
      "   -0.5510 if cp<=1.5362601757049563 & cp>=0.09292074441909794 & cv<=1.453850269317627 & pa<=0.09489486813545227 & pa>=0.08252426087856293 & pav<=0.05076145231723788\n",
      "   +6.1299 if cp<=1.5557722806930545 & pa>=-0.03226159438490868\n",
      "   -9.9244 if cp<=0.9816968679428103 & cv<=0.7277598142623901 & cv>=0.19991366863250734 & pa>=0.07209430336952209 & pav<=0.2290336310863496 & pav>=0.05907522141933444\n",
      "   -6.1318 if cp<=0.08793166130781174 & pa>=0.06844294667243958 & pav<=-0.017319971695542336 & pav>=-0.1439988523721695\n",
      "   -1.3458 if pa>=-0.05133495703339576 & pav<=0.2011939972639087\n",
      "Run episode 408 with rewards 500.0\n",
      "best\n",
      "============ 409 ===========\n",
      "130 actions [0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1]\n",
      "  -13.7886 if pav>=0.105914668738842\n",
      "   +2.7392 if pav<=0.19076273441314703\n",
      "  +10.5144 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +7.0127 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -8.3057 if pa>=-0.0015114990528672934\n",
      "   +1.2817 if pav>=-0.21564951241016386\n",
      "   +4.2164 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   +5.6492 if cv>=0.671009647846222 & pa>=0.05027810782194139 & pav<=0.0647647328674794\n",
      "   +5.5572 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "   -5.4842 if cp>=0.08793166130781174 & cv<=0.7264650344848633 & cv>=-0.36476999521255493 & cv>=0.17411399781703957 & pav<=0.09162152707576755 & pav>=-0.1439988523721695\n",
      "   +3.5293 if cp>=2.296234130859375\n",
      "   -4.0123 if pav>=-0.21673575043678284\n",
      "--------------\n",
      "   -9.5371 if pav<=0.24460948705673222\n",
      "  -14.8681 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -2.1748 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +5.4531 if pa>=-0.0015114990528672934\n",
      "  +14.9773 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +9.2274 if pav>=-0.09002201110124577\n",
      "   -5.7081 if pav>=0.04778921976685526\n",
      "   +5.0000 if cp<=1.5557722806930545 & pa>=-0.03226159438490868\n",
      "   -3.8968 if cp<=0.9816968679428103 & cv<=0.7277598142623901 & cv>=0.19991366863250734 & pa>=0.07209430336952209 & pav<=0.2290336310863496 & pav>=0.05907522141933444\n",
      "   -6.2291 if cp<=0.08793166130781174 & pa>=0.06844294667243958 & pav<=-0.017319971695542336 & pav>=-0.1439988523721695\n",
      "   -1.6519 if pa>=-0.05133495703339576 & pav<=0.2011939972639087\n",
      "   +1.9229 if cp<=1.7203015565872193 & cp>=1.0971697807312013 & cv<=-0.04158004000782966 & cv<=-0.2375558942556381 & pa<=-0.019524512067437168 & pav<=0.06660144031047821 & pav<=0.2128232628107072 & pav>=-0.21673575043678284\n",
      "Run episode 409 with rewards 130.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 410 ===========\n",
      "136 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1]\n",
      "   -8.9972 if pav>=0.105914668738842\n",
      "   +3.1400 if pav<=0.19076273441314703\n",
      "  +11.3492 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +2.3081 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -8.3431 if pa>=-0.0015114990528672934\n",
      "   +4.7261 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   +8.4003 if cv>=0.671009647846222 & pa>=0.05027810782194139 & pav<=0.0647647328674794\n",
      "   +1.4356 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "   -1.1800 if cp>=0.08793166130781174 & cv<=0.7264650344848633 & cv>=-0.36476999521255493 & cv>=0.17411399781703957 & pav<=0.09162152707576755 & pav>=-0.1439988523721695\n",
      "  -19.9286 if cp>=2.296234130859375\n",
      "   -3.5344 if pav>=-0.21673575043678284\n",
      "   -3.5470 if pa>=0.12037359923124313\n",
      "--------------\n",
      "   -9.8041 if pav<=0.24460948705673222\n",
      "  -13.0377 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -1.9155 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +4.1848 if pa>=-0.0015114990528672934\n",
      "   +6.8638 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +8.9804 if pav>=-0.09002201110124577\n",
      "   -8.1584 if pav>=0.04778921976685526\n",
      "   +4.1653 if cp<=1.5557722806930545 & pa>=-0.03226159438490868\n",
      "   -3.4782 if cp<=0.9816968679428103 & cv<=0.7277598142623901 & cv>=0.19991366863250734 & pa>=0.07209430336952209 & pav<=0.2290336310863496 & pav>=0.05907522141933444\n",
      "   -6.1781 if cp<=0.08793166130781174 & pa>=0.06844294667243958 & pav<=-0.017319971695542336 & pav>=-0.1439988523721695\n",
      "   +0.0000 if cp<=1.7203015565872193 & cp>=1.0971697807312013 & cv<=-0.04158004000782966 & cv<=-0.2375558942556381 & pa<=-0.019524512067437168 & pav<=0.06660144031047821 & pav<=0.2128232628107072 & pav>=-0.21673575043678284\n",
      "   +4.1638 if pav>=0.07094108760356906\n",
      "Run episode 410 with rewards 136.0\n",
      "============ 411 ===========\n",
      "143 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0]\n",
      "   -2.9985 if pav>=0.105914668738842\n",
      "   +3.0179 if pav<=0.19076273441314703\n",
      "   +8.8093 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -1.8027 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -3.5017 if pa>=-0.0015114990528672934\n",
      "   +2.9215 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   +7.6790 if cv>=0.671009647846222 & pa>=0.05027810782194139 & pav<=0.0647647328674794\n",
      "   +1.2810 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "  +22.6074 if cp>=2.296234130859375\n",
      "   -6.9247 if pav>=-0.21673575043678284\n",
      "   +3.1348 if pa>=0.12037359923124313\n",
      "   -0.6730 if cv<=0.13792100548744202 & cv<=1.2311040163040161 & pa>=0.04021962732076645 & pav<=0.17802542448043823 & pav>=-0.19224731624126434\n",
      "--------------\n",
      "   -1.5100 if pav<=0.24460948705673222\n",
      "   -7.2506 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -4.2098 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   -1.6640 if pa>=-0.0015114990528672934\n",
      "   +6.1727 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +9.7977 if pav>=-0.09002201110124577\n",
      "   -4.8831 if pav>=0.04778921976685526\n",
      "   -2.6715 if cp<=1.5557722806930545 & pa>=-0.03226159438490868\n",
      "   -4.4696 if cp<=0.9816968679428103 & cv<=0.7277598142623901 & cv>=0.19991366863250734 & pa>=0.07209430336952209 & pav<=0.2290336310863496 & pav>=0.05907522141933444\n",
      "   -1.1110 if cp<=0.08793166130781174 & pa>=0.06844294667243958 & pav<=-0.017319971695542336 & pav>=-0.1439988523721695\n",
      "   +7.1409 if pav>=0.07094108760356906\n",
      "   -2.7064 if cp>=0.15984652936458588 & pa>=0.10311844199895859 & pav<=0.04924763366580012 & pav>=-0.05265270173549652\n",
      "Run episode 411 with rewards 143.0\n",
      "============ 412 ===========\n",
      "118 actions [0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1]\n",
      "   +0.3533 if pav>=0.105914668738842\n",
      "   +6.2076 if pav<=0.19076273441314703\n",
      "   +5.2368 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -2.1293 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -3.6693 if pa>=-0.0015114990528672934\n",
      "   +2.1876 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   +3.4125 if cv>=0.671009647846222 & pa>=0.05027810782194139 & pav<=0.0647647328674794\n",
      "   +0.4791 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "  -19.5421 if cp>=2.296234130859375\n",
      "   -5.6430 if pav>=-0.21673575043678284\n",
      "   -3.3982 if pa>=0.12037359923124313\n",
      "   -3.6766 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "--------------\n",
      "   -1.8326 if pav<=0.24460948705673222\n",
      "   -9.7236 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -6.3581 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   -1.3115 if pa>=-0.0015114990528672934\n",
      "   +6.7067 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +9.2269 if pav>=-0.09002201110124577\n",
      "   -1.2090 if pav>=0.04778921976685526\n",
      "   -0.5688 if cp<=1.5557722806930545 & pa>=-0.03226159438490868\n",
      "  -10.4488 if cp<=0.9816968679428103 & cv<=0.7277598142623901 & cv>=0.19991366863250734 & pa>=0.07209430336952209 & pav<=0.2290336310863496 & pav>=0.05907522141933444\n",
      "   +2.9334 if pav>=0.07094108760356906\n",
      "   -1.5387 if cp>=0.15984652936458588 & pa>=0.10311844199895859 & pav<=0.04924763366580012 & pav>=-0.05265270173549652\n",
      "   +5.6581 if cp<=0.4493234395980838 & pa>=0.10671222060918809 & pa>=0.1134915977716446 & pav<=0.08552064299583462 & pav>=-0.035066262632608404\n",
      "Run episode 412 with rewards 118.0\n",
      "============ 413 ===========\n",
      "137 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0]\n",
      "   +8.3272 if pav<=0.19076273441314703\n",
      "   +2.5288 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +0.4721 if pa<=0.05730791762471199 & pav>=0.13789224624633797\n",
      "   -1.1443 if pa>=-0.0015114990528672934\n",
      "   +0.6382 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   +3.7560 if cv>=0.671009647846222 & pa>=0.05027810782194139 & pav<=0.0647647328674794\n",
      "   -3.0946 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "  +24.4301 if cp>=2.296234130859375\n",
      "   -8.8364 if pav>=-0.21673575043678284\n",
      "   -4.9637 if pa>=0.12037359923124313\n",
      "   -3.1153 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "   -2.3285 if pa>=0.14750264585018158\n",
      "--------------\n",
      "   -1.1141 if pav<=0.24460948705673222\n",
      "  -11.1068 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -6.2306 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   -0.4331 if pa>=-0.0015114990528672934\n",
      "   +5.8433 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +5.9564 if pav>=-0.09002201110124577\n",
      "   +0.8091 if pav>=0.04778921976685526\n",
      "   -9.6328 if cp<=0.9816968679428103 & cv<=0.7277598142623901 & cv>=0.19991366863250734 & pa>=0.07209430336952209 & pav<=0.2290336310863496 & pav>=0.05907522141933444\n",
      "   +2.4165 if pav>=0.07094108760356906\n",
      "   +1.1466 if cp>=0.15984652936458588 & pa>=0.10311844199895859 & pav<=0.04924763366580012 & pav>=-0.05265270173549652\n",
      "   +3.9824 if cp<=0.4493234395980838 & pa>=0.10671222060918809 & pa>=0.1134915977716446 & pav<=0.08552064299583462 & pav>=-0.035066262632608404\n",
      "   -4.5465 if cp<=0.6084646463394169 & cp>=0.15900577604770666 & cv>=0.6649441838264473 & pa<=0.13059536516666412 & pav>=0.08577578365802775\n",
      "Run episode 413 with rewards 137.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 414 ===========\n",
      "199 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1]\n",
      "   +7.0012 if pav<=0.19076273441314703\n",
      "   +2.5474 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +2.1823 if pa>=-0.0015114990528672934\n",
      "   -0.0136 if cv<=1.2749298095703125 & cv>=0.7504771232604981 & pav<=0.2101341933012009 & pav>=0.04774465858936311\n",
      "   +1.5660 if cv>=0.671009647846222 & pa>=0.05027810782194139 & pav<=0.0647647328674794\n",
      "   +5.3813 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "  -12.8058 if cp>=2.296234130859375\n",
      "  -10.3144 if pav>=-0.21673575043678284\n",
      "   -3.4868 if pa>=0.12037359923124313\n",
      "   -6.0887 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "   -0.8209 if pa>=0.14750264585018158\n",
      "   -0.0739 if pa>=0.14568965137004852\n",
      "--------------\n",
      "   -1.1379 if pav<=0.24460948705673222\n",
      "  -12.9703 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -4.2944 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +7.9289 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +5.4278 if pav>=-0.09002201110124577\n",
      "   -0.1034 if pav>=0.04778921976685526\n",
      "   -7.8515 if cp<=0.9816968679428103 & cv<=0.7277598142623901 & cv>=0.19991366863250734 & pa>=0.07209430336952209 & pav<=0.2290336310863496 & pav>=0.05907522141933444\n",
      "   +2.4496 if pav>=0.07094108760356906\n",
      "   +2.1257 if cp>=0.15984652936458588 & pa>=0.10311844199895859 & pav<=0.04924763366580012 & pav>=-0.05265270173549652\n",
      "   +4.3179 if cp<=0.4493234395980838 & pa>=0.10671222060918809 & pa>=0.1134915977716446 & pav<=0.08552064299583462 & pav>=-0.035066262632608404\n",
      "   -7.0284 if cp<=0.6084646463394169 & cp>=0.15900577604770666 & cv>=0.6649441838264473 & pa<=0.13059536516666412 & pav>=0.08577578365802775\n",
      "   +2.1445 if pa>=0.14568965137004852\n",
      "Run episode 414 with rewards 199.0\n",
      "============ 415 ===========\n",
      "120 actions [0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0]\n",
      "   +2.9948 if pav<=0.19076273441314703\n",
      "   +1.4409 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -2.2504 if pa>=-0.0015114990528672934\n",
      "   +5.3132 if cv>=0.671009647846222 & pa>=0.05027810782194139 & pav<=0.0647647328674794\n",
      "   +5.5584 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "  +16.0024 if cp>=2.296234130859375\n",
      "   -5.0740 if pav>=-0.21673575043678284\n",
      "   -6.2742 if pa>=0.12037359923124313\n",
      "   -6.3656 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "   +0.3480 if pa>=0.14750264585018158\n",
      "   +0.0637 if pa>=0.14568965137004852\n",
      "   +1.5289 if cv>=0.6918205738067628 & pav<=-0.03038508407771587\n",
      "--------------\n",
      "   -1.3094 if pav<=0.24460948705673222\n",
      "  -13.2045 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -5.0619 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   -0.0003 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +5.2467 if pav>=-0.09002201110124577\n",
      "   -4.1652 if cp<=0.9816968679428103 & cv<=0.7277598142623901 & cv>=0.19991366863250734 & pa>=0.07209430336952209 & pav<=0.2290336310863496 & pav>=0.05907522141933444\n",
      "   +6.7247 if pav>=0.07094108760356906\n",
      "   +3.6591 if cp>=0.15984652936458588 & pa>=0.10311844199895859 & pav<=0.04924763366580012 & pav>=-0.05265270173549652\n",
      "   +5.8812 if cp<=0.4493234395980838 & pa>=0.10671222060918809 & pa>=0.1134915977716446 & pav<=0.08552064299583462 & pav>=-0.035066262632608404\n",
      "   -0.0003 if cp<=0.6084646463394169 & cp>=0.15900577604770666 & cv>=0.6649441838264473 & pa<=0.13059536516666412 & pav>=0.08577578365802775\n",
      "   +1.7741 if pa>=0.14568965137004852\n",
      "  -17.3216 if cp>=2.386007308959961\n",
      "Run episode 415 with rewards 120.0\n",
      "============ 416 ===========\n",
      "127 actions [0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0]\n",
      "   +0.7229 if pav<=0.19076273441314703\n",
      "   +1.5023 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +0.6170 if pa>=-0.0015114990528672934\n",
      "   +3.2511 if cv>=0.671009647846222 & pa>=0.05027810782194139 & pav<=0.0647647328674794\n",
      "   +4.2986 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "  +19.6000 if cp>=2.296234130859375\n",
      "   -3.9469 if pav>=-0.21673575043678284\n",
      "   -7.9895 if pa>=0.12037359923124313\n",
      "   -8.7500 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "   -0.0000 if pa>=0.14750264585018158\n",
      "   +1.0014 if cv>=0.6918205738067628 & pav<=-0.03038508407771587\n",
      "   +0.0000 if cp>=2.399513006210327\n",
      "--------------\n",
      "   -1.3738 if pav<=0.24460948705673222\n",
      "  -14.0378 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -8.1413 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   -2.7420 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +7.5822 if pav>=-0.09002201110124577\n",
      "   -5.9612 if cp<=0.9816968679428103 & cv<=0.7277598142623901 & cv>=0.19991366863250734 & pa>=0.07209430336952209 & pav<=0.2290336310863496 & pav>=0.05907522141933444\n",
      "   +8.7796 if pav>=0.07094108760356906\n",
      "   +8.3070 if cp>=0.15984652936458588 & pa>=0.10311844199895859 & pav<=0.04924763366580012 & pav>=-0.05265270173549652\n",
      "   +7.7608 if cp<=0.4493234395980838 & pa>=0.10671222060918809 & pa>=0.1134915977716446 & pav<=0.08552064299583462 & pav>=-0.035066262632608404\n",
      "   +1.5623 if pa>=0.14568965137004852\n",
      "  +18.4266 if cp>=2.386007308959961\n",
      "   -0.0587 if cv<=1.3230483055114746 & pa<=0.10162533968687057 & pa>=0.07813916802406311 & pav<=0.06761358976364137\n",
      "Run episode 416 with rewards 127.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_21016/4286230475.py:3: RuntimeWarning: overflow encountered in exp\n",
      "  exps = np.exp(all_values)\n",
      "/tmp/ipykernel_21016/4286230475.py:4: RuntimeWarning: overflow encountered in exp\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
      "/tmp/ipykernel_21016/4286230475.py:4: RuntimeWarning: invalid value encountered in divide\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 417 ===========\n",
      "133 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0]\n",
      "  +10.5233 if pav<=0.19076273441314703\n",
      "   +2.3357 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -6.6201 if pa>=-0.0015114990528672934\n",
      "   +6.1723 if cv>=0.671009647846222 & pa>=0.05027810782194139 & pav<=0.0647647328674794\n",
      "   +3.3539 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "   -2.0344 if cp>=2.296234130859375\n",
      "   -8.6455 if pav>=-0.21673575043678284\n",
      "   -4.4722 if pa>=0.12037359923124313\n",
      "   -4.1321 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "   -0.8544 if cv>=0.6918205738067628 & pav<=-0.03038508407771587\n",
      "   +0.0000 if cp>=2.399513006210327\n",
      "   -2.6460 if cv>=1.7891154527664186 & pa>=0.09802673459053039 & pav<=-0.14905341863632202\n",
      "--------------\n",
      "   -0.7880 if pav<=0.24460948705673222\n",
      "  -15.8094 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "  -10.8691 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +0.2614 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +9.1158 if pav>=-0.09002201110124577\n",
      "   -4.4159 if cp<=0.9816968679428103 & cv<=0.7277598142623901 & cv>=0.19991366863250734 & pa>=0.07209430336952209 & pav<=0.2290336310863496 & pav>=0.05907522141933444\n",
      "  +24.0363 if pav>=0.07094108760356906\n",
      "   +1.1269 if cp>=0.15984652936458588 & pa>=0.10311844199895859 & pav<=0.04924763366580012 & pav>=-0.05265270173549652\n",
      "   +0.7713 if cp<=0.4493234395980838 & pa>=0.10671222060918809 & pa>=0.1134915977716446 & pav<=0.08552064299583462 & pav>=-0.035066262632608404\n",
      "   +0.0933 if pa>=0.14568965137004852\n",
      "   +1.1002 if cp>=2.386007308959961\n",
      "   +1.0000 if cp>=2.3784821033477783\n",
      "Run episode 417 with rewards 133.0\n",
      "============ 418 ===========\n",
      "188 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0]\n",
      "   +3.6148 if pav<=0.19076273441314703\n",
      "   +2.3208 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +3.0188 if pa>=-0.0015114990528672934\n",
      "   +1.5041 if cv>=0.671009647846222 & pa>=0.05027810782194139 & pav<=0.0647647328674794\n",
      "   +3.2214 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "  +12.2001 if cp>=2.296234130859375\n",
      "   -8.0181 if pav>=-0.21673575043678284\n",
      "   -5.9564 if pa>=0.12037359923124313\n",
      "   +2.5428 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "   +4.5415 if cv>=0.6918205738067628 & pav<=-0.03038508407771587\n",
      "   -5.7379 if cv>=1.7891154527664186 & pa>=0.09802673459053039 & pav<=-0.14905341863632202\n",
      "   -4.8505 if cv<=1.0507530689239504 & pa>=0.1327274411916733 & pav<=0.07322581559419634\n",
      "--------------\n",
      "   -0.8969 if pav<=0.24460948705673222\n",
      "  -11.8644 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +0.4310 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   -0.3966 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +6.3610 if pav>=-0.09002201110124577\n",
      "   +0.2000 if cp<=0.9816968679428103 & cv<=0.7277598142623901 & cv>=0.19991366863250734 & pa>=0.07209430336952209 & pav<=0.2290336310863496 & pav>=0.05907522141933444\n",
      "   +1.7178 if pav>=0.07094108760356906\n",
      "   +1.7176 if cp>=0.15984652936458588 & pa>=0.10311844199895859 & pav<=0.04924763366580012 & pav>=-0.05265270173549652\n",
      "   +0.5275 if cp<=0.4493234395980838 & pa>=0.10671222060918809 & pa>=0.1134915977716446 & pav<=0.08552064299583462 & pav>=-0.035066262632608404\n",
      "   +0.0002 if cp>=2.386007308959961\n",
      "   +0.0001 if cp>=2.3784821033477783\n",
      "   -2.7631 if pav>=-0.15832958519458767\n",
      "Run episode 418 with rewards 188.0\n",
      "============ 419 ===========\n",
      "120 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1]\n",
      "   +2.1689 if pav<=0.19076273441314703\n",
      "   +2.3859 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -0.4670 if pa>=-0.0015114990528672934\n",
      "   +2.3440 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "  -25.1015 if cp>=2.296234130859375\n",
      "   -6.6219 if pav>=-0.21673575043678284\n",
      "   -2.1179 if pa>=0.12037359923124313\n",
      "   +4.4391 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "   +8.5767 if cv>=0.6918205738067628 & pav<=-0.03038508407771587\n",
      "   -7.1929 if cv>=1.7891154527664186 & pa>=0.09802673459053039 & pav<=-0.14905341863632202\n",
      "   -1.8398 if cv<=1.0507530689239504 & pa>=0.1327274411916733 & pav<=0.07322581559419634\n",
      "   -0.3145 if pa>=0.12797485291957855 & pav<=0.0966734975576401\n",
      "--------------\n",
      "   -0.2232 if pav<=0.24460948705673222\n",
      "  -14.6368 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +6.4759 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   -0.3909 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +9.8909 if pav>=-0.09002201110124577\n",
      "   +0.0907 if cp<=0.9816968679428103 & cv<=0.7277598142623901 & cv>=0.19991366863250734 & pa>=0.07209430336952209 & pav<=0.2290336310863496 & pav>=0.05907522141933444\n",
      "  +12.0805 if pav>=0.07094108760356906\n",
      "   +6.2139 if cp>=0.15984652936458588 & pa>=0.10311844199895859 & pav<=0.04924763366580012 & pav>=-0.05265270173549652\n",
      "   -6.2335 if cp<=0.4493234395980838 & pa>=0.10671222060918809 & pa>=0.1134915977716446 & pav<=0.08552064299583462 & pav>=-0.035066262632608404\n",
      "  +10.1589 if cp>=2.386007308959961\n",
      "   -4.4770 if pav>=-0.15832958519458767\n",
      "   -3.1062 if cp>=0.7997480034828184 & pa<=0.12797485291957855 & pa>=0.09812829941511156 & pav<=-0.015129328705370428\n",
      "Run episode 419 with rewards 120.0\n",
      "============ 420 ===========\n",
      "119 actions [0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0]\n",
      "   +0.2825 if pav<=0.19076273441314703\n",
      "   +3.0359 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -1.1228 if pa>=-0.0015114990528672934\n",
      "   +5.5486 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "  +29.8075 if cp>=2.296234130859375\n",
      "   -5.0387 if pav>=-0.21673575043678284\n",
      "   -0.9742 if pa>=0.12037359923124313\n",
      "   +3.7459 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "   +4.4110 if cv>=0.6918205738067628 & pav<=-0.03038508407771587\n",
      "   +0.0250 if cv>=1.7891154527664186 & pa>=0.09802673459053039 & pav<=-0.14905341863632202\n",
      "   +1.5325 if cv<=1.0507530689239504 & pa>=0.1327274411916733 & pav<=0.07322581559419634\n",
      "   +1.0000 if pa>=0.12465851306915283 & pav<=-0.16428629457950591\n",
      "--------------\n",
      "   -0.5731 if pav<=0.24460948705673222\n",
      "  -10.8281 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +0.3728 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   -1.9091 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +6.0488 if pav>=-0.09002201110124577\n",
      "   +1.3492 if pav>=0.07094108760356906\n",
      "   +5.9438 if cp>=0.15984652936458588 & pa>=0.10311844199895859 & pav<=0.04924763366580012 & pav>=-0.05265270173549652\n",
      "   -3.0972 if cp<=0.4493234395980838 & pa>=0.10671222060918809 & pa>=0.1134915977716446 & pav<=0.08552064299583462 & pav>=-0.035066262632608404\n",
      "   +0.0000 if cp>=2.386007308959961\n",
      "   -2.3062 if pav>=-0.15832958519458767\n",
      "   -2.2559 if cp>=0.7997480034828184 & pa<=0.12797485291957855 & pa>=0.09812829941511156 & pav<=-0.015129328705370428\n",
      "   +3.4330 if cp>=0.634221923351288 & cv<=1.8501845121383667 & pav<=-0.037270663678646086\n",
      "Run episode 420 with rewards 119.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 421 ===========\n",
      "134 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0]\n",
      "   +1.3697 if pav<=0.19076273441314703\n",
      "   +6.7038 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +2.0455 if pa>=-0.0015114990528672934\n",
      "   +0.9961 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "  -17.5972 if cp>=2.296234130859375\n",
      "  -12.3465 if pav>=-0.21673575043678284\n",
      "   -4.5147 if pa>=0.12037359923124313\n",
      "  +12.0341 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "   +9.0691 if cv>=0.6918205738067628 & pav<=-0.03038508407771587\n",
      "   -0.2842 if cv<=1.0507530689239504 & pa>=0.1327274411916733 & pav<=0.07322581559419634\n",
      "   +1.6556 if pa>=0.12465851306915283 & pav<=-0.16428629457950591\n",
      "   +8.6996 if cp<=0.18981581628322605 & cv>=0.17357257902622222 & pav>=0.20544615983963016\n",
      "--------------\n",
      "   -6.0452 if pav<=0.24460948705673222\n",
      "   -9.4154 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -3.0690 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   -2.6358 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +7.4370 if pav>=-0.09002201110124577\n",
      "   +1.4118 if pav>=0.07094108760356906\n",
      "   +2.3241 if cp>=0.15984652936458588 & pa>=0.10311844199895859 & pav<=0.04924763366580012 & pav>=-0.05265270173549652\n",
      "   -2.0024 if cp<=0.4493234395980838 & pa>=0.10671222060918809 & pa>=0.1134915977716446 & pav<=0.08552064299583462 & pav>=-0.035066262632608404\n",
      "   -2.8988 if pav>=-0.15832958519458767\n",
      "   -2.7068 if cp>=0.7997480034828184 & pa<=0.12797485291957855 & pa>=0.09812829941511156 & pav<=-0.015129328705370428\n",
      "   +3.7629 if cp>=0.634221923351288 & cv<=1.8501845121383667 & pav<=-0.037270663678646086\n",
      "   +5.0834 if pav<=0.20544615983963016\n",
      "Run episode 421 with rewards 134.0\n",
      "============ 422 ===========\n",
      "130 actions [0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0]\n",
      "   +1.0535 if pav<=0.19076273441314703\n",
      "   +7.7054 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +0.0000 if pa>=-0.0015114990528672934\n",
      "   +0.0000 if cp<=0.9816968679428103 & cv>=1.252695846557619 & pav<=-0.2042848765850067\n",
      "   +0.0000 if cp>=2.296234130859375\n",
      "  -12.4994 if pav>=-0.21673575043678284\n",
      "   +0.0000 if pa>=0.12037359923124313\n",
      "   +0.0000 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "   +0.0000 if cv>=0.6918205738067628 & pav<=-0.03038508407771587\n",
      "   +0.0000 if pa>=0.12465851306915283 & pav<=-0.16428629457950591\n",
      "   +0.0000 if cp<=0.18981581628322605 & cv>=0.17357257902622222 & pav>=0.20544615983963016\n",
      "   -1.8349 if cv<=0.01230156067758799 & pa>=-0.08508429378271103 & pav<=-0.023137659952044424 & pav>=-0.23292139768600462\n",
      "--------------\n",
      "   -0.8960 if pav<=0.24460948705673222\n",
      "   -8.5509 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +0.0012 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +0.0010 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "   +8.2482 if pav>=-0.09002201110124577\n",
      "   +0.0009 if cp>=0.15984652936458588 & pa>=0.10311844199895859 & pav<=0.04924763366580012 & pav>=-0.05265270173549652\n",
      "   +0.0008 if cp<=0.4493234395980838 & pa>=0.10671222060918809 & pa>=0.1134915977716446 & pav<=0.08552064299583462 & pav>=-0.035066262632608404\n",
      "   -4.4119 if pav>=-0.15832958519458767\n",
      "   +0.0010 if cp>=0.7997480034828184 & pa<=0.12797485291957855 & pa>=0.09812829941511156 & pav<=-0.015129328705370428\n",
      "   +0.0014 if cp>=0.634221923351288 & cv<=1.8501845121383667 & pav<=-0.037270663678646086\n",
      "   -1.1633 if pav<=0.20544615983963016\n",
      "   +1.3215 if pav<=-0.023137659952044424\n",
      "Run episode 422 with rewards 130.0\n",
      "============ 423 ===========\n",
      "115 actions [1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0]\n",
      "   -0.9881 if pav<=0.19076273441314703\n",
      "   +3.4536 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +1.4417 if pa>=-0.0015114990528672934\n",
      "   +0.0000 if cp>=2.296234130859375\n",
      "  -10.8539 if pav>=-0.21673575043678284\n",
      "   +0.0000 if pa>=0.12037359923124313\n",
      "   +0.0000 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "   +0.0000 if cv>=0.6918205738067628 & pav<=-0.03038508407771587\n",
      "   +0.0000 if pa>=0.12465851306915283 & pav<=-0.16428629457950591\n",
      "   +0.0000 if cp<=0.18981581628322605 & cv>=0.17357257902622222 & pav>=0.20544615983963016\n",
      "   -1.0197 if cv<=0.01230156067758799 & pa>=-0.08508429378271103 & pav<=-0.023137659952044424 & pav>=-0.23292139768600462\n",
      "   +4.4877 if cv<=-0.03672660887241363 & pav>=-0.1544262498617172\n",
      "--------------\n",
      "   -1.1896 if pav<=0.24460948705673222\n",
      "  -10.6161 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +0.0000 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +0.0000 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "  +10.8671 if pav>=-0.09002201110124577\n",
      "   +0.0000 if cp>=0.15984652936458588 & pa>=0.10311844199895859 & pav<=0.04924763366580012 & pav>=-0.05265270173549652\n",
      "   -6.4680 if pav>=-0.15832958519458767\n",
      "   +0.0000 if cp>=0.7997480034828184 & pa<=0.12797485291957855 & pa>=0.09812829941511156 & pav<=-0.015129328705370428\n",
      "   +0.0000 if cp>=0.634221923351288 & cv<=1.8501845121383667 & pav<=-0.037270663678646086\n",
      "   -1.3940 if pav<=0.20544615983963016\n",
      "   +3.9248 if pav<=-0.023137659952044424\n",
      "   -4.4406 if cp>=-0.003365041548386215 & cp>=0.03385642990469933 & cv<=-0.03672660887241363 & cv>=-0.23577652871608734 & pa>=-0.06778540164232254 & pav<=-0.009735857695341094\n",
      "Run episode 423 with rewards 115.0\n",
      "============ 424 ===========\n",
      "150 actions [0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   -0.9335 if pav<=0.19076273441314703\n",
      "   +5.2327 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +0.0000 if pa>=-0.0015114990528672934\n",
      "   +0.0000 if cp>=2.296234130859375\n",
      "   -9.1765 if pav>=-0.21673575043678284\n",
      "   +0.0000 if pa>=0.12037359923124313\n",
      "   +0.0000 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "   +0.0000 if cv>=0.6918205738067628 & pav<=-0.03038508407771587\n",
      "   +0.0000 if cp<=0.18981581628322605 & cv>=0.17357257902622222 & pav>=0.20544615983963016\n",
      "   -6.1731 if cv<=0.01230156067758799 & pa>=-0.08508429378271103 & pav<=-0.023137659952044424 & pav>=-0.23292139768600462\n",
      "   +3.0547 if cv<=-0.03672660887241363 & pav>=-0.1544262498617172\n",
      "   -2.1665 if cv<=-0.7518346071243286 & pav>=-0.23082737326622008\n",
      "--------------\n",
      "   -1.2037 if pav<=0.24460948705673222\n",
      "  -10.4424 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -0.0000 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   -0.0000 if cp>=0.1761053204536438 & cv<=1.1169248819351216 & pa>=0.09713529050350189 & pav<=0.052090991288423566 & pav>=-0.23702484369277954\n",
      "  +10.5113 if pav>=-0.09002201110124577\n",
      "   -5.5531 if pav>=-0.15832958519458767\n",
      "   -0.0000 if cp>=0.7997480034828184 & pa<=0.12797485291957855 & pa>=0.09812829941511156 & pav<=-0.015129328705370428\n",
      "   -0.0000 if cp>=0.634221923351288 & cv<=1.8501845121383667 & pav<=-0.037270663678646086\n",
      "   -1.8439 if pav<=0.20544615983963016\n",
      "   +2.7292 if pav<=-0.023137659952044424\n",
      "   -0.0001 if cp>=-0.003365041548386215 & cp>=0.03385642990469933 & cv<=-0.03672660887241363 & cv>=-0.23577652871608734 & pa>=-0.06778540164232254 & pav<=-0.009735857695341094\n",
      "   +3.5140 if cv>=-0.3721600353717804 & pa>=-0.09160481989383697 & pav<=-0.0010380603140219958 & pav>=-0.23082737326622008\n",
      "Run episode 424 with rewards 150.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 425 ===========\n",
      "126 actions [0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0]\n",
      "   -0.1561 if pav<=0.19076273441314703\n",
      "   +7.8899 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   +0.9216 if pa>=-0.0015114990528672934\n",
      "   +0.0000 if cp>=2.296234130859375\n",
      "  -12.9724 if pav>=-0.21673575043678284\n",
      "   +0.0000 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "   +0.0000 if cv>=0.6918205738067628 & pav<=-0.03038508407771587\n",
      "   +0.0000 if cp<=0.18981581628322605 & cv>=0.17357257902622222 & pav>=0.20544615983963016\n",
      "   -4.6744 if cv<=0.01230156067758799 & pa>=-0.08508429378271103 & pav<=-0.023137659952044424 & pav>=-0.23292139768600462\n",
      "   +3.8999 if cv<=-0.03672660887241363 & pav>=-0.1544262498617172\n",
      "   -1.0773 if cv<=-0.7518346071243286 & pav>=-0.23082737326622008\n",
      "   +6.7281 if cp<=0.005269695818424239 & pa<=-0.08916560113430022 & pa>=-0.0962302953004837 & pav<=-0.1148708403110504 & pav>=-0.21949760615825653\n",
      "--------------\n",
      "   +1.0908 if pav<=0.24460948705673222\n",
      "  -12.6924 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +0.0000 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +8.0897 if pav>=-0.09002201110124577\n",
      "   -4.8302 if pav>=-0.15832958519458767\n",
      "   +0.0000 if cp>=0.7997480034828184 & pa<=0.12797485291957855 & pa>=0.09812829941511156 & pav<=-0.015129328705370428\n",
      "   +0.0000 if cp>=0.634221923351288 & cv<=1.8501845121383667 & pav<=-0.037270663678646086\n",
      "   -1.2448 if pav<=0.20544615983963016\n",
      "   +1.2067 if pav<=-0.023137659952044424\n",
      "   +0.0000 if cp>=-0.003365041548386215 & cp>=0.03385642990469933 & cv<=-0.03672660887241363 & cv>=-0.23577652871608734 & pa>=-0.06778540164232254 & pav<=-0.009735857695341094\n",
      "   +5.6318 if cv>=-0.3721600353717804 & pa>=-0.09160481989383697 & pav<=-0.0010380603140219958 & pav>=-0.23082737326622008\n",
      "   +5.1194 if cp>=0.005269695818424239 & pa<=-0.08916560113430022 & pa>=-0.0962302953004837 & pav<=-0.1148708403110504 & pav>=-0.21949760615825653\n",
      "Run episode 425 with rewards 126.0\n",
      "============ 426 ===========\n",
      "500 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.5259 if pav<=0.19076273441314703\n",
      "  +10.7591 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -1.5013 if pa>=-0.0015114990528672934\n",
      "   -0.0000 if cp>=2.296234130859375\n",
      "  -12.2865 if pav>=-0.21673575043678284\n",
      "   -0.0000 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "   -0.0000 if cv>=0.6918205738067628 & pav<=-0.03038508407771587\n",
      "   -0.0000 if cv<=0.01230156067758799 & pa>=-0.08508429378271103 & pav<=-0.023137659952044424 & pav>=-0.23292139768600462\n",
      "   +2.2891 if cv<=-0.03672660887241363 & pav>=-0.1544262498617172\n",
      "   +0.5309 if cv<=-0.7518346071243286 & pav>=-0.23082737326622008\n",
      "   -0.0000 if cp<=0.005269695818424239 & pa<=-0.08916560113430022 & pa>=-0.0962302953004837 & pav<=-0.1148708403110504 & pav>=-0.21949760615825653\n",
      "   -3.4417 if cp<=0.08225484937429428 & cv<=0.20080436766147616 & cv<=0.38548803329467773 & cv>=0.01071805227547884 & pa>=0.03449692204594612\n",
      "--------------\n",
      "   -3.6327 if pav<=0.24460948705673222\n",
      "  -11.9173 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   -0.0000 if pa>=0.08103863745927811 & pav>=0.043705208599567516\n",
      "   +9.0358 if pav>=-0.09002201110124577\n",
      "   -0.5970 if pav>=-0.15832958519458767\n",
      "   -0.0000 if cp>=0.634221923351288 & cv<=1.8501845121383667 & pav<=-0.037270663678646086\n",
      "   -3.6730 if pav<=0.20544615983963016\n",
      "   +4.7484 if pav<=-0.023137659952044424\n",
      "   -0.0000 if cp>=-0.003365041548386215 & cp>=0.03385642990469933 & cv<=-0.03672660887241363 & cv>=-0.23577652871608734 & pa>=-0.06778540164232254 & pav<=-0.009735857695341094\n",
      "   +5.3644 if cv>=-0.3721600353717804 & pa>=-0.09160481989383697 & pav<=-0.0010380603140219958 & pav>=-0.23082737326622008\n",
      "   -0.0000 if cp>=0.005269695818424239 & pa<=-0.08916560113430022 & pa>=-0.0962302953004837 & pav<=-0.1148708403110504 & pav>=-0.21949760615825653\n",
      "   -7.0024 if cp<=0.08225484937429428 & cv>=0.01071805227547884 & pa<=0.03449692204594612\n",
      "Run episode 426 with rewards 500.0\n",
      "best\n",
      "============ 427 ===========\n",
      "388 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0]\n",
      "   +0.8286 if pav<=0.19076273441314703\n",
      "  +11.0257 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -2.8419 if pa>=-0.0015114990528672934\n",
      "   +0.0000 if cp>=2.296234130859375\n",
      "  -12.5207 if pav>=-0.21673575043678284\n",
      "   +0.0000 if cv<=1.1020641803741456 & pa>=0.10671222060918809 & pav<=0.23113564848899845 & pav>=-0.035066262632608404\n",
      "   -0.4556 if cv<=0.01230156067758799 & pa>=-0.08508429378271103 & pav<=-0.023137659952044424 & pav>=-0.23292139768600462\n",
      "   +2.3907 if cv<=-0.03672660887241363 & pav>=-0.1544262498617172\n",
      "   -0.9900 if cv<=-0.7518346071243286 & pav>=-0.23082737326622008\n",
      "   +0.0000 if cp<=0.005269695818424239 & pa<=-0.08916560113430022 & pa>=-0.0962302953004837 & pav<=-0.1148708403110504 & pav>=-0.21949760615825653\n",
      "   +0.2996 if cp<=0.08225484937429428 & cv<=0.20080436766147616 & cv<=0.38548803329467773 & cv>=0.01071805227547884 & pa>=0.03449692204594612\n",
      "   +2.1518 if cp<=-0.4500594079494473 & cv<=-0.571373462677002 & pa<=0.07155385911464696 & pav<=0.17903927564620983 & pav>=-0.21598759591579436\n",
      "--------------\n",
      "   -3.0543 if pav<=0.24460948705673222\n",
      "  -14.0023 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +9.7695 if pav>=-0.09002201110124577\n",
      "   +0.6401 if pav>=-0.15832958519458767\n",
      "   -4.9592 if cp>=0.634221923351288 & cv<=1.8501845121383667 & pav<=-0.037270663678646086\n",
      "   -6.2236 if pav<=0.20544615983963016\n",
      "   +8.5706 if pav<=-0.023137659952044424\n",
      "   +0.0000 if cp>=-0.003365041548386215 & cp>=0.03385642990469933 & cv<=-0.03672660887241363 & cv>=-0.23577652871608734 & pa>=-0.06778540164232254 & pav<=-0.009735857695341094\n",
      "   +6.3855 if cv>=-0.3721600353717804 & pa>=-0.09160481989383697 & pav<=-0.0010380603140219958 & pav>=-0.23082737326622008\n",
      "   +0.0000 if cp>=0.005269695818424239 & pa<=-0.08916560113430022 & pa>=-0.0962302953004837 & pav<=-0.1148708403110504 & pav>=-0.21949760615825653\n",
      "   -6.5336 if cp<=0.08225484937429428 & cv>=0.01071805227547884 & pa<=0.03449692204594612\n",
      "   -1.2470 if cp<=-0.4500594079494473 & pa<=-0.0017869767267256898 & pav<=0.17903927564620983 & pav>=0.060604631900787374\n",
      "Run episode 427 with rewards 388.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============ 428 ===========\n",
      "340 actions [0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.0965 if pav<=0.19076273441314703\n",
      "  +10.8027 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -3.5908 if pa>=-0.0015114990528672934\n",
      "   +0.0000 if cp>=2.296234130859375\n",
      "  -11.0574 if pav>=-0.21673575043678284\n",
      "   +0.3661 if cv<=0.01230156067758799 & pa>=-0.08508429378271103 & pav<=-0.023137659952044424 & pav>=-0.23292139768600462\n",
      "   +3.4799 if cv<=-0.03672660887241363 & pav>=-0.1544262498617172\n",
      "   -0.3574 if cv<=-0.7518346071243286 & pav>=-0.23082737326622008\n",
      "   +0.0000 if cp<=0.005269695818424239 & pa<=-0.08916560113430022 & pa>=-0.0962302953004837 & pav<=-0.1148708403110504 & pav>=-0.21949760615825653\n",
      "   +0.4288 if cp<=0.08225484937429428 & cv<=0.20080436766147616 & cv<=0.38548803329467773 & cv>=0.01071805227547884 & pa>=0.03449692204594612\n",
      "   +2.0934 if cp<=-0.4500594079494473 & cv<=-0.571373462677002 & pa<=0.07155385911464696 & pav<=0.17903927564620983 & pav>=-0.21598759591579436\n",
      "   -1.4561 if pav>=-0.19589755833148956\n",
      "--------------\n",
      "   -2.8157 if pav<=0.24460948705673222\n",
      "  -13.5220 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +7.0274 if pav>=-0.09002201110124577\n",
      "   +2.9193 if pav>=-0.15832958519458767\n",
      "   +0.0215 if cp>=0.634221923351288 & cv<=1.8501845121383667 & pav<=-0.037270663678646086\n",
      "   -5.6531 if pav<=0.20544615983963016\n",
      "   +6.3130 if pav<=-0.023137659952044424\n",
      "   +7.1683 if cv>=-0.3721600353717804 & pa>=-0.09160481989383697 & pav<=-0.0010380603140219958 & pav>=-0.23082737326622008\n",
      "   +0.0000 if cp>=0.005269695818424239 & pa<=-0.08916560113430022 & pa>=-0.0962302953004837 & pav<=-0.1148708403110504 & pav>=-0.21949760615825653\n",
      "   -5.3056 if cp<=0.08225484937429428 & cv>=0.01071805227547884 & pa<=0.03449692204594612\n",
      "   -1.6137 if cp<=-0.4500594079494473 & pa<=-0.0017869767267256898 & pav<=0.17903927564620983 & pav>=0.060604631900787374\n",
      "   +4.6788 if cp>=-1.022295570373535 & cv<=-0.5275522708892822 & cv<=0.008957441709935666 & pa>=0.0045568111352622545 & pa>=0.021748847886919977 & pav<=0.25550577640533456\n",
      "Run episode 428 with rewards 340.0\n",
      "============ 429 ===========\n",
      "218 actions [0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1]\n",
      "   +0.0160 if pav<=0.19076273441314703\n",
      "  +11.3760 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -3.5148 if pa>=-0.0015114990528672934\n",
      "  -11.3567 if pav>=-0.21673575043678284\n",
      "   +0.0085 if cv<=0.01230156067758799 & pa>=-0.08508429378271103 & pav<=-0.023137659952044424 & pav>=-0.23292139768600462\n",
      "   +5.9333 if cv<=-0.03672660887241363 & pav>=-0.1544262498617172\n",
      "   -1.2572 if cv<=-0.7518346071243286 & pav>=-0.23082737326622008\n",
      "   +0.0000 if cp<=0.005269695818424239 & pa<=-0.08916560113430022 & pa>=-0.0962302953004837 & pav<=-0.1148708403110504 & pav>=-0.21949760615825653\n",
      "   -0.1877 if cp<=0.08225484937429428 & cv<=0.20080436766147616 & cv<=0.38548803329467773 & cv>=0.01071805227547884 & pa>=0.03449692204594612\n",
      "   +2.9726 if cp<=-0.4500594079494473 & cv<=-0.571373462677002 & pa<=0.07155385911464696 & pav<=0.17903927564620983 & pav>=-0.21598759591579436\n",
      "   -1.1750 if pav>=-0.19589755833148956\n",
      "   -1.6419 if cv<=0.0398288331925869 & pav>=-0.14578897058963777\n",
      "--------------\n",
      "   +0.3949 if pav<=0.24460948705673222\n",
      "  -11.1457 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +4.8235 if pav>=-0.09002201110124577\n",
      "   +3.1394 if pav>=-0.15832958519458767\n",
      "   -0.0000 if cp>=0.634221923351288 & cv<=1.8501845121383667 & pav<=-0.037270663678646086\n",
      "   -8.2076 if pav<=0.20544615983963016\n",
      "   +3.0857 if pav<=-0.023137659952044424\n",
      "   +7.2404 if cv>=-0.3721600353717804 & pa>=-0.09160481989383697 & pav<=-0.0010380603140219958 & pav>=-0.23082737326622008\n",
      "   -3.7874 if cp<=0.08225484937429428 & cv>=0.01071805227547884 & pa<=0.03449692204594612\n",
      "   -1.9693 if cp<=-0.4500594079494473 & pa<=-0.0017869767267256898 & pav<=0.17903927564620983 & pav>=0.060604631900787374\n",
      "   -0.0007 if cp>=-1.022295570373535 & cv<=-0.5275522708892822 & cv<=0.008957441709935666 & pa>=0.0045568111352622545 & pa>=0.021748847886919977 & pav<=0.25550577640533456\n",
      "   +3.2550 if cp<=-0.00029016217449678286 & cp>=-0.022550329193472864 & cv<=0.0398288331925869 & pa>=-0.01158604193478823 & pav<=0.061660340428352486\n",
      "Run episode 429 with rewards 218.0\n",
      "============ 430 ===========\n",
      "500 actions [0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1]\n",
      "   +0.8138 if pav<=0.19076273441314703\n",
      "  +13.8684 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -5.1985 if pa>=-0.0015114990528672934\n",
      "   -8.6443 if pav>=-0.21673575043678284\n",
      "   +0.3917 if cv<=0.01230156067758799 & pa>=-0.08508429378271103 & pav<=-0.023137659952044424 & pav>=-0.23292139768600462\n",
      "   +5.4864 if cv<=-0.03672660887241363 & pav>=-0.1544262498617172\n",
      "   -3.0484 if cv<=-0.7518346071243286 & pav>=-0.23082737326622008\n",
      "   -0.3068 if cp<=0.08225484937429428 & cv<=0.20080436766147616 & cv<=0.38548803329467773 & cv>=0.01071805227547884 & pa>=0.03449692204594612\n",
      "   +7.2811 if cp<=-0.4500594079494473 & cv<=-0.571373462677002 & pa<=0.07155385911464696 & pav<=0.17903927564620983 & pav>=-0.21598759591579436\n",
      "   -6.7602 if pav>=-0.19589755833148956\n",
      "   +0.2662 if cv<=0.0398288331925869 & pav>=-0.14578897058963777\n",
      "   +2.5242 if cp<=0.2860182881355287 & cp>=0.117185239493847 & cv>=0.31940749883651737 & pa>=-0.03374017179012294 & pav<=0.08734904229640963 & pav>=-0.15420448184013366\n",
      "--------------\n",
      "   -4.2355 if pav<=0.24460948705673222\n",
      "   -8.1878 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +7.0667 if pav>=-0.09002201110124577\n",
      "   +4.2082 if pav>=-0.15832958519458767\n",
      "   -6.9833 if pav<=0.20544615983963016\n",
      "   +6.8302 if pav<=-0.023137659952044424\n",
      "   +5.2202 if cv>=-0.3721600353717804 & pa>=-0.09160481989383697 & pav<=-0.0010380603140219958 & pav>=-0.23082737326622008\n",
      "   -2.7073 if cp<=0.08225484937429428 & cv>=0.01071805227547884 & pa<=0.03449692204594612\n",
      "   -0.8640 if cp<=-0.4500594079494473 & pa<=-0.0017869767267256898 & pav<=0.17903927564620983 & pav>=0.060604631900787374\n",
      "   +0.0000 if cp>=-1.022295570373535 & cv<=-0.5275522708892822 & cv<=0.008957441709935666 & pa>=0.0045568111352622545 & pa>=0.021748847886919977 & pav<=0.25550577640533456\n",
      "   +0.0001 if cp<=-0.00029016217449678286 & cp>=-0.022550329193472864 & cv<=0.0398288331925869 & pa>=-0.01158604193478823 & pav<=0.061660340428352486\n",
      "   -2.8477 if pav<=0.08734904229640963\n",
      "Run episode 430 with rewards 500.0\n",
      "best\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "origin 6245.489225713024 new 260385.92317042308 not updated\n",
      "============ 431 ===========\n",
      "500 actions [0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1]\n",
      "   +0.8138 if pav<=0.19076273441314703\n",
      "  +13.8684 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -5.1985 if pa>=-0.0015114990528672934\n",
      "   -8.6443 if pav>=-0.21673575043678284\n",
      "   +0.3917 if cv<=0.01230156067758799 & pa>=-0.08508429378271103 & pav<=-0.023137659952044424 & pav>=-0.23292139768600462\n",
      "   +5.4864 if cv<=-0.03672660887241363 & pav>=-0.1544262498617172\n",
      "   -3.0484 if cv<=-0.7518346071243286 & pav>=-0.23082737326622008\n",
      "   -0.3068 if cp<=0.08225484937429428 & cv<=0.20080436766147616 & cv<=0.38548803329467773 & cv>=0.01071805227547884 & pa>=0.03449692204594612\n",
      "   +7.2811 if cp<=-0.4500594079494473 & cv<=-0.571373462677002 & pa<=0.07155385911464696 & pav<=0.17903927564620983 & pav>=-0.21598759591579436\n",
      "   -6.7602 if pav>=-0.19589755833148956\n",
      "   +0.2662 if cv<=0.0398288331925869 & pav>=-0.14578897058963777\n",
      "   +2.5242 if cp<=0.2860182881355287 & cp>=0.117185239493847 & cv>=0.31940749883651737 & pa>=-0.03374017179012294 & pav<=0.08734904229640963 & pav>=-0.15420448184013366\n",
      "--------------\n",
      "   -1.0736 if pav<=0.24460948705673222\n",
      "   -7.8067 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +7.7101 if pav>=-0.09002201110124577\n",
      "   +3.5541 if pav>=-0.15832958519458767\n",
      "   -9.9289 if pav<=0.20544615983963016\n",
      "   +5.3843 if pav<=-0.023137659952044424\n",
      "   +6.9675 if cv>=-0.3721600353717804 & pa>=-0.09160481989383697 & pav<=-0.0010380603140219958 & pav>=-0.23082737326622008\n",
      "   -2.6571 if cp<=0.08225484937429428 & cv>=0.01071805227547884 & pa<=0.03449692204594612\n",
      "   +0.0347 if cp<=-0.4500594079494473 & pa<=-0.0017869767267256898 & pav<=0.17903927564620983 & pav>=0.060604631900787374\n",
      "   -1.5263 if cp<=-0.00029016217449678286 & cp>=-0.022550329193472864 & cv<=0.0398288331925869 & pa>=-0.01158604193478823 & pav<=0.061660340428352486\n",
      "   -3.6146 if pav<=0.08734904229640963\n",
      "   +4.6077 if pa>=0.07008213549852371\n",
      "Run episode 431 with rewards 500.0\n",
      "best\n",
      "============ 432 ===========\n",
      "500 actions [0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1]\n",
      "   +1.7565 if pav<=0.19076273441314703\n",
      "  +13.0517 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -4.7577 if pa>=-0.0015114990528672934\n",
      "   -8.1197 if pav>=-0.21673575043678284\n",
      "   +0.7959 if cv<=0.01230156067758799 & pa>=-0.08508429378271103 & pav<=-0.023137659952044424 & pav>=-0.23292139768600462\n",
      "   +4.9188 if cv<=-0.03672660887241363 & pav>=-0.1544262498617172\n",
      "   -0.9646 if cv<=-0.7518346071243286 & pav>=-0.23082737326622008\n",
      "   -1.1397 if cp<=0.08225484937429428 & cv<=0.20080436766147616 & cv<=0.38548803329467773 & cv>=0.01071805227547884 & pa>=0.03449692204594612\n",
      "   +2.8314 if cp<=-0.4500594079494473 & cv<=-0.571373462677002 & pa<=0.07155385911464696 & pav<=0.17903927564620983 & pav>=-0.21598759591579436\n",
      "   -7.0858 if pav>=-0.19589755833148956\n",
      "   +0.0025 if cp<=0.2860182881355287 & cp>=0.117185239493847 & cv>=0.31940749883651737 & pa>=-0.03374017179012294 & pav<=0.08734904229640963 & pav>=-0.15420448184013366\n",
      "   -6.2872 if cp>=0.11891164332628266 & cv>=0.00946156978607181 & pa>=0.006182188075035811 & pav>=-0.1704284697771072\n",
      "--------------\n",
      "   -3.9449 if pav<=0.24460948705673222\n",
      "   -7.1640 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +9.0613 if pav>=-0.09002201110124577\n",
      "   +4.7274 if pav>=-0.15832958519458767\n",
      "   -8.0554 if pav<=0.20544615983963016\n",
      "   +7.0645 if pav<=-0.023137659952044424\n",
      "   +6.8311 if cv>=-0.3721600353717804 & pa>=-0.09160481989383697 & pav<=-0.0010380603140219958 & pav>=-0.23082737326622008\n",
      "   -4.4334 if cp<=0.08225484937429428 & cv>=0.01071805227547884 & pa<=0.03449692204594612\n",
      "   -0.0006 if cp<=-0.00029016217449678286 & cp>=-0.022550329193472864 & cv<=0.0398288331925869 & pa>=-0.01158604193478823 & pav<=0.061660340428352486\n",
      "   -4.8481 if pav<=0.08734904229640963\n",
      "   +2.1434 if pa>=0.07008213549852371\n",
      "   -1.3847 if cv<=0.19191737174987794 & pav>=-0.1704284697771072\n",
      "Run episode 432 with rewards 500.0\n",
      "best\n",
      "origin 6645.011788559728 new 259904.7329818129 not updated\n",
      "origin 6644.361022409434 new 261223.65146883056 not updated\n",
      "============ 433 ===========\n",
      "389 actions [0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +1.7565 if pav<=0.19076273441314703\n",
      "  +13.0517 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -4.7577 if pa>=-0.0015114990528672934\n",
      "   -8.1197 if pav>=-0.21673575043678284\n",
      "   +0.7959 if cv<=0.01230156067758799 & pa>=-0.08508429378271103 & pav<=-0.023137659952044424 & pav>=-0.23292139768600462\n",
      "   +4.9188 if cv<=-0.03672660887241363 & pav>=-0.1544262498617172\n",
      "   -0.9646 if cv<=-0.7518346071243286 & pav>=-0.23082737326622008\n",
      "   -1.1397 if cp<=0.08225484937429428 & cv<=0.20080436766147616 & cv<=0.38548803329467773 & cv>=0.01071805227547884 & pa>=0.03449692204594612\n",
      "   +2.8314 if cp<=-0.4500594079494473 & cv<=-0.571373462677002 & pa<=0.07155385911464696 & pav<=0.17903927564620983 & pav>=-0.21598759591579436\n",
      "   -7.0858 if pav>=-0.19589755833148956\n",
      "   +0.0025 if cp<=0.2860182881355287 & cp>=0.117185239493847 & cv>=0.31940749883651737 & pa>=-0.03374017179012294 & pav<=0.08734904229640963 & pav>=-0.15420448184013366\n",
      "   -6.2872 if cp>=0.11891164332628266 & cv>=0.00946156978607181 & pa>=0.006182188075035811 & pav>=-0.1704284697771072\n",
      "--------------\n",
      "   -3.9449 if pav<=0.24460948705673222\n",
      "   -7.1640 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +9.0613 if pav>=-0.09002201110124577\n",
      "   +4.7274 if pav>=-0.15832958519458767\n",
      "   -8.0554 if pav<=0.20544615983963016\n",
      "   +7.0645 if pav<=-0.023137659952044424\n",
      "   +6.8311 if cv>=-0.3721600353717804 & pa>=-0.09160481989383697 & pav<=-0.0010380603140219958 & pav>=-0.23082737326622008\n",
      "   -4.4334 if cp<=0.08225484937429428 & cv>=0.01071805227547884 & pa<=0.03449692204594612\n",
      "   -0.0006 if cp<=-0.00029016217449678286 & cp>=-0.022550329193472864 & cv<=0.0398288331925869 & pa>=-0.01158604193478823 & pav<=0.061660340428352486\n",
      "   -4.8481 if pav<=0.08734904229640963\n",
      "   +2.1434 if pa>=0.07008213549852371\n",
      "   -1.3847 if cv<=0.19191737174987794 & pav>=-0.1704284697771072\n",
      "Run episode 433 with rewards 389.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "origin 2775.7966576498825 new 192674.90285894228 not updated\n",
      "============ 434 ===========\n",
      "500 actions [1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]\n",
      "   +0.1730 if pav<=0.19076273441314703\n",
      "  +11.7446 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -4.7741 if pa>=-0.0015114990528672934\n",
      "   -6.7524 if pav>=-0.21673575043678284\n",
      "   +0.1119 if cv<=0.01230156067758799 & pa>=-0.08508429378271103 & pav<=-0.023137659952044424 & pav>=-0.23292139768600462\n",
      "   +3.8186 if cv<=-0.03672660887241363 & pav>=-0.1544262498617172\n",
      "   -1.1369 if cv<=-0.7518346071243286 & pav>=-0.23082737326622008\n",
      "   -2.6605 if cp<=0.08225484937429428 & cv<=0.20080436766147616 & cv<=0.38548803329467773 & cv>=0.01071805227547884 & pa>=0.03449692204594612\n",
      "   +4.0722 if cp<=-0.4500594079494473 & cv<=-0.571373462677002 & pa<=0.07155385911464696 & pav<=0.17903927564620983 & pav>=-0.21598759591579436\n",
      "   -5.7787 if pav>=-0.19589755833148956\n",
      "   +0.0006 if cp>=0.11891164332628266 & cv>=0.00946156978607181 & pa>=0.006182188075035811 & pav>=-0.1704284697771072\n",
      "   +2.4487 if cp<=-0.26036535501480085 & cp>=-0.5987647056579589 & pa>=0.038168987631797796 & pav<=0.21498430073261263 & pav>=-0.20625107586383817\n",
      "--------------\n",
      "   -3.9449 if pav<=0.24460948705673222\n",
      "   -7.1640 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +9.0613 if pav>=-0.09002201110124577\n",
      "   +4.7274 if pav>=-0.15832958519458767\n",
      "   -8.0554 if pav<=0.20544615983963016\n",
      "   +7.0645 if pav<=-0.023137659952044424\n",
      "   +6.8311 if cv>=-0.3721600353717804 & pa>=-0.09160481989383697 & pav<=-0.0010380603140219958 & pav>=-0.23082737326622008\n",
      "   -4.4334 if cp<=0.08225484937429428 & cv>=0.01071805227547884 & pa<=0.03449692204594612\n",
      "   -0.0006 if cp<=-0.00029016217449678286 & cp>=-0.022550329193472864 & cv<=0.0398288331925869 & pa>=-0.01158604193478823 & pav<=0.061660340428352486\n",
      "   -4.8481 if pav<=0.08734904229640963\n",
      "   +2.1434 if pa>=0.07008213549852371\n",
      "   -1.3847 if cv<=0.19191737174987794 & pav>=-0.1704284697771072\n",
      "Run episode 434 with rewards 500.0\n",
      "best\n",
      "origin 6768.4933347304195 new 263893.5811922646 not updated\n",
      "============ 435 ===========\n",
      "500 actions [0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1]\n",
      "   +0.1617 if pav<=0.19076273441314703\n",
      "   +9.0703 if cp<=0.22202084362506871 & pa<=0.09762744754552842 & pav>=-0.14960525333881372\n",
      "   -4.1787 if pa>=-0.0015114990528672934\n",
      "   -5.9555 if pav>=-0.21673575043678284\n",
      "   +0.7352 if cv<=0.01230156067758799 & pa>=-0.08508429378271103 & pav<=-0.023137659952044424 & pav>=-0.23292139768600462\n",
      "   +4.5669 if cv<=-0.03672660887241363 & pav>=-0.1544262498617172\n",
      "   +0.0004 if cv<=-0.7518346071243286 & pav>=-0.23082737326622008\n",
      "   +0.0015 if cp<=0.08225484937429428 & cv<=0.20080436766147616 & cv<=0.38548803329467773 & cv>=0.01071805227547884 & pa>=0.03449692204594612\n",
      "   +0.0014 if cp<=-0.4500594079494473 & cv<=-0.571373462677002 & pa<=0.07155385911464696 & pav<=0.17903927564620983 & pav>=-0.21598759591579436\n",
      "   -7.9348 if pav>=-0.19589755833148956\n",
      "   +0.0008 if cp<=-0.26036535501480085 & cp>=-0.5987647056579589 & pa>=0.038168987631797796 & pav<=0.21498430073261263 & pav>=-0.20625107586383817\n",
      "   +2.5355 if pav>=-0.12721649706363677\n",
      "--------------\n",
      "   -3.9449 if pav<=0.24460948705673222\n",
      "   -7.1640 if cp<=0.6052873730659485 & pav<=0.0543186292052269\n",
      "   +9.0613 if pav>=-0.09002201110124577\n",
      "   +4.7274 if pav>=-0.15832958519458767\n",
      "   -8.0554 if pav<=0.20544615983963016\n",
      "   +7.0645 if pav<=-0.023137659952044424\n",
      "   +6.8311 if cv>=-0.3721600353717804 & pa>=-0.09160481989383697 & pav<=-0.0010380603140219958 & pav>=-0.23082737326622008\n",
      "   -4.4334 if cp<=0.08225484937429428 & cv>=0.01071805227547884 & pa<=0.03449692204594612\n",
      "   -0.0006 if cp<=-0.00029016217449678286 & cp>=-0.022550329193472864 & cv<=0.0398288331925869 & pa>=-0.01158604193478823 & pav<=0.061660340428352486\n",
      "   -4.8481 if pav<=0.08734904229640963\n",
      "   +2.1434 if pa>=0.07008213549852371\n",
      "   -1.3847 if cv<=0.19191737174987794 & pav>=-0.1704284697771072\n",
      "Run episode 435 with rewards 500.0\n",
      "best\n",
      "\n",
      "Done\n"
     ]
    }
   ],
   "source": [
    "rewards = train()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "3d20e8e0",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Print the `rules_` attribute of each entry of `actor.best_model`,\n",
    "# visiting one entry per index in range(action_space).\n",
    "for action_index in range(action_space):\n",
    "    model = actor.best_model[action_index]\n",
    "    print(model.rules_)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "id": "0b443f87",
   "metadata": {},
   "outputs": [],
   "source": [
    "def test(num_test_episodes=100, max_steps=9999):\n",
    "    \"\"\"\n",
    "    Evaluate the trained actor with a greedy (arg-max) policy.\n",
    "\n",
    "    Relies on the notebook-level globals `env`, `actor` and `column_names`.\n",
    "    At every step the current state is wrapped in a one-row DataFrame, passed\n",
    "    to `actor.predict`, and the index of the largest returned value is used\n",
    "    as the action.\n",
    "\n",
    "    Args:\n",
    "        num_test_episodes (int): Number of episodes to run; must be positive.\n",
    "        max_steps (int): Upper bound on the number of steps per episode. The\n",
    "            default keeps the cap that used to be hard-coded as range(1, 10000).\n",
    "\n",
    "    Returns:\n",
    "        float: Average reward over the test episodes.\n",
    "\n",
    "    Raises:\n",
    "        ValueError: If num_test_episodes is not positive; the average would\n",
    "            otherwise be a division by zero or a meaningless value.\n",
    "    \"\"\"\n",
    "    if num_test_episodes <= 0:\n",
    "        raise ValueError(f\"num_test_episodes must be positive, got {num_test_episodes}\")\n",
    "\n",
    "    total_reward = 0.0\n",
    "\n",
    "    for episode in range(num_test_episodes):\n",
    "        state = env.reset()[0]  # first element of reset()'s result is the initial state\n",
    "        episode_reward = 0.0\n",
    "\n",
    "        for _ in range(max_steps):\n",
    "            # Wrap the single state as a one-row frame with the named feature columns\n",
    "            state_frame = pd.DataFrame(np.array([state]), columns=column_names)\n",
    "            action_scores = actor.predict(state_frame)\n",
    "            # Greedy choice: index of the largest predicted value\n",
    "            action = np.argmax(action_scores)\n",
    "            next_state, reward, done, trunc, _info = env.step(action)\n",
    "            episode_reward += reward\n",
    "            if done or trunc:\n",
    "                break\n",
    "            state = next_state\n",
    "\n",
    "        total_reward += episode_reward\n",
    "        print(f\"Test Episode {episode + 1}, Reward: {episode_reward}\")\n",
    "\n",
    "    avg_reward = total_reward / num_test_episodes\n",
    "    print(f\"\\nAverage Reward over {num_test_episodes} Test Episodes: {avg_reward}\")\n",
    "    return avg_reward"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "id": "ef9e3e26",
   "metadata": {
    "scrolled": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Test Episode 1, Reward: 500.0\n",
      "Test Episode 2, Reward: 500.0\n",
      "Test Episode 3, Reward: 460.0\n",
      "Test Episode 4, Reward: 500.0\n",
      "Test Episode 5, Reward: 500.0\n",
      "Test Episode 6, Reward: 500.0\n",
      "Test Episode 7, Reward: 500.0\n",
      "Test Episode 8, Reward: 500.0\n",
      "Test Episode 9, Reward: 500.0\n",
      "Test Episode 10, Reward: 500.0\n",
      "Test Episode 11, Reward: 500.0\n",
      "Test Episode 12, Reward: 500.0\n",
      "Test Episode 13, Reward: 500.0\n",
      "Test Episode 14, Reward: 500.0\n",
      "Test Episode 15, Reward: 500.0\n",
      "Test Episode 16, Reward: 500.0\n",
      "Test Episode 17, Reward: 418.0\n",
      "Test Episode 18, Reward: 500.0\n",
      "Test Episode 19, Reward: 500.0\n",
      "Test Episode 20, Reward: 500.0\n",
      "Test Episode 21, Reward: 500.0\n",
      "Test Episode 22, Reward: 500.0\n",
      "Test Episode 23, Reward: 500.0\n",
      "Test Episode 24, Reward: 492.0\n",
      "Test Episode 25, Reward: 500.0\n",
      "Test Episode 26, Reward: 500.0\n",
      "Test Episode 27, Reward: 490.0\n",
      "Test Episode 28, Reward: 500.0\n",
      "Test Episode 29, Reward: 500.0\n",
      "Test Episode 30, Reward: 500.0\n",
      "Test Episode 31, Reward: 500.0\n",
      "Test Episode 32, Reward: 500.0\n",
      "Test Episode 33, Reward: 500.0\n",
      "Test Episode 34, Reward: 500.0\n",
      "Test Episode 35, Reward: 500.0\n",
      "Test Episode 36, Reward: 500.0\n",
      "Test Episode 37, Reward: 500.0\n",
      "Test Episode 38, Reward: 500.0\n",
      "Test Episode 39, Reward: 500.0\n",
      "Test Episode 40, Reward: 500.0\n",
      "Test Episode 41, Reward: 500.0\n",
      "Test Episode 42, Reward: 500.0\n",
      "Test Episode 43, Reward: 226.0\n",
      "Test Episode 44, Reward: 246.0\n",
      "Test Episode 45, Reward: 500.0\n",
      "Test Episode 46, Reward: 500.0\n",
      "Test Episode 47, Reward: 500.0\n",
      "Test Episode 48, Reward: 500.0\n",
      "Test Episode 49, Reward: 500.0\n",
      "Test Episode 50, Reward: 500.0\n",
      "Test Episode 51, Reward: 407.0\n",
      "Test Episode 52, Reward: 458.0\n",
      "Test Episode 53, Reward: 500.0\n",
      "Test Episode 54, Reward: 500.0\n",
      "Test Episode 55, Reward: 500.0\n",
      "Test Episode 56, Reward: 500.0\n",
      "Test Episode 57, Reward: 500.0\n",
      "Test Episode 58, Reward: 500.0\n",
      "Test Episode 59, Reward: 500.0\n",
      "Test Episode 60, Reward: 500.0\n",
      "Test Episode 61, Reward: 470.0\n",
      "Test Episode 62, Reward: 500.0\n",
      "Test Episode 63, Reward: 500.0\n",
      "Test Episode 64, Reward: 500.0\n",
      "Test Episode 65, Reward: 500.0\n",
      "Test Episode 66, Reward: 500.0\n",
      "Test Episode 67, Reward: 500.0\n",
      "Test Episode 68, Reward: 500.0\n",
      "Test Episode 69, Reward: 500.0\n",
      "Test Episode 70, Reward: 500.0\n",
      "Test Episode 71, Reward: 500.0\n",
      "Test Episode 72, Reward: 500.0\n",
      "Test Episode 73, Reward: 500.0\n",
      "Test Episode 74, Reward: 485.0\n",
      "Test Episode 75, Reward: 214.0\n",
      "Test Episode 76, Reward: 500.0\n",
      "Test Episode 77, Reward: 499.0\n",
      "Test Episode 78, Reward: 479.0\n",
      "Test Episode 79, Reward: 500.0\n",
      "Test Episode 80, Reward: 500.0\n",
      "Test Episode 81, Reward: 500.0\n",
      "Test Episode 82, Reward: 500.0\n",
      "Test Episode 83, Reward: 500.0\n",
      "Test Episode 84, Reward: 500.0\n",
      "Test Episode 85, Reward: 500.0\n",
      "Test Episode 86, Reward: 500.0\n",
      "Test Episode 87, Reward: 494.0\n",
      "Test Episode 88, Reward: 500.0\n",
      "Test Episode 89, Reward: 500.0\n",
      "Test Episode 90, Reward: 500.0\n",
      "Test Episode 91, Reward: 500.0\n",
      "Test Episode 92, Reward: 500.0\n",
      "Test Episode 93, Reward: 500.0\n",
      "Test Episode 94, Reward: 500.0\n",
      "Test Episode 95, Reward: 500.0\n",
      "Test Episode 96, Reward: 500.0\n",
      "Test Episode 97, Reward: 500.0\n",
      "Test Episode 98, Reward: 214.0\n",
      "Test Episode 99, Reward: 500.0\n",
      "Test Episode 100, Reward: 500.0\n",
      "\n",
      "Average Reward over 100 Test Episodes: 485.52\n"
     ]
    }
   ],
   "source": [
    "avg_test_reward = test(num_test_episodes=100)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "id": "31340922",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<matplotlib.lines.Line2D at 0x7fa153827610>]"
      ]
     },
     "execution_count": 27,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXcAAAD4CAYAAAAXUaZHAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8qNh9FAAAACXBIWXMAAAsTAAALEwEAmpwYAABQjElEQVR4nO2dd3gc1dWH3ztb1Ltk2ZZky8bdgI0xtuk9AUwNhEAIEEoIhCSkEki+fAmpQL7QSYITIJAQIBA6hG6aqTa44N67qtWlbTP3+2NmVruSbK1klZV93ufxo527M7N3x9JvzvzuuecqrTWCIAjCvoUx2B0QBEEQ+h4Rd0EQhH0QEXdBEIR9EBF3QRCEfRARd0EQhH0Q72B3AKCwsFCXl5cPdjcEQRCGFIsWLarRWhd19V5SiHt5eTkLFy4c7G4IgiAMKZRSm3f3ntgygiAI+yAi7oIgCPsgIu6CIAj7ICLugiAI+yAi7oIgCPsgCYm7UmqTUmqZUmqxUmqh05avlHpNKbXW+ZnntCul1F1KqXVKqaVKqRn9+QUEQRCEzvQkcj9eaz1daz3T2b4BeENrPR54w9kGOBUY7/y7CvhzX3VWEARBSIy9yXM/CzjOef0Q8BbwE6f9YW3XEv5QKZWrlBqhtd65Nx0VBEFIBp5ctI2GtjCXHVGOYaiEjlmxo5G2sMmho/N4bUUly7bVU5yTSkVDgBMnFzO9LLfP+5mouGvgVaWUBu7TWs8DimMEuwIodl6XAFtjjt3mtMWJu1LqKuzInlGjRvWu94IgCANIMGLyoyeWAHDshELGDctK6LjT7noXgE03z+Xnz3xORWMg+t7wnNRBFfejtNbblVLDgNeUUqti39Raa0f4E8a5QcwDmDlzpqwYIghC0mNa7VIVsXonWxHLitv2Gf2T15LQWbXW252fVcDTwCygUik1AsD5WeXsvh0oizm81GkTBEEY0sTqeQeNTpiOi995ErR2ekq34q6UylBKZbmvgS8AnwPPAZc6u10KPOu8fg64xMmamQM0iN8uCMK+gBWjzJreRe5WB3X3evpH3BOxZYqBp5VS7v7/0lq/rJT6BPi3UuoKYDNwvrP/S8BpwDqgFbisz3stCIIwCOiYaL23y093PKy/IvduxV1rvQGY1kV7LXBiF+0auLZPeicIgpBEmL1V9BgsS+MxVNS/9w6WLSMIgiDYxNkyvY3cNfhirBjPYA6oCoIgCPHi3tE7TxQN+Dzt0iuRuyAIwiATmyHTW4PG0hqfxyCDNn7rvZ/8mk/6pG8dEXEXBEFIkHhbppeRu2PLZNLGRd43yGja2FfdiyMpltkTBEEYCsSnQvb+HF7DwKPCAChvah/0rDMi7oIgCAkSG6zvTeTu9xp4scUdX0of9KwzIu6CIAgJElt+oPd57hqfR+EnBIDypfVF1zohnrsgCEKC7K0to7XG0uA1DFKcyN3w9k/kLuIuCIKQIFacLdPz401Lo7XG5zVIcTx3RNwFQRAGl73NlolYduTuM1R75O7rnwFVEXdBEIQEiZ/E1PPj3TLBPo8h4i4IgpAsxE9i6kXkbton8HkNUpwBVUMGVAVBEAaXuJIDvYjcQ664GyrquRt+idwFQRAGlb3NlomYXdgyIu6CIAiDy95my4SdyN3rUfgdcfeILSMIgjC47G1VyLATuftjInePRO6CIAiDi2XtnS0TG7mnqDCWVni8/j7qXTwi7oIgCAli7WVtGVfcXc89hBevx9NX3YtDxF0QBCFB9nZANdxhQDWIr9/WUBVxFwRBSJC9TYVsj9wVKYQI4peVmARBEAab2ElMvRlQjUuFVGGC2och4i4IgjC47O0C2e0Dqu22TH8h4i4IgpAge+u5uzNU/R4l4i4IgpAs7HVVSDfP3SuRuyAIQtIQ77n3/PioLWO4nnv/5LiDiLsgCELCxA+i7k2euyKVEKF+XOlUxF0QBCFB9r62jH2QoWC0qmS7LuyjnnVGxF0Q
BCFB9n4Skx25ZwSryFUtrNSj+qhnnRFxFwRBSJC+SoXMa14LwGqrrE/61RUi7oIgCAkSa8vsTVXI3KZ1AKzSIu6CIAiDzt5WhXSX2UsL1tCsU2kks4961pmExV0p5VFKfaaUesHZHqOU+kgptU4p9bhSyu+0pzjb65z3y/up74IgCAPK3ua5u7ZMSrieOp3VZ/3qip5E7tcBK2O2bwFu11qPA+qAK5z2K4A6p/12Zz9BEIQhT29y22MJOydICdWxiyQQd6VUKTAX+JuzrYATgCedXR4CznZen+Vs47x/orO/IAjCkKa3A6puWd9wxIncQ8kTud8BXA+487MKgHqtdcTZ3gaUOK9LgK0AzvsNzv5xKKWuUkotVEotrK6u7l3vBUEQBpBYz70nA6oeJ751bRl/MkTuSqnTgSqt9aK+/GCt9Tyt9Uyt9cyioqK+PLUgCEK/0NtJTIajtK4t4w/V9Xvknsjc1yOBM5VSpwGpQDZwJ5CrlPI60XkpsN3ZfztQBmxTSnmBHKC2z3suCIIwwPR2EpOh2m0ZP2F8kRZ2DbYto7W+UWtdqrUuBy4A3tRaXwTMB85zdrsUeNZ5/ZyzjfP+m7o3w8qCIAhJRm+zZVxbJmJpcmkGoG6wbZk98BPgB0qpddie+v1O+/1AgdP+A+CGveuiIAhCctDbPHc3pSRkWvzD/3sAapPAlomitX4LeMt5vQGY1cU+AeDLfdA3QRCEpCLec+9B5O5kywTDFsWqDo3B1y66jCszsvu6i1H6r96kIAjCPsbe1pYJhE0MLDaPv5ijp5b3Xce6QMoPCIIgJEhvB1TdiL8tbOIngjb6bwUmFxF3QRCEBOltKqRr4bSGTHxE0Eb/rcDkIuIuCIKQILGRe08mMbl7BoJBPEqjPRK5C4IgJA29rgrp7BwJBe0XIu6CIAjJQ1zhsF5E7pFwyN4WW0YQBCF56P2Aqr13JGxH7mLLCIIgJBG9H1C1fxpW2H4h4i4IgpA89LYqpHbifJ+yC+mKLSMIgpBE9HYSk7uvH6dKuuS5C4IgJA9xtkwPjnP39Tnirj0SuQuCICQNvV5D1dlVxF0QBCEJsXq5iKp7U3BtGSUDqoIgCMmDpdvL9/ZmhqoP096WyF0QBCF5sLSOLrzR09oyKV4Dr5MtI6mQgiAISYSldbQ2e08HVNP8nqjnjkTugiAIyUOcuPcwFTLd55FUSEEQhGTE0sRE7ompu5tVY0futueOVyJ3QRCEpMGyeh65u/uJLSMIgpCkWFrjjYp7gpG789NrGNHyA0rEXRAEIXmwNBg9zJZxbwI+j4p67pZ47oIgCMlDXOSe4DFxkbs7iUk8d0EQhOTBsjQejy3uiU5icvfzepSIuyAIQjJiaXo8icndz+dpj9yRkr+CIAjJg6U1XmUxRW3q2RqqgNdQ+J0BVcPj7fvOdUDEXRAEIUEsrZllLuallJ9SWr8woWPcyN21ZYLai3J8+/5ExF0QBCFBLAtyaALg4MqnEzomugqTx8CHSRgvSom4C4IgJA2W1tFZpuNq50NLbQLH2D/dbJkw3mg6ZX8i4i4IgpAglibqm3t1GJY+3u0xbp6711CkECaCh/6XdhF3QRCEhLG0xk8YgIjyQfWqbo+J5rl7FEWqnhqdLZG7IAhCMmGLu23LtHlzIdjU7TGxqZBlqpptehgDoO3di7tSKlUp9bFSaolSarlS6ianfYxS6iOl1Dql1ONKKb/TnuJsr3PeL+/n7yAIgjAgWBq8Tq56qy8nIXF3Q3evgjJVxVZdlBziDgSBE7TW04DpwClKqTnALcDtWutxQB1whbP/FUCd0367s58gCMKQx7LabZk2T2Li7s5QzdKNZKggW3VRctgy2qbZ2fQ5/zRwAvCk0/4QcLbz+ixnG+f9E9VA5P0IgiD0M6al8asIIe0l6MlIzJZxfhaGdwKwNVlsGQCllEcptRioAl4D1gP1WmtnLi3bgBLndQmwFcB5vwEo6MM+C4IgDAqm1niJEMKX
uLi7kXvETpus0HnJEbkDaK1NrfV0oBSYBUza2w9WSl2llFqolFpYXV29t6cTBEHod2xbxs5VD3gyINjY7TFu5J5KEIA2UpIvFVJrXQ/MBw4HcpVSboGEUmC783o7UAbgvJ8DdMr011rP01rP1FrPLCoq6l3vBUEQBhBT6+hEpKCRbkfu3VQQc9/2W7a4B7Q/OWaoKqWKlFK5zus04GRgJbbIn+fsdinwrPP6OWcb5/03daJLlgiCICQxlqXx6zAh5SVgZIA2Idy2x2Nc+fMTAiCAnwEoLUMipclGAA8ppTzYN4N/a61fUEqtAB5TSv0G+Ay439n/fuAfSql1wC7ggn7otyAIwoDjeu4RnAFVsKN3f/puj3Ej2xQdY8sMQOTerbhrrZcCh3TRvgHbf+/YHgC+3Ce9EwRBSCJMi6gtEzAcQQ81A8W7PSZaFdK1ZQYocpcZqoIgCAliWRofYcL4CHocce9mUDVaFdIKENIeLAzUAAypirgLgiAkiKk1Xu1E7soR90A34h4TuQewV2BSA6C8Iu6CIAgJYlkaL2HCeAkZqXZjJLjnYxx195hBAqQAJF8qpCAIwv6MqTU+HSasfHZVSAAztMdj3MjdYwUIaPuYpJnEJAiCINjlB1xbJuLmo3Qj7i5eMxC1ZUTcBUEQkoh2W8aH6c7hNMN7PKY9co/x3JMkz10QBEEgJs9deQnrBG0ZJ1vGawZocz13SYUUBEFIHkwLPDpMBB9h5XEa9yzuVkzkHnRuCJIKKQiCkERYWuPVYcdzdyP37mwZN1sm1nPv127an9H/HyEIgrBvYFoajyvuKrEBVbf8gCfGlpEBVUEQhCTCcrJlIr1JhTSDBPTADaiKuAuCICSIqTUeHbLz3LXrue/ZlnFjd9uWcTx3idwFQRCSB8sy8WiTCF60UmD4Eh9QjfHcBwIRd0EQhATxOCuLhpXPHij1+BO0ZbST557S/510EHEXBEFIEI9lC3lEeW2zxePrPlsGTQr2Pq7nPhCIuAuCICSA1joauZv4bLslwcg9NboKk6+/uxlFxF0QBCEBLA1+urJlui8/kEb7Qh0DhYi7IAhCApiWxqdscY+3ZbobUNWkKnufNi2euyAISUAgbFJ+w4s8uGDjYHdl0DEtHY3cI3jtDMcEbBmAVNdzl8hdEIRkoDFgi9I9b64b5J4MPqaOEXfltwuCJWjLiOcuCEJSEopYg92FQce0ND5H3E3lxbJIyJbRaNKU7bkHJXIXBCEZiJj2DJygiLuzOLYzoIovJnLvPlsmBfHcBUFIIlxxD5ki7qbWpCjbgjGVz56clECeu6W1eO6CICQXYUtE3SUuco9myyQQuSOeuyAISYYbuQvO4thRz93vRO6J2TKu5y4zVAVBSArCYsdEiUuFVF5nElP3tgzoaOTeJrVlBEFIBkTc27Es2iN3owe2jJY8d0EQkoyIJbaMS+yAagR/wuUHLE10huqwvOx+76eLd8A+SRCEIYdE7u3Yee6m/dpdYi+RPHetSSWI6UnhpeuOoSkQ6e+uAiLugiDsgdgBVa31gKwglKxYMQOqEcOHJ9EBVexsGcuTRlaqj6zUgcmYEVtGEITdEolJhdzfJzLZA6quLePD6kFVyFTCWN7UgehmFBF3QRB2Szgmcm8JDoydkKzElR8wnOg7wfIDqSqE5Rm4TBlIQNyVUmVKqflKqRVKqeVKqeuc9nyl1GtKqbXOzzynXSml7lJKrVNKLVVKzejvLyEIQv8QiRN3cxB7MvhYWuNX7mId3vg8d737gWe3nrv2JF/kHgF+qLWeAswBrlVKTQFuAN7QWo8H3nC2AU4Fxjv/rgL+3Oe9FgRhQIi1ZdrC+7e4u3nuluHDMIz22jJosHZ/bbSzyEfSRe5a651a60+d103ASqAEOAt4yNntIeBs5/VZwMPa5kMgVyk1oq87LghC/xNrywT2c3F3B1S14UMp2qtCAv98fy31rV3bMxrnOM/A5bhDDz13pVQ5cAjwEVCstd7p
vFUBFDuvS4CtMYdtc9o6nusqpdRCpdTC6urqnvZbEIQBIBKTCrm/i7vpTGKyDD8KFRO5w60vLuOG/yzr8jitwaeSWNyVUpnAf4Dvaa0bY9/TWmvsjJ+E0VrP01rP1FrPLCoq6smhgiAMEOGYSUwByZbBTxjt8YGivSoktujX7TZyt20ZbQxc0TBIUNyVUj5sYX9Ea/2U01zp2i3OzyqnfTtQFnN4qdMmCMIQQyL3duwBVdO2ZaC9/AC2uBu7mQNgOSs4aU+SibuyZy3cD6zUWt8W89ZzwKXO60uBZ2PaL3GyZuYADTH2jSAIQ4iIeO5R2iN3vy3kbrYMtu1iOGraKWVU43j1yWfLHAlcDJyglFrs/DsNuBk4WSm1FjjJ2QZ4CdgArAP+Cnyr77stCMJAEFvPPRjez22Z6ICq3x5QdatCYtsuCsXzS3Yw9RevsHJnu3M9WAOq3ZYf0Fq/B+xuzvGJXeyvgWv3sl+CICQBcZF7ZP+O3N3FOrTHFvd4W8ZEKXhzle1Or9jRyOQRdpEwd0CVZPTcBUHYP4n13Pf7yN2t5+7x2dkyWsd57ko5bRC1aKA9zz1ps2UEQdj/CJkaw3lu3989d0tr0lUQ7U2Pidzbs2UMZZf3BVAxZke04FiyDagKgrD/EjEtUn0ePIba720Z04IMAlj+TCdKJxq5+1WkPYMGiE2c0STvgKogCPspEUvjNRQ53gi01Q92dwaViGWRQRvan2ELeQdbxlDKHmSFuNLI2s2WkchdEIRkIWxa+DwGdxt/5MeLvwjm/lsZ0tKaDBUAX0aXtoxSRD33OLSFX5kgkbsgCMlCxNR4PYojWWw3rHp+UPszmJgWZBJAp2Q6kTtxkTso3MzR2IFoLKfeu1cid0EQkoSwZUfuNXZFb1jzyuB2aBDRkZC9hqrrucfUlvE7A6racd1DsaUanMU8dLJVhRQEYf8lYmpSDYs83WA3VHw+uB3qJRHT4vFPtmDuxYLfKtJiv/Bn2ULeobaMismWiV17VplB+4V47oIgJAsRy2K42oUHi0YjB6pXQWTPKw8lI39/fxM/+c8yHv9ka/c77wYj5Ih7SiagbCGPlh8wMS0dXbMjdklC5dgyki0jCELSEDY1I6gF4BP/bNs/rlk9yL3qOTXN9g1pd5UbE8ETaQZA+TPbB09jPHe79r2t7rF18F1xl8hdEISkIWJaDKcGgCWeqXZj445B7FHvcL3w3RRuTAiPE7mr1Mz2KUoxtWXCphW1fWI9d+WusSozVIWBwLI0/1m0Lc4bFISORCxNHrbfvt5dc2c/zXdftcUubpuWmYPRYRKTzxH3iGkxSlV28NwlchcGkFdXVPLDJ5Zw5+trB7srQhITNu3B1AhetliFdmNb3eB2agCobgry82c+Z3VFEwAba1pYu60CAG9qdkxVyHhb5pjGF3gn5fvkNyyPnqvdlpHIXRgQ7MfH1ZVNg9wPIZkJhC3yaaDFm0dtJN1prB/UPvWKLmq+7Im3Vlfxjw83c/59H7CtrpVv/mMh2Spgv5mS2T6JyfBgofApO3I/pO0DADLb7PWJ2kImd726wj5OxF0YCLLT7EfEmubgIPdESGZaQxHydAMtvjzaTAUp2UMycneHNyN7sCEf/2QL76yx13N2B14b2sL8fcEm1lQ2c+xoJ0/dn9leFVIpTLxc6nmV1HA9aZbty6eE7Gu0prLJmeCE2DLCAOH8tou4C3uiJWiSqxto8+XZ6X2puX3uub+1uopr//Vp11P3+wjXA99T8bOf/GcZlzzwMQB1reFo+/rqZkrz0jg9YxVkjYD0QnsNVeyMGR9hclUL32z7G9mWPT6REbTrunsMO6oHwCuTmIQBIOKM6lc1Bvm/V1azo75tQD5Xa81db6xlc23LgHyesHe0hCJkmfUE/Hl2Bkhabp9H7h9sqOXFpTtpCXUW3g3VzX0i+m654rZQ15H78h0Ncdt1Le0pkwdue5QXA5fCmpfhoC+DYWAoxYbqFsbc+FJ0vy9E
3qJM25lE2SFb3FuCEbsGPEhtGWFgcFO2ghGLe+av45fPLe/miL6hojHAba+t4bIHPxmQzxP2jpZghIxIHQF/PhFLo9Py+txzdxcBqWoMxLV/uKGWE/74Nk8s2rbXn9Hm3DjauqhJ/+7aaube9V5cm2vL+AlzSeQ/5OhGmH4RHPk9YPdL0wHs0PnkhXbA2tcIN2xvt2WktowwEHSchp2Z0u2Ki336ufv7wg9DgWDExGMG8FsBwikFAFgpOX0eubu/C9VN8Rahuw7pih2NnY7pKa2OuAe7+L1rbOtc6bKuJcywTB8/9T5CkWrgb2Nuh7P/BBn2degqX/5y4zdcYf2MT60JjA8sg0fOY9ZLp5PK4OS5D8xftJB0RDqIe3FO6oB8rvuErfZmNokwILQGTbJpBSCSkuP8zMXTx557VNw7jP+4E4FSvD2LQRdtrqMoM4VRBenRNjdi7ypyjz3/YWoV5j8epLnlm9yU+iinRl7lb5FTaRhxZNwxHf9+AD6xJtAWManTPnKzMjnYu5nsxrWMVPYMX8mWEQaEjpF7XvrAPDL245iZ0Mc0ByNkKVvctT8TgIjfyZZx/iO11mypbd2rzwk4tkzHyD3YS3E/98/vc9Jtb8e1xdoyf3t3A+U3vEjQGVwNxWTQ/Mj3bzzrX2N2y3yOa32V58zD+U3kaxRmxg+Gfrq589NLIGwSsTSf6gl8bdflfLfmbADKlZ0fL9kywoBgdlDZvSiW1yMiTsFrCdyTn9aQSSb2QLtOyQYg7M+168uEbUGf984GjvnDfNbuxXyJtt3YMq74+nsg7o0BO8sl1CHlMRq5h0x++9JKwE4mgPZMmpOnFNOqbRH/hXUvaVYzC7JPBRRpPk/c+XY22OMDhoKvBH/OGeHfx9WTAdih7UlfF3rnE9YelHMNBwoR9/0U07I6bA+MuruPsyLuyU9zMEKmssVdpWYBEPI5AuX47s8utrNDalt6X5Brd567O9DqMRKXqU01XWdhueIeCoXQGrxEqHQGcF3755xDSihXFdSQx+vmIXwy/nuc86WLADhkVG7c+Z64+nBu/tJB+L0GH+nJ1OdMAsBrKGaNyQdguyPuADdFLiHky0r4e/QFIu77KW5gc89XDwHsut0DgRslJTpTUBg8WoKRaOTuRp1Br+29u7nuFY5AtoZ6v/xewBHXjp67m5Met/BFN2x0xH14dvwYUiAY5jbfn7iz7hp+4n2Uj1O+RVVdvX1+53dyUlEKZaqaf0WO5crwj2k97NvMOaCQjb8/jfHF8cJ8WHk+F8waFY3WR+akATBjVF7U4mwhLbr/k+YxPXoC6QtE3PdT3Mh9xqg8lOocyfcX7k1EIveBIRA2+b9XVlPfi1K3raEIWU7kbjiRe9CNPp3IfZcTsXeVcZIobgaLa5O4tASdDJc9TDzqiCvuHRMEDgwv5Uue9xhlbeca7/Pkq2Yq135G2LQIOzePgtaNeJXFOssukDZumD3OsKfBf/eJd2SuLeRHjS/E7223cELaQ63O4rXrT2FY1sAkLbiIuO+nuPaIx1CUGbWktVUMyOe6kbsh6j4gzHtnA/fMX9erRSqagyZZTraMkWpH7AE3cg/URwcpod3r7g3ttkwAnrgMnrzcPmebfc5gDyL3Ksfaif3tCpsWY8LrAajVWax1xHvlkg+47+310eg7dfsCAD62bItlRHbiYjzCuZkcNb4Qv8eW1SkjspkZ/AvHBO+gLD99T4f3CyLu+ymWI+7eYB3v+L7DNZ+dOSA1Q9w/JJH2geH1lZVAzwYlXVpD7baMJ922ZVo97ZF77MIXDa17I+62eM9sew+WPwWf/wdCLdEbRk8i92hWTMiMTopatbOJA9hGLbkcE7yDU0O/J6B9fNf7NFXVNVFbxrvpbSicQAV2LrthdP9bOrYwA4DzZ5bx3RPGMa00l/MOLSXFazD34BE0khFnzwwkIu77KW7k7mve2d7Y1P/Ru5stI+o+MLhlJWqag1z50EIWb61P+Fh3QFX7
0vH77BztVsO2Kmirpz5G0Pcqco+YeA3FFLWpvXHzB1GrxxX/RHC9/9WVTcz63Rtsr29j8dY6Jhjb2JUxlhbSiOBlsR5HqarhlNbnop6+Ub0KSg7lxe8exQvfOSqhz3vsqjn844pZlBdm8IMvTMRjKA4/oIDVvzmVa48fl3C/+wOZxLSf4nqFnmBMtN66q98/NzIEI/eG1jApPoPUDulwQwFXuJZua+DdtTWsrWri7R8fn9CxrUGTEhWAlKxo5N9GGhheaKujvi1EIQ18z/sk/h2HAVN61cdA2GRkbhplTVVU6xzyVAtNK96koe1EoGe2TFvMjeAgtYFXXgvRsGMt0431fJ7/VZwVA0m98CF4fBZFTcsJmxZeA1RLNWQOY+rInIQ/b1h2KsP2YN/c8ZXp5AzQHJKOiLjvp7ji7g3EiHtb/4v7UFz5adqvXmVicRavfP+Ywe5Kj3GF0fWv27oozrU7moMRcj1tqJSs6ESioKntypCBehpaw8z1fMjXvG8Q2vEecGOP+6e1JhC2GJWfTllzNWutEtJVAP+K99DNB/KM//94uuWnwCEJna8tJmvn+ZT/geV2rZeWtOGsn3QVrLVTN0eWjOZ56wiOaV5lL0jiDYIZhIyiHn+HPXH2ISV9er6eILbMfopryxiBgY3cXc99qA2oJsuiJo2BcMICrbWOirubstjV9Pvd0RKMkG3ER+6hiAUZhWzduolrHvmUqY6V4tdBCAf2cLaucftXmpdGmapmqx7GYmscY0JrOF0tYLqxnnNq5iV8PreGTKmqiraNVLvIOPQCUnKGR9syUrysVmPJCVXiD9RSbDj/v30s7oNJt+KulHpAKVWllPo8pi1fKfWaUmqt8zPPaVdKqbuUUuuUUkuVUjP6s/NC73EjdyM2Wh+AyF1mqO4dB//yVU69852E9o2dpVnppBkGe+RfmxTSCGl5UXG//j9LWRosJrTTnuU51djUfkDj9oTP7eJmykwu9DFM1XPEzENZbI0jTbfxc98/ARgVWgvhxEpSuzevo4zP498onUlmSrs9ku73sNhzoH3++o8Y5nHEPb2QfYVEIve/A6d0aLsBeENrPR54w9kGOBUY7/y7Cvhz33RT6Gui4h7YRQtphJV/QCP3oTKJaaBm7iaC25dNTi2XlmCEe+ev2+3qQl151R2n5YM9CFl+w4s8/Vl7ad2Tb3ubl5ZtZ7S1FQonkhKTuz1/VwEHGDv5gvEJ49U2NqfaqYO9E3cnxzxiZ/WUjZ3M9hEnssCcCsAOVUy+tQvunQ07l3Z7Pvep5hC1jgaVBZf9F4oPgvKjyEptd6GVUqzzHECjN5+JDe8xTDmVJzP2I3HXWr8DdPyrPwt4yHn9EHB2TPvD2uZDIFcpNaKP+rrP0BqKcOVDC9lWt3cFl/YG09IYClTrLhpUNi2e7AEaUB1akfvezLzsK15ZXtHlgip3vbGWP7yymmecEgAdcaPi7FQvGbSxKfWrfNnzVqf9dtTbdsodr6/FsjRvr6lmbVUzo1QVqQSheEpc8a7VVikA8/y341cm7xZdYL/R0PO6624f80POjSFvNKnpWXwtfCOnhm7mppJ53J1+LdRvJrL4sW7P50buBxkbWe8dD6OPgGveg7S8OHEH8Hi8rMk4lPLWZRQarrjvR7bMbijWWrs5dBVAsfO6BIidLbHNaeuEUuoqpdRCpdTC6urqXnZjaPLaikpeX1nJzf9dNWh9MLXGaxjQtosmlUWzkT0wA6pJFAknQk8GIPuLb/5jEffMX8e6qua4dtdf/tETS/idUwwrFteCKcxKYaKy/yx/7/1bp/0anMFWj1I8+ek2LnWWmnOPYdjU6MQcgM/1mOjreyNnsjbPGWjujbg7Oew5AecGlTua7DQfGoP6rAl407O5u/FoPrYmsn3Jm92erzVkkkKI8WobG7zxqYhZqfFZK36vQYWvjNxIDSOpsRv3p8i9O7S9BlaP/2K11vO01jO11jOLivadu2UiJEMtc9PSGAbQ
WkujkW2L+4BG7oN/DRKhq6XfBotVFbYv7M6G9Hrar+G8dzZ02t+1ZbJTfYwz7MjYq6xO/rW7jq5hqLjVkKLiXjQxbkLPFl3MicE/MCbwT/4QuQDDl0oleVC3aY/9X1fV3Onpw7VlsgLbwZsGmcPIcRZvL81LI8VrEIpYfGJNpCSwBkK7f9o1LU0oYvGL1MfxKZPVKVPj3u8Yufs8itVBW8y/GnoCckYN+Dqn/Ulvxb3StVucn+7Q9HagLGa/UqdN6ILBjGEjphO5t+6i2RX3AUyFTGDyX1KQDLaMy9oqW9xTfR4aWsNx0XRXuDM7c1MNDlOro+26dl3cfrXN9kxTj1Kk+9sFcKKxlVr/SEjJjLZNK7VzwNfrEj766cl8/NMT8XsMNuvhULt+j/056ba3OeLm+OjbfTLKaN0OuaNAKbJTXXFPj3r9K63ReDH3eANpC5sYWHyJN3jaPJIlqbPi3u84T8HnMXi7JqYg2Gl/2GP/hxq9FffngEud15cCz8a0X+JkzcwBGmLsGyGJsLTGYyhoq6PJyKHRyBrYAdUhI+7JE7lv22VHvRtrWpj2q1ejdsrucCP3ucGX+LK3PcMmVBtfZ6bWidyVig84JqmtVKcdEN1e/7vT+Ptl7YLpTuDxew02WCOgw00jEVxbJq1lG+SNBugUuUNM+dyG3dfIaQ1FKFcVpBJigXVgt6WCfR6Dzbq4vWHCF3vc/2QmkVTIR4EPgIlKqW1KqSuAm4GTlVJrgZOcbYCXgA3AOuCvwLf6pddDnKiuDWLoHrEsUlQEgo20eLJoUvEr7PTb5w5QaeG+wl2UIRnYsquV//U+zDc9zwPtFRl3h+u5TwjbYzu/Dn8NgEDt5rj9XFumORihuS3MAWo7c4wVjDN2sDOl3V/3GIrcLmZb+jwG663h0FrT4/pEbkXIlOZtkGuLe3aa/fRQmpcWjbb3JO5aaxra7Pz/SWoLYEf6nt08Hs4Za9db93sMGsikQufxXMZ5QyfiSJBuZ6hqrS/czVsndrGvBq7d204J/Y9pafKNFrCgxZNDmBBoEwINkJbbb5/r5rkPheX23l5TzXcf/WywuxGlsrGVy1NfBuA+84xuZ/u6tkxReAfvm1N4wDyF672PYdXHC2SNc5MoaN3AySvu5rqUdutkQ+oUYosVdDVW4vMYbNROUlzteiidmfB3CoQtsmnGE2rsInJPj95cq8khjBdfF4O2f39/Ezc9v4IHvj6TycYWTAzW6ZHM7kLc1/321OgEOp/X/jkneC/ThuVyZsK9HhpI+YFBIBl0zbQ0Bcr2cFs8OQQsJ0Jt29Wv4u7aMsmUP747lm2rH+wuAPbqPhFLU6ras8q8RGgK7Hk8wLVl8oPbeEvPQGOwUxeQ20Egq5uCjKSGf/FTMuraa6r/IHQ1kdTZnc77yzOmUJLXXsLW51Fs0cPsjfrNPRR3kzL3ezmR++FjC7jgsDIOGZXL9jpnmT8MqlQBJV2I+3+X2QXvVlc0M05tZ1dKCcGAH28X4u6NGafwxbxuCSbP2EpfIeUHBgF3cQA9iDIfsTS5yk6ta/Xm0IAzsNTav2V/3Wizq9Xjk43YRZF394g/ELjWxFTVbqcsTLkGs7lmj8cFwibZNJMarmejtqfe79AFeBrjBXJjVRN/9t+BAu6LzOWvkdN41zyQp62jmDii87qfXz9yDCdPafeqU7wGO7RdJpf6ntWNjxN3J3IvyEzh5nMPJt3vZVRB+01ku1UAdZs7ncN9mKhtDjJGVVCXap+nuxIXseLeKuIu9AVdzRIcaCxLkxcj7vWuuPdzxoybCjkUIvdYcegqCtwbmgJhTvjjWzz68ZZu93VviLFT/XNVC+e1tk/qMZTu5HUFIxYHKDufYZMj7hv0CNLqV4Njj9U2B8lo3cI0YwM3Ry7g95GLeGbYtzj61wt45tqjufrYA+gOn8egmXSslJwe57oHIhajVKXzpUZ3en9UzCIXi8wD0Ds+hZbauH3c/6dFm2oYoypoy7HH
CbpJJsIXk0qaTCmvfYWI+yDg/rEOpu8csTR52LZMwJtDvXYj98TFPRSxelQfHNonMUUGaFm/vcHN5Jim1jHK6NuJdhUNATZUt3DjU8to3kPUaFntxb+mqM2ssUq4PXwuS6yxnGi9D8AEtZWX/TfAbVNYt7OOHz+xhEDYJBixGG/YYrta2xnKS/QBeMPNsMtOW1xd0cQYZdsaRx5tD6O56YnTynITemJxI+BIZskes1lctNbc9PxyFm+tj0buOjWnSzuwOKac7nPmESgrAi/+AKx2MXaTYqq3byBFhdEF44Hun7biIvckSnntK0TcB4GeLPjbX5iWJjcq7rnUaSeXubV2D0fF88dXV3P2vQtY04OKidHIfQhkzbhT459N+V9eM77Tp+eOrc7o+sqxvLmqkum/epVdMasdTTU2sYKx3GmeyzPmkQxXdXzJeIen/f/LBLUVmnbw2lvzeWLRNh56fxPBsMlEtQ3Lk8pWbU8UXGqNtU/2xGVghvlsaz1jlT07NH2kXSOmpwtv+Jx0xXBWSUKRe0VjgAcXbOL8v3xAW9hktFGN6iJqh3iBXqlHUTHqDFjxDGx4K9pu34w0c40PASgYfRAAX5gynD0RK+7hIfD72FNE3AcBNxIbzMg9Ku6+dCxfKvU6HZTRI1vGLYPbkxo5birkUPDcA2ELPzFCF2rpxTlMlu9o6NQeW9ZgZ0Nncf/DK2uobw2zbJt97MnGQoarOjb7bJtkiWX/vM3/Fyp0PucF/xeAsSF7stIryysIRiwmqK1ECiainT/1tdquC0PlMp56+nH+8MpqDs+pg7R8iotHAtDYzUBtR9zJVMGMkt167rE2nLuIdci0CIYtyozqqN/eFf+6cjaPXDkbpRTPjPy+3VixlNZQhMVb69nVEuK33ge40fcoW/KPoOzg41jxqy92W0vd151vM8QZ0t9u+YIX+fBPV2ElgYfdE6K2zCAOqJqWJkc3QVq+nY2hlb0IQw9smQxnNqO7Sn0itNsyQ0HcTUo9MQPMvxvZ45rlP316GXPvei86UcglNnKvcNL9zrj7Pea9Y9slmSn2IOq2+jYu8/yXv/pvI6h9rE23F61YodvFcFHpxSzUE9FpeeTXLwOgtiVEMGwyydgKw9pXSLIweGz2UwB8vtze96jcWigYFy1r0NMnS7+TUhhMLYJgQ5fleWPTNjfVtAcDwVCYkVRDXvluz3/EuEKOHFfImMIMbn6rgm26kOq1n/DQ+5s5+94F5O5aykXeN3jSPIa2cx4Ew4ibabs7Yl2bx66ak8A3HVoMaXFv3PwZc6oep7mu/9f+7EvcP57BnNATsTQ5uhHS8/E4qXakF/TIlslwBKgnaWTh6HdP7hvyy59X8Lf3NjLa2yF7qGZ11wfshqVO5F3dUdxjIveKxgBaa5Ztb+B3L9kTjjJSbHHaUN3Mican7GAYM4J/YXua7ScHSOHU4O95Mv8btE0+D1CEyk/goPo3KaSB1rYg/tadFKkGjJLpcZ+90zMCrTwURCr47tElpFZ+BmWzyEr1UZKbxk1nxtdk6Q43Ag6mOBkzLZ3HJ2LFfWNNMxd43qRUVRFqqCCFcJeDqR2ZXpoLwAprNOnVS9lcYycEXOB5k2adyv+Gv86E0uI9nCEey3l0/ulpk5gztiDh44YKQ1rczRz7F6Ktcs81LZIN9xd9MLNmLK3J1k2QbkfupivuPbBl3OhoTwOCHXEHUk1Lw/r50JCcpYeu/uciQhGLUR77elwe+pH9RuXyHp0n0xFpt36LS8fIvWOZg1Snpsq6qmbGG9tZmXIQLaRhxTzxrNSjebvoIlJS0gBoPOw6UnUbC1Ov4SHzJwxrsCNzT1l73nmaz0NrGHR2CSOpZlJoKZghOOAEABbccAKXHlHeo+/o2jJtfnvmZ1fiHhvIVFZWcLPvbzzt/1/MKudmmT+m0zEdOXaiPW7winkYGa1bGV35CvmeAKd6PmbLsBN44Ydf7FFBOrdPQ3Ft3EQY0uLu/kKEajpX
xEtm3Mi9Jwv/7i0bqpu56fnlUXGImJos3QTpBXgMw4nc83tky7h/FI3d1DiJxR24yrdq4R9nwyPnJf4lBoESw36S+dCagvam9ljc3UqEVU3xdo4r7sXZKexoCFDf4Rq2ONkblVVVFKt6atPs3/WOz3qpXoM0v/3/cOdSgy2WLYBT1CbO3/g/hPGihh8U3T/d76E1ZBLKKqVUVTN9x78hJRtGHd6j7xWLO6Da6op7cxeRe0x2lPv3WqQaGdO6DAsFJYd2+znHjLe/29PWUSy3RnNN9W/51Hc52Z4Qk878EWOLMrs5QzymE7mnekXckw5/QTkA1q6Ng9uRHhJyBG4gs2beWFnFgws2scMZvDO1JttqiHruZi/E3bVWYjM6uj3G+SM/h/l2Q9UKiCR+/EBTqqpp8xfQSiqRgkmwfVGPjnfFvbrJtmW27mpl2k2vsnKnvTjE6Lx0jql+lKL7ZzGMdgvILQqW0Wg/lR44bRZnTBvJt4+Pr1Ge6vNEKyf+88Mt3BS5hCqdy0prFABv5385roxtmt/DIx9tYU0gj8OMNYysfheO+TH40+ktbuTe6nNtmapO+8RG7t6G9tz+bxlPsdU7GtLyuv2cvAw/z157JBYGv45cjKkV69OnoS54FKOs+5tDR9xAZzAnqPUnQ1rcs7KyqdS5GPWdZ60lI+urm2kJRgiHw1zheRF/qDH6ntaaz7d3zqroK1zrxLUHtBkhXbc4kbuyhTot3/bcE0zjcW2lutYeRO4R+9wnGQvbG3d8mvDxA02ZtY2mTDtqbhv7BdjyQbezMLXWLNvWgNY6ahNUOWuYPv3Zdhrawvzzwy2MUTv5ddPPuLLtAfxNWzjWsyR6Dvdp6HBjBQB54w/j7gsPYWRuWtxnpfk90cgd4A3rUGYF/8Rpod9xcvBWthxyfdz+7nkfrBrf3jjz8oSvR1e4nnuz1xHobjz3EqdCeEh78CmTz9MSL1cwrSwXsJ+kZgTv44mD5sGEL/Sq3+79RsQ9CclJ87FFDyOlqftZfoPBy5/v5JQ73sG0NFprTvzj21z24CcMb/qcn/se4WfNv47u+9ySHZx+93u8/HnnCskR0+JfH22JZlX0hqi4t9gik2o2YaA7e+5mEMKJpTa6Tx513VQnjKUtbJJPIweqTejJZzmdq+zBNxlYysxttGTZ4t447mwA3nzuIa5/csluj3nq0+2ccc97vL6yioDjpVc5kXtsSuBXvG8zsfVT7rLOJ5iSzxxHyMGO3McWZnC650MWWeMZUWrnp3e876Z6jbgl8ACOGleIxmCtLmXaqNy499w0x2dDM/nMGkft9G/F1WvvDe7i2UH84M/q2paJidxHqSqaPDlcFPoZvwtfyAuFV/Ts85ybSQOZ3RZP2xMSuScxrrintfR8ea+B4EdPLGVVRRNVTYGouH68aRebNqwBYJq53F701zJZ7yyhtmJn+4SgdVVNBMImH2/axU+fXsac37/Rq37866MtPLvYHriscSL3TNN5SkjLx+OJyZaBhDNmehO5t4YiHGsswVCayNQvOY39X0e+J7h2Ux6N5NJEa7YtrG0ZZeDPZPOapfx74e5/595eY4tbRWP7QKnruVsx6jzN2EhV5iRuC53NjrxZfNFYyDS1Dq01jYEIXy+rYIqxGePgL0ePMTuoe2leejRy/uYxY/ns5yfzrePaSwaUF2R02UcLg3NCvyJ8/C8Suyh7wJ3GHzItyCzq2paJ8dzLVQXNaaUsNiYzzzwDrz+t0/574plrj+Ts6XZOvpu+2RvcPom4JyHpfg/bKSYzWAmRYPcHDDBuquD2ura4hRVKlF3wqYl0uO9o+FWB7X/T/vha2xzkpNve4abnl9McM6kkEN5zTrll6biMCrBzrV1Rd22ZDFfc0zt47pC4uDuRe08GVNtCJud63mGLVUR4zAk9+rz+IBSx+PfCrXHXzL0RH+DM3GzLtsWyJWyxySyMVmeMPSZsWpx17wLeWFkZXUquORCJDpzWNoewdi6j
ZNeHzhGaqWoD9bkHAvBM0VU0kc7PfI9Q0xzCtDTHVT4E6QUccua3o58zdWQ2Z04b2b5dks2MUbk8fPksrj9lEnkZfrLT2muu52f4o6+zY5aZcwW5q/rsPcWNpB//ZCsrWzKhsfOC3a4dB5pJxhaacydES/umensmQ1NGZnPHBYfwjytm8fUeZvbE4gb9Iu5JiFKKGu8IFLpXi/P2N+4kn+31bdTHRLelqpo6ncnVxi+dFk1Bmz0o7OaBb6q1rZGFm+ri0ua6W6Dh9Lvf4+hb50e33YG89uPt7Vhxd7NldJor7olF0lFx78F0dR1q5ghjBc9aRxI20sCX3uMFHvqSee+s5/onl/LcknZBamyzxb3UuQlHcuy6LCt3NrImVMDxxmKONZZQuWk5G6vtJ67a5hBLttZzxUMLWVfZyLHGEqobmvEG6viy5y1orsK47yguWPVdDCzGqp1k00KgyM5kWdaUzQORU5hlrMb3xEWcaSxg1K734fBvg789+vZ5DO668JDo9vhhWSilOGZCUVSkYtcKdT3/Fb/6Ih//7CSevPpw5l18KDNG5ZHiNfokDdC1ZRZtrmNFa3anevHQni1TRD0FqgmzaGo0l7+3N5ijxxfFlfDtKe5TlGcfW6TDZcjXc69PLYE2oG4jFHRfwW4gSXdnGda1xZWPLVE1bNeFLDXL4TuL4J5D8TVuAabYE2cKM0h3/uhy031xOdDrqppZsrWeUw8aETdg57JiZ2PcdnvdF82t3nmUr0mDuY+TaTnt6QV4DVvwrbR8PNCluAcjJs8u3sG5M0qjIuLaMs3BCJal4xZR3h1p4XoMr2aLHmYvJpHWswydrr7z3hB9oom5abo3q5HKfqKIZJYAdayuaGKULsKrLB7y3wIP38KH1mTG/HIBTTE3uMNCH/FX/218uuYDDg14met7E6x50fePMpZFnwpCZUfBB5V8uqWOD82TGK+2c/6W17jL/xqtWWNIP+zKLvtdXpDOptrWqLDG4ubWx+LOSZhZbt/AlVJ8tKFvnphip/Hv0IWopg/swl5G+43DzZaZYtjjY76RB1H7qX3Np4zsXFZ4IPjFGVPwGIqjxhcOyuf3N0M6cgdoSnNqZdQmX667K8rb6lqjkftktZkTPIvZrgsJRix++V4zJh5SGjdzpLGMMlXJ755ZyKZau/5GRoo3TtznvbOBax75lEc/3sKYG19iU03X9U6qGgNsq2tlVYUt4mca73O+921mNbwMNWvJivXcHVGOpDrZDl1MZLr7jXVc/+RSXl3ePhs4FFMjpymBiUympUk17Ui3UWcw67dvoNPzEp449fqKSsbc+BIbnGi5L3DvE7EWi7sIxghVS73OwOMMOP79/U2EnHhouTWaf0WOZ46xksDSp+OeXo4w7Fz4GS3vMNd8k7VWCQvMqTxv2lPcH/bfwi98/6Be5ZI6zE5trG8NM3rEMK6PfJNHx97CD0JXs/2C1yC1a+H773XHsOyXXWeJZKZ2H7OdPKWY/zl9Srf7JUKsuO/UBShtQlP8rHF3HOMrKR8S1F4yRk2P2l8Hjszpk370lNEFGfz1kpn77CSmIR+5mxnF1NXlkbd9IXDVYHcnDlfQt9cHqG+zo5TveJ8G4J/mSYQsi79/uJ3L/fkcW/soJ/vtX/aF1gQeqboTsIUm1mdvrtrExZ73uf9d+1H94427+HjTLs6eXhK3BOSpd76Lp6WS46dP4A7fPZzteZ9mnUqaCuFZ/AhZuomI8uH1Z0RrlZv+HEB16YEvcVYlqoqxedrz9DW8fSs0robzH97t9WgLm+Qo+2bUgN3/Op1FfoKR+0tOJtHCTXU9nrCyO9xa4LGzhV2hHqFq2akLorVTAB6InMpXZo/hnAUzieDhKONzChc/SuPhx0T3OdxYwWLfIdzP2VweeoQ7/FfydrMdhFgYRPCQTyNb8+ZwQown/vsvHcTZ9y7gwdrJrLHKuKkgd7f9ttMfuxalFK+Hr84exekHjejx9egNsXXRo4t2
NGyFnPbCXSHTYiQ1nKbfZtuB36S0uL1iY1/9XwrxDHlxz0n3s9gzheM3LbBDyCTxz7bVtbKrJUQWrRgtldS32o/DhxjreMY8gnetg6P7btHDGIU9SPepNY6ZxhpmrjuVr/nH89/6M0hpmMNUtZEzPB9wdegF8MFlgSmso5THPtnCp1vq2VbXxoWzyqLnPLJtPnel3svKFWVM9tge6GPm8Rzs286sVS+SbZXR4skhR6n2yB3DrqndhdhuqLZF+d21NZwzo4TsVF9UEC/wzCfnw7/ZO7buah+Y7UBrKEI29nkatT1pZmsglfxw53kK5Te8yEWzR/Hbc+JnV7rn6Qlaa3saf3FWp/fcdUZj0zndyH2k2kVa4ShCRntkevLsaXhO/gqhBa8C8ImexBkVi2l0JnKNUTuZZGzl/VHn8fzy8TzPL5lRnAvN9QBcF24fHD0hfxjnOeI+oTiTaaU5jBuWyZrKZrJSvWSl9n6w83cx162/ibXJtrkLWT/wRfjWRzDMLiMcMTXTDHtCVukRXwHg2WuPZGNNyz47oDnYDHlbJifNy0fmJGjcBrXrBrs7UY66xR7UfNh/M3+v/RqnfvYtHvbfwgi1i8+s8XH7fpRpL5LwtHkk54Z+ya8te1LJocZa/id4G1cuPp8XU37G1d4XosccHX4PgGXbG5itVjL601uoaggwkhq+5XmWP/r+AsBkwxb234Uv5K7IOfw3cijUrOEM6w1avfYjfzRyN7suHhaKWGx3MkA+WrmRt/7yA2jdRShiMT21gl94Y6L1nbvP/24LmWQre6C4QduR+9ZAGrTUxCVwu4XIHvkofv6C6xu3dpMx1JHnluzg5NvfYf6qzil67tNV7Cxbe9BZMzm9kfKxE6Ipc8dNLOK35xxEluNpF2ensMQaiz9QQ6TeTjX9su89TK2YdcY3GFtof8fSvK5nf2alekn3e3nkytk8ec0RKKWi2R8luT1LD0wWalLLucd/BU0qC+upq6L/rxHL4iBjI1p5YZhdmGxaWW63ZXmF3rMPiLuPZ4Mz0MqAxf8a7O4AdqQIUKYqOcRYRyMZpDdtZKaxGpTBitTpHFbePt268OgrODv4Kz6ZciPfPmEC94dO4qbwxXzgay9DGsHDrd5vRrcPtz4DNNoM87D/Zs5te5KSx07klZSfcL3vcT6wpnB88I+8YM7mx5k3M888g0YyeTR8DJHyY+1zGvYgr1sb5OfPfk6rJ6eTuMemcd7m+xNn1j8MH9xDKGJxvedR2vDz3hdfBGDz5+/v9rq0hkxynMj94uOn8Y2jx/BWy2i7TOxm+7jqpiDfefSzPV7fXc09K1dQ2WjnmL+6onP1UPe7xWYh1TSHmOrdgQrUQfGBTC/L47oTx3PHV6YDdqS68H9O4rlvHxWtq16w400UFt/MW4RVfize3BKmOxOIhsfkYt9y7kHRQdDZY2wL48hxhWQ7UfqXZpSQk+bb7Q0hWfndOQfx3LePZMLwbP6v8URuCZ2HUbEEdtj/l2FTc6DaSKhgIvh6n5suJM4+Ie47rTzMMSfAimcHuztA++DiyYY9rX5u8DfMabuDc/OehJ9V8MTPL+df32gX7pOnFLNYjyMlM5/cdPsx/UHzVP574B8pD/yLy0M/4qtpf+bd7DP4RugH/CVyOhPUNv7iu4N1qZeQomyBKmxdz2ZdzLwJ87gkfANjJk7j2+Hr2JAxLfpZAVLYONm+SYxsWwu0F2R6YelOVjR4Ow1wugL42+NzONnjlAr4/D/ocIAZ1lKeNY9kh280m6xiVi18c7fXpTVke+5aGVz9hekcXJrLi5GZRLyZsORRAG55eRVvOhF2mapk2fwnose7A3BVTT2b06Cwn0xWxkwQc3Ej97o4cQ9yTuoiQMGkuXgMxfdPnhD9vwF78eyizBRWGgewJesQ5my4h7m+T/E0bME340IAJg3Pivb7jGkjefLqw/nKYaModaLy4ycVdeqPG8n/z9zJPfqOg81XZ4/i4NJcvn/SBACe
NY8kYKSh37sNsOcBjDV2Es6fOJjd3K/YJ8QdoLXoIDsdMgkmM7kThS4bXUNTynC2arvG9ANfnxkt4hSbYTDSqaF9/swy8jPs7zM8O5XTD7Ynq7xpzaAxZQQFWSm8Zs3kE2siHqU5xfNJ9BwnBP+PgwPz+M9h/+IbF57Pu9efwPWn2H9I3znBzshwPfnXm+0Zlw3F9g2mLD+dc2fYA37VVpZdhtds97UbnMHgOa1vAfAn8yyo28QZ4ZdJ1UHetg5mbWUTH1qT7Sn0Vte2SVvIJJsWIr5scHKzC/PzeEtPhzUvg2VF65wfoLbzbsr3OejtKwmtfxcgOpmrY+5+d7iD2eu7yLJx39vVGopaCDXNIQ5TK2HENMja/VJthqEozEzj30XXkmo2c4/nNsguhclnAHDqgSOcn8O5+8JDommI9140g5vOnMqInK6tlwNLcigv7HpmabJz+AEFvPPj4znpkPHcG5yLWvk8p994Nz97agnF1GFliw0zUOwz4t6YMQa0BUlQIdKdKFTQtJK63PaFDzr+Mb/yvWN4/Qd2lsWlR5QzeUR2NDo8qDSHWWPy+bmTrhYyrehswyWWLdZt2s9jo36J/vZCNuiRNJLJL86YilKKsvx0Jg3PZtPNczlu4jA23TyXr82x69/f8toGDg/cTfjch6J9+eP50/jeSeN5pvUgO3Jf1e7vN7SFUViUbHyS6rxDeCh8MgDXWI9gYfCxNZm/vruRBdaB5KhWIls+6vK6tIYi5KgWrFQ79S0nzceFs0bxfNvBdrGpHZ9R1xoCNPf67qJZ24/v6pmroXVXNHKvbAzAyufhrZsT+v9wnzyaAhHqO1SwrG8Nc6bxPg+3XIP+zTBY8Ry1zUFGW1uh+MBuzz08J5VPg2V8njGbGpUHX5oXnXRUlp/OppvncvT4+Ah98ojsHtdMH0qMKkjn1vMO5gnv6bQZGVznfYqcSC0+ZYKI+4Ax5MXdnWpdl+as5FK7NqHjghGT8hte5P73+v5mUNtsZ8mkN22ipcAWiK4SAiYOz2LcsPgMjnxH3KeV2gJYlGVH+i3BSHQiVA05XBS6ketKHuWCy7+PKhzP7V+Zxj+umLXHfhVktE+k2kkBwwrjV585alwhr5mHUusvgXf+D5yBxIa2MLONVaQ2bmTX5IupJJ+WvEmkEaIqfRxXnmhnZrxtHUytzsJ67joIdo6S28K2565TcqNtI3JSeduaZo+ZrHmZdVXNTFWbmWRs5deRizkr+Ct8Tdtg0YM0ByIYWHy5/m/w+Nfgrd9D1co9fmewBbyIen7tfYDICz+EJY8BdimH7MBObvXPo02nYOaOgee+A00V5Jq7oKh7C2Fkbhrvr6/ljNrvcG7aA1B+ZLfH7A/4PAbjR43kPutsTvZ8yp3+ewFQOaWD3LP9h6Ev7s5AVKXP+aWpWZPQceur7IG9W19e1ed9qm0JcaLjtweHHwYkvtrLuGGZHDOhiFOcR/oiR9BbgyYFTuSuFCywDsKIqYF9ziGlnSLEjriRf7rfw1PfOqLTTM+Z5fl8ZdZoftP6JahcBivsnPyG1jDHGYvRho/M6XYlx5XD5gIQ9qTzg5MnMHlENo1kcl342/h2rYUXvtephGFryGS4qoOM9hmBw7PTqCeLpsJDMFe/TFVTkB+XLkcrgyPnXsISPY6KrKmw4jmaghFuTX2Aa7zP8x/zKPuGsOxJAN5cVUlNc2e7Zm1lEwvW1XBbyjwu9r5O4YqH4elvQvVqNtW28AXPQlIJcXX4e2yZ9n0I1HNMwBk3GNa97+1mtWgMLj68vNv99ycmFmdxR2Auj0WOY7Zh/52pXIncB4ohL+6uLbMrkgL5B9Cw6m3ue7v7ZfdWVzZ2u09XNLSFOy123JFdLSG+7n0Zq3AC5ig7kktU3DNSvDx8+SzGDbMndriRe3MoQoEj9KV5tqAkMhMxFr/X4N3rj2fpL77AjFFdL45w+AGFPBOZTTDnAHjvdrBMGtoiHG0sQ5fNZmRRATlpPp5X
x7PeGsGi0Xa51qeuOYLXf3AM7+uD+GDUVbDsiajwugQCAQ5Q22F4u93hVvXbVHgsnsqlnO+Zz7E1j6Imn8mZRxxMSW4a76ccAzsXc1nTfZzHm/wlcgY/DH+L+fpQrAV3UfXpC1z+94V8/cGPAdv++XjjLupbQ5x8+zsUt63naLWYW8Pn86PRT6INLyx8gE01LcwxVtKcXsYWXczaFNtC+7rxkt25BMTdra8+sTiLK48e24P/jX2fic6A8u2R8who++/UI5H7gDHkxb0g04/XULzyeQWBsSeTs/1tdrx6JxWLX4Nduy9JsLqimS8aH/Nt9W+sF38E838Pge4F/7Q73+XQ37zOK0s2YwY7T/0PhE2WLl3EdGMDxoxLo7ZRx5rbieJG7lrb3xVgnDOjr6saIt1Rlp++x2JLB47MRmPwSfk3oGIZvPlrVP1mphqbMcafhFKKA0uymb8lwomhP1JRZN+80vwexg3LYurIHO4KnQXDpsCCO+Oi98Yty/ArE39Je/aOmyb4Uc5phD1p3Or7K9qfCWfdA8CsMfncUnsUesR0zo88T1j5OfBrN3PjqZP4cfAK1pnDGfbcRbzp/wE/rvopFXccT8PvJmI+MJeld1/AT72P8HLKDQRVKq+mz+XJ1SGWF3wR85MHqF/2CrONlXjGHAXAbe/X05xRRrGqpzV3AiQgRG7/e3qj3R9wUz0ryec+8wy26wK8mfveQtTJypD/jUz3e/nZ3Mnc9PwKLvGO5N9euMn3EDxjDxauzT+W1rJjKSsbTZWVw39X1lGa46Vw8bPc4H8GSyvaFmWSYTWx6aPnaBxxJNnFZZjpwygcMZpIejHVrRbBQBsV1dV8pflhjvMv4eCnba9+Z9oEtmUdzC5vMSqziLdW7uSrfGDPDJ96NunavsRTe1kcKTvNPr4kN41CxzMfNyyT+aur46r/9RXlBRlkpnj52kej+EPqSXz5vds5XT8OCjjQXu/0wJIcFqyzc+H9HW4Uc8bm89d3N/JI+RlcVHELNX//KoFRx7OkNR/vqmfBC8aI9tm57hPNb9+qYrP3q/zGez/G4ddCih31HT9pGE9/tp071MV8n8XszJzKUZNKOWoSnDSlmLl/TOHH3n8zI2UrJbSwdZeHJs8BlKXUkd/6Mcd47fTHpzyn8OA1X+DoW+dzxdZTeSHlXS5YfR2mMvDMuQIWVbG6sokbjbO4238PvlmJrU7kWl0HlQxOfZRkZlRBe67+7ZFzuTtyNmv3ooqj0DOGvLgDXHbkGKaOzOGO1wv49/g3qais4IMly5mlVnFF7Utk73oblkA+MCnmuJqyL3Br1g088VkFX/W9w3WBf1O64X68G+NXd3FjjWnAF72wKuVA7m05k5D2cYr1MQe2PkeasrMwvuCBNiMDjv4J5JRSAvztkpnMHtv1lPzuUErxr2/MZmxhJtlpXo4eX8iZ00r4x4ebKc7u+8kghqH400UzWLGzkTc2/pDAJj9z9BLeSjuB43LtVMorjhpDVoqX99fXclh5/Pe66pgD2LKrlft2zKHNOoMLNr1G4eaXKAXwQk3BTArzx3Y4Zizz3tnAPyMnkjXtDH5yzLHR946bWER5QTp3bhhOhecbzD7kS4xy3jugKJPzD5/Arz+4mKevOoIxpbmsWV7B5BHZmJbmsNvmk0kr6QQ5dsZULsxP56LZo3jkI/jPEc8T+fSfjBo5nDPLDuPJq3fx3JIdPPwBUHI0dx/+xYSu18zRedz71RmcOHlYL6/4vs3vzjmI5TsaeHLRNoIR1acVPYU9o3SC62X26KRKnQLciR2//k1rvcectZkzZ+qFCxfuaZceEwibPLhgE1k+zcTsEItXrkY1VzN3Sh7vravhsDnHUT7O9lS317fZtTxSvCzbuou2+irC9dvZvHkDmaEairN85GdngS+N8gPn4C+eSHMwwq7mECHTItMTYVtlDQtXruOEScWMPmACKan9m6e8dVcrxdmpXZZ87UuCEZNPN9cztiijxzeT
muYgq3Y0ULt1FZFdmznsgOGUTTsO5elcM2VtZRNPf7ad7544vtP4RCBsUtEQwFCK4Tnx39myNDsbA11O11++owGFIjvNS2FmCqk+D4GwSWVjgNG7WaGoqjGA32vETVgS9p5A2KSqMRgXzQt7j1Jqkda6y0Vo+1zclVIeYA1wMrAN+AS4UGu9YnfH9Ie4C4Ig7OvsSdz7I+ybBazTWm/QWoeAx4Cz+uFzBEEQhN3QH+JeAsSus7XNaYtDKXWVUmqhUmphdXXn1dIFQRCE3jNoQ9da63la65la65lFRXuefCMIgiD0jP4Q9+1AWcx2qdMmCIIgDBD9Ie6fAOOVUmOUUn7gAuC5fvgcQRAEYTf0eZ671jqilPo28Ap2KuQDWuvlff05giAIwu7pl0lMWuuXgJf649yCIAhC98hcYEEQhH2Qfpmh2uNOKFUNbO7l4YVATR92Z19BrsvukWvTNXJduiaZr8torXWX6YZJIe57g1Jq4e5maO3PyHXZPXJtukauS9cM1esitowgCMI+iIi7IAjCPsi+IO7zBrsDSYpcl90j16Zr5Lp0zZC8LkPecxcEQRA6sy9E7oIgCEIHRNwFQRD2QYa0uCulTlFKrVZKrVNK3TDY/RlIlFIPKKWqlFKfx7TlK6VeU0qtdX7mOe1KKXWXc52WKqVmDF7P+xelVJlSar5SaoVSarlS6jqnfb++NkqpVKXUx0qpJc51uclpH6OU+sj5/o879aBQSqU42+uc98sH9Qv0M0opj1LqM6XUC872kL8uQ1bcnRWf7gVOBaYAFyqlpgxurwaUvwOndGi7AXhDaz0eeMPZBvsajXf+XQX8eYD6OBhEgB9qracAc4Brnd+L/f3aBIETtNbTgOnAKUqpOcAtwO1a63FAHXCFs/8VQJ3Tfruz377MdcDKmO2hf1201kPyH3A48ErM9o3AjYPdrwG+BuXA5zHbq4ERzusRwGrn9X3YSx122m9f/wc8i73ko1yb9u+YDnwKzMaeeel12qN/U9iF/w53Xnud/dRg972frkcp9g3/BOAFQO0L12XIRu4kuOLTfkax1nqn87oCKHZe75fXynlkPgT4CLk2rvWwGKgCXgPWA/Va64izS+x3j14X5/0GoGBAOzxw3AFcD1jOdgH7wHUZyuIu7AFthxb7bZ6rUioT+A/wPa11Y+x7++u10VqbWuvp2JHqLGDS4PZo8FFKnQ5Uaa0XDXZf+pqhLO6y4lNnKpVSIwCcn1VO+351rZRSPmxhf0Rr/ZTTLNfGQWtdD8zHthtylVJu6e/Y7x69Ls77OUDtwPZ0QDgSOFMptQl4DNuauZN94LoMZXGXFZ868xxwqfP6Umy/2W2/xMkMmQM0xFgU+xRKKQXcD6zUWt8W89Z+fW2UUkVKqVzndRr2OMRKbJE/z9mt43Vxr9d5wJvOE88+hdb6Rq11qda6HFtD3tRaX8S+cF0G2/Tfy4GQ04A12N7hzwa7PwP83R8FdgJhbE/wCmzv7w1gLfA6kO/sq7Azi9YDy4CZg93/frwuR2FbLkuBxc6/0/b3awMcDHzmXJfPgf912scCHwPrgCeAFKc91dle57w/drC/wwBco+OAF/aV6yLlBwRBEPZBhrItIwiCIOwGEXdBEIR9EBF3QRCEfRARd0EQhH0QEXdBEIR9EBF3QRCEfRARd0EQhH2Q/we5TYskpwNSKgAAAABJRU5ErkJggg==\n",
      "text/plain": [
       "<Figure size 432x288 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "\n",
    "# Trailing moving average of `rewards`: every point is the mean of the current\n",
    "# value and up to AVG_WINDOW - 1 values before it (fewer at the very start,\n",
    "# where the slice is clamped to index 0).\n",
    "# NOTE(review): this cell used to be labelled a 50-interval average while the\n",
    "# code averaged 5 points. The 5-point behaviour is kept; set AVG_WINDOW = 50\n",
    "# if the longer window was what was intended.\n",
    "AVG_WINDOW = 5\n",
    "average_reward = [\n",
    "    np.average(rewards[max(0, idx - AVG_WINDOW + 1):idx + 1])\n",
    "    for idx in range(len(rewards))\n",
    "]\n",
    "\n",
    "# Raw series first, smoothed series on top; labels make the figure readable\n",
    "# without the surrounding code.\n",
    "plt.plot(rewards, label=\"reward\")\n",
    "plt.plot(average_reward, label=f\"{AVG_WINDOW}-point moving average\")\n",
    "plt.legend()\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9f18bae5",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "44b0354e",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "58e2db1b",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8385f8b3",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c1d27da3",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "fb4df6e4",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
