{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "67576132",
   "metadata": {},
   "outputs": [],
   "source": [
    "from math import inf\n",
    "import numpy as np\n",
    "import scipy\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "import torch.optim as optim\n",
    "import gymnasium as gym\n",
    "import pandas as pd\n",
    "from datetime import datetime\n",
    "from sklearn.base import BaseEstimator\n",
    "from realkd.boosting import WeightUpdateMethod\n",
    "from pandas import qcut\n",
    "from realkd.rules import SquaredLoss, AdditiveRuleEnsemble, Rule\n",
    "from realkd.search import Context\n",
    "from typing import Optional\n",
    "import warnings\n",
    "import random"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "8b8f01e2",
   "metadata": {},
   "outputs": [],
   "source": [
    "statespace_size_g = 4\n",
    "np.random.seed(576757)\n",
    "torch.manual_seed(34581035)\n",
    "number_rules=16\n",
    "regular = 50.0\n",
    "column_names=['x1','x2','x3-x1','x4-x2', 'c']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "24f75485",
   "metadata": {},
   "outputs": [],
   "source": [
    "def same_location(location1, location2):\n",
    "    # Check if either location is None\n",
    "    if location1 is None or location2 is None:\n",
    "        return False\n",
    "\n",
    "    # Compare the locations\n",
    "    return location1[0] == location2[0] and location1[1] == location2[1]\n",
    "\n",
    "class GridWorldEnv(gym.Env):\n",
    "    \"\"\"\n",
    "    Square grid world in which an agent has to reach an item and then carry it to a target.\n",
    "\n",
    "    The target is always the cell ``[size - 1, size - 1]``; on every reset the agent and the\n",
    "    item are placed on random cells that differ from the target and from each other.\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, size):\n",
    "        \"\"\"\n",
    "        :param size: Side length of the square grid (at least 2).\n",
    "        :raises ValueError: If ``size`` is below 2, because the target, the agent and the item\n",
    "                            could then not be placed on three different cells.\n",
    "        :functionality: Stores the grid size, defines the action space, calls reset to place\n",
    "                        the target, agent and item, and finally defines the observation space.\n",
    "        \"\"\"\n",
    "        if size < 2:\n",
    "            # Without this guard generate_random_location would retry forever.\n",
    "            raise ValueError(f'size must be at least 2, got {size}')\n",
    "        self.item_location = None\n",
    "        self.agent_location = None\n",
    "        self.size = size\n",
    "        self.target_location = None\n",
    "        self.num_steps = 0\n",
    "        self.carry_item = 0\n",
    "        # Four discrete actions; step() defines what each index does.\n",
    "        self.action_space = gym.spaces.Discrete(4)\n",
    "        # NOTE(review): this table is never consulted by step(), and its index -> direction\n",
    "        # assignment differs from the moves step() performs. Kept unchanged in case other\n",
    "        # cells read it.\n",
    "        self._action_to_direction = {\n",
    "            3: np.array([1, 0]),  # right\n",
    "            0: np.array([0, 1]),  # up\n",
    "            2: np.array([-1, 0]),  # left\n",
    "            1: np.array([0, -1]),  # down\n",
    "        }\n",
    "        self.reset()\n",
    "        # NOTE(review): the third and fourth observation components are item-minus-agent\n",
    "        # offsets (see _get_obs) and can be negative, which Discrete(size) does not cover.\n",
    "        self.observation_space = gym.spaces.Tuple(\n",
    "            [gym.spaces.Discrete(self.size),\n",
    "             gym.spaces.Discrete(self.size),\n",
    "             gym.spaces.Discrete(self.size),\n",
    "             gym.spaces.Discrete(self.size),\n",
    "             gym.spaces.Discrete(2)]\n",
    "        )\n",
    "\n",
    "    def _get_obs(self):\n",
    "        \"\"\"\n",
    "        :return: Array ``[agent[0], agent[1], item[0] - agent[0], item[1] - agent[1], carry_item]``.\n",
    "        \"\"\"\n",
    "        return np.array([self.agent_location[0], self.agent_location[1],\n",
    "                         self.item_location[0] - self.agent_location[0],\n",
    "                         self.item_location[1] - self.agent_location[1],\n",
    "                         self.carry_item])\n",
    "\n",
    "    def _get_info(self):\n",
    "        \"\"\"\n",
    "        :return: Dict with the key 'distance'. While the item is not carried this is the L1\n",
    "                 distance agent -> item plus item -> target; while it is carried it is the L1\n",
    "                 distance agent -> target.\n",
    "        \"\"\"\n",
    "        agent = np.array(self.agent_location)\n",
    "        target = np.array(self.target_location)\n",
    "        if self.carry_item:\n",
    "            return {\"distance\": np.linalg.norm(agent - target, ord=1)}\n",
    "        item = np.array(self.item_location)\n",
    "        return {\n",
    "            \"distance\": np.linalg.norm(agent - item, ord=1) + np.linalg.norm(target - item, ord=1)\n",
    "        }\n",
    "\n",
    "    def reset(self, seed: Optional[int] = None, options: Optional[dict] = None):\n",
    "        \"\"\"\n",
    "        :param seed: Optional seed. When given it seeds the environment's own generator and\n",
    "                     the global ``random`` / ``np.random`` generators used for placement.\n",
    "        :param options: Not used; accepted to match the Gymnasium reset signature.\n",
    "        :return: Tuple ``(observation, info)`` of the new episode.\n",
    "        :functionality: Drops any carried item, puts the target in the corner\n",
    "                        ``[size - 1, size - 1]`` and draws new, non-overlapping random\n",
    "                        locations for the agent and the item.\n",
    "        \"\"\"\n",
    "        # Let gym.Env perform its own seeding bookkeeping, as the Gymnasium API expects.\n",
    "        super().reset(seed=seed)\n",
    "        if seed is not None:\n",
    "            random.seed(seed)\n",
    "            np.random.seed(seed)\n",
    "        self.carry_item = 0\n",
    "        self.set_target_location([self.size - 1, self.size - 1])\n",
    "        self.set_agent_location(self.generate_random_location([self.target_location]))\n",
    "        self.set_item_location(self.generate_random_location([self.target_location, self.agent_location]))\n",
    "        return self._get_obs(), self._get_info()\n",
    "\n",
    "    def set_target_location(self, new_location):\n",
    "        \"\"\"\n",
    "        :param new_location: The new location for the target.\n",
    "        :return: None\n",
    "        :functionality: Updates the target's location to the new location.\n",
    "        \"\"\"\n",
    "        self.target_location = new_location\n",
    "\n",
    "    def set_agent_location(self, new_location):\n",
    "        \"\"\"\n",
    "        :param new_location: The new location for the agent.\n",
    "        :return: None\n",
    "        :functionality: Updates the agent's location to the new location.\n",
    "        \"\"\"\n",
    "        self.agent_location = new_location\n",
    "\n",
    "    def set_item_location(self, new_location):\n",
    "        \"\"\"\n",
    "        :param new_location: The new location for the item.\n",
    "        :return: None\n",
    "        :functionality: Updates the item's location to the new location.\n",
    "        \"\"\"\n",
    "        self.item_location = new_location\n",
    "\n",
    "    def generate_random_location(self, exclude=()):\n",
    "        \"\"\"\n",
    "        :param exclude: Locations that must not be returned.\n",
    "        :return: A new random location as a list [x, y] that matches no entry of exclude.\n",
    "        :functionality: Draws locations from the global NumPy generator until one is found\n",
    "                        that does not coincide with any excluded location.\n",
    "        \"\"\"\n",
    "\n",
    "        def location_exist(new_location):\n",
    "            # True when the candidate coincides with any excluded location.\n",
    "            for loc in exclude:\n",
    "                if same_location(loc, new_location):\n",
    "                    return True\n",
    "            return False\n",
    "\n",
    "        location = [np.random.randint(0, self.size), np.random.randint(0, self.size)]\n",
    "        # Rejection sampling: redraw until the candidate is not excluded.\n",
    "        while location_exist(location):\n",
    "            location = [np.random.randint(0, self.size), np.random.randint(0, self.size)]\n",
    "\n",
    "        return location\n",
    "\n",
    "    def step(self, action):\n",
    "        \"\"\"\n",
    "        Move the agent by one cell and evaluate the reward.\n",
    "\n",
    "        :param action: 0 decreases and 1 increases the first coordinate, 2 decreases and 3\n",
    "                       increases the second coordinate. A move that would leave the grid\n",
    "                       keeps the agent where it is.\n",
    "        :return: Tuple ``(observation, reward, terminated, truncated, info)``; truncated is\n",
    "                 always False.\n",
    "        \"\"\"\n",
    "        if action == 0 and self.agent_location[0] > 0:\n",
    "            self.agent_location[0] -= 1\n",
    "        elif action == 1 and self.agent_location[0] < self.size - 1:\n",
    "            self.agent_location[0] += 1\n",
    "        elif action == 2 and self.agent_location[1] > 0:\n",
    "            self.agent_location[1] -= 1\n",
    "        elif action == 3 and self.agent_location[1] < self.size - 1:\n",
    "            self.agent_location[1] += 1\n",
    "        reward, terminated = self.get_reward()\n",
    "        info = self._get_info()\n",
    "        return self._get_obs(), reward, terminated, False, info\n",
    "\n",
    "    def get_reward(self):\n",
    "        \"\"\"\n",
    "        :return: Tuple ``(reward, done)``.\n",
    "        :functionality: Gives 20 and sets carry_item when the agent stands on the item without\n",
    "                        carrying it; gives 20, clears carry_item and reports done when the\n",
    "                        agent stands on the target while carrying; gives -1 otherwise.\n",
    "        \"\"\"\n",
    "        done = False\n",
    "        if same_location(self.agent_location, self.item_location) and not self.carry_item:\n",
    "            # Pick-up: the item is now carried.\n",
    "            reward = 20\n",
    "            self.carry_item = 1\n",
    "        elif same_location(self.agent_location, self.target_location) and self.carry_item:\n",
    "            # Delivery: the episode ends.\n",
    "            reward = 20\n",
    "            self.carry_item = 0\n",
    "            done = True\n",
    "        else:\n",
    "            # Every other step costs one point.\n",
    "            reward = -1\n",
    "\n",
    "        return reward, done\n",
    "        \n",
    "# Make the environment constructible through gym.make under this id.\n",
    "gym.register(id=\"gymnasium_env/GridWorld-v0\", entry_point=GridWorldEnv)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "db545637",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "<class 'gymnasium.wrappers.common.OrderEnforcing'>\n"
     ]
    }
   ],
   "source": [
    "# Build the registered grid world with the configured side length.\n",
    "env = gym.make(\"gymnasium_env/GridWorld-v0\", size=statespace_size_g)\n",
    "# Use the GPU when PyTorch can see one, otherwise stay on the CPU.\n",
    "device = torch.device(\"cuda\") if torch.cuda.is_available() else torch.device(\"cpu\")\n",
    "print(device)\n",
    "print(type(env))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "7aa6c889",
   "metadata": {},
   "outputs": [],
   "source": [
    "# column_names = ['cp', 'cv', 'pa', 'pav']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "84732b72",
   "metadata": {},
   "outputs": [],
   "source": [
    "def orthonormalization(Q):\n",
    "    n, k = Q.shape\n",
    "    O = np.zeros(shape=(n, k))\n",
    "    q = Q[:, 0]\n",
    "    O[:, 0] = q / (norm(q) + 1e-6)\n",
    "    for i in range(1, k):\n",
    "        O_i = O[:, :i]\n",
    "        q = Q[:, i]\n",
    "        q_orth = q - O_i.dot(O_i.T.dot(q))\n",
    "        O[:, i] = q_orth / (norm(q_orth) + 1e-6)\n",
    "    return O"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "973f1f9b",
   "metadata": {},
   "outputs": [],
   "source": [
    "def softmax1(action, values, other_values, location):\n",
    "    all_values = np.insert(other_values, location, values, axis=1)\n",
    "    exps = np.exp(all_values)\n",
    "    res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
    "    return res\n",
    "\n",
    "def norm(x):\n",
    "    \"\"\"\n",
    "    Calculate the L-2 norm of a vector\n",
    "    :param x: the vector whose L-2 norm is to be calculated\n",
    "    :return: the L-2 norm of the vector\n",
    "    \"\"\"\n",
    "    return (x * x).sum() ** 0.5\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "5b0af6ac",
   "metadata": {},
   "outputs": [],
   "source": [
    "class PiLoss:\n",
    "    _instance = None\n",
    "\n",
    "    def __new__(cls):\n",
    "        if cls._instance is None:\n",
    "            cls._instance = super(PiLoss, cls).__new__(cls)\n",
    "        return cls._instance\n",
    "\n",
    "    @staticmethod\n",
    "    def __call__(action, values, advantage, other_values, current):\n",
    "        \"\"\"\n",
    "        :param action: the action chosen\n",
    "        :param values: the values provided by current model\n",
    "        :param other_values: the output by other models\n",
    "        :param current: the action represented by the current model\n",
    "        \"\"\"\n",
    "        sm = softmax1(action, values, other_values, current)+1e-6\n",
    "        return -np.log(sm) * advantage\n",
    "\n",
    "    @staticmethod\n",
    "    def g(action, values, advantage, other_values, current):\n",
    "        return np.where(action == current, -advantage * (1 - softmax1(current, values, other_values, current)),\n",
    "                        advantage * softmax1(current, values, other_values, current))\n",
    "\n",
    "    @staticmethod\n",
    "    def h(action, values, advantage, other_values, current):\n",
    "        sm = softmax1(current, values, other_values, current)\n",
    "        return advantage * sm * (1 - sm)\n",
    "\n",
    "    @staticmethod\n",
    "    def __repr__():\n",
    "        return 'pi_loss'\n",
    "\n",
    "    @staticmethod\n",
    "    def __str__():\n",
    "        return 'pi_loss'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "67942365",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Registry that maps a loss name to its loss object.\n",
    "loss_functions = {'pi_loss': PiLoss()}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "693287f4",
   "metadata": {},
   "outputs": [],
   "source": [
    "def loss_function(loss):\n",
    "    \"\"\"Provides loss functions from string representation.\n",
    "\n",
    "    :param loss: string identifier of loss function loss function\n",
    "    :return: loss function matching corresponding to input string (or unchanged input if was already loss function)\n",
    "    \"\"\"\n",
    "    if callable(loss):\n",
    "        return loss\n",
    "    else:\n",
    "        return loss_functions[loss]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "ae0af97c",
   "metadata": {},
   "outputs": [],
   "source": [
    "def calc_risk(loss, action, rules, states, reg, advantage, others, current):\n",
    "    weights = np.array([rule.y for rule in rules])\n",
    "    risk = sum(loss(action, rules(states), advantage, others, current)) + reg * sum(weights * weights) / 2\n",
    "    return risk"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "d06dc96b",
   "metadata": {},
   "outputs": [],
   "source": [
    "class FullyCorrectiveA2C:\n",
    "    \"\"\"Fully corrective weight update: re-optimises the weights of all rules of an ensemble together.\"\"\"\n",
    "\n",
    "    def __init__(self, loss='pi_loss', reg=regular, solver='L-BFGS-B'):\n",
    "        \"\"\"\n",
    "        :param loss: loss object, or the name of a loss known to loss_function\n",
    "        :param reg: strength of the squared-weight penalty\n",
    "        :param solver: 'GD', 'Line', or a method name understood by scipy.optimize.minimize\n",
    "        \"\"\"\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        self.solver = solver\n",
    "\n",
    "    @staticmethod\n",
    "    def get_risk(loss, action, q_mat, reg, advantage, others, current):\n",
    "        \"\"\"Return the objective: summed loss of the scores q_mat.dot(weights) plus reg * |weights|^2 / 2.\"\"\"\n",
    "        def sum_loss(weights):\n",
    "            return sum(loss(action, q_mat.dot(weights), advantage, others, current)) + reg * sum(weights * weights) / 2\n",
    "\n",
    "        return sum_loss\n",
    "\n",
    "    @staticmethod\n",
    "    def get_gradient(g, action, q_mat, reg, advantage, other, current):\n",
    "        \"\"\"Return the gradient of the objective: q_mat.T.dot(g(...)) + reg * weights.\"\"\"\n",
    "        def gradient(weights):\n",
    "            grad_vec = g(action, q_mat.dot(weights), advantage, other, current)\n",
    "            return q_mat.T.dot(grad_vec) + reg * weights\n",
    "\n",
    "        return gradient\n",
    "\n",
    "    @staticmethod\n",
    "    def get_hessian(h, action, q_mat, reg, advantage, other, current):\n",
    "        \"\"\"Return the Hessian of the objective: q_mat.T diag(h(...)) q_mat + reg * identity.\"\"\"\n",
    "        def hessian(weights):\n",
    "            h_vec = np.asarray(h(action, q_mat.dot(weights), advantage, other, current))\n",
    "            # Scale the columns of q_mat.T by h_vec instead of materialising the dense\n",
    "            # n x n matrix diag(h_vec); the product is the same.\n",
    "            return (q_mat.T * h_vec).dot(q_mat) + reg * np.eye(len(weights))\n",
    "\n",
    "        return hessian\n",
    "\n",
    "    def calc_weight(self, data, action, rules, advantage, other, current):\n",
    "        \"\"\"\n",
    "        :param data: data set on which every rule query is evaluated\n",
    "        :param action: chosen actions; converted to an array\n",
    "        :param rules: rule ensemble; rules[i].q(data) gives column i of the design matrix and\n",
    "                      rules[i].y the starting weight of rule i\n",
    "        :param advantage: advantage values forwarded to the loss\n",
    "        :param other: scores of the other models, forwarded to the loss\n",
    "        :param current: index of the action scored by this ensemble\n",
    "        :return: array with the re-optimised weight of every rule\n",
    "        \"\"\"\n",
    "        # Resolve here as well: self.loss may have been overwritten with a registry key.\n",
    "        loss = loss_function(self.loss)\n",
    "        y = np.array(action)\n",
    "        q_mat = np.column_stack(\n",
    "            [rules[i].q(data) + np.zeros(len(data)) for i in range(len(rules))])\n",
    "        sum_loss = self.get_risk(loss, y, q_mat, self.reg, advantage, other, current)\n",
    "        gradient = self.get_gradient(loss.g, y, q_mat, self.reg, advantage, other, current)\n",
    "        # Every solver starts from the current rule weights.\n",
    "        w = np.array([r.y for r in rules])\n",
    "        # NOTE(review): GoldenRatioSearch is not defined in the visible part of this\n",
    "        # notebook; the 'GD' and 'Line' solvers need it to exist at call time.\n",
    "        if self.solver == 'GD':  # Gradient descent\n",
    "            # Presumably chosen so that old_w differs from w and the loop is entered.\n",
    "            old_w = np.ones_like(w) * (1.0 if len(w) - sum(w) > 1e-5 else 2.0)\n",
    "            i = 0\n",
    "            while norm(old_w - w) > 1e-3 and i < 50:\n",
    "                old_w = np.array(w)\n",
    "                grad = gradient(w)\n",
    "                grad_norm = norm(grad)\n",
    "                if grad_norm == 0:\n",
    "                    break\n",
    "                p = -grad / grad_norm\n",
    "                w += GoldenRatioSearch(sum_loss, old_w, p, gradient).run() * p\n",
    "                i += 1\n",
    "        elif self.solver == 'Line':\n",
    "            # One line search along the normalised negative gradient.\n",
    "            grad = gradient(w)\n",
    "            grad_norm = norm(grad)\n",
    "            if grad_norm != 0:\n",
    "                p = -grad / grad_norm\n",
    "                distance = GoldenRatioSearch(sum_loss, w, p, gradient).run()\n",
    "                w += distance * p\n",
    "        else:\n",
    "            # get_hessian is not wired in here; pass hess=... for solvers that accept one.\n",
    "            w = scipy.optimize.minimize(sum_loss, w, method=self.solver, jac=gradient,\n",
    "                                        options={'disp': False}).x\n",
    "\n",
    "        return w"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "2d0c04a8",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ObjectFunction:\n",
    "    \"\"\"Base class of search objectives: keeps gradient statistics and data in one common sorted order.\"\"\"\n",
    "\n",
    "    def __init__(self, data, target, predictions, loss, reg, advantage, other_values, current, rules=None):\n",
    "        \"\"\"\n",
    "        :param data: DataFrame of inputs (row-indexed with ``.iloc``)\n",
    "        :param target: Series of targets (row-indexed with ``.iloc``)\n",
    "        :param predictions: current scores; zeros shaped like ``target`` when None\n",
    "        :param loss: loss object or name, resolved through loss_function\n",
    "        :param reg: regularisation strength, stored as given\n",
    "        :param advantage: forwarded to the loss derivatives\n",
    "        :param other_values: forwarded to the loss derivatives\n",
    "        :param current: forwarded to the loss derivatives\n",
    "        :param rules: accepted but not used here\n",
    "        \"\"\"\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        if predictions is None:\n",
    "            predictions = np.zeros_like(target)\n",
    "        grad = np.array(self.loss.g(target, predictions, advantage, other_values, current))\n",
    "        hess = np.array(self.loss.h(target, predictions, advantage, other_values, current)) + 1e-6\n",
    "        # Rows are arranged by decreasing gradient / hessian ratio.\n",
    "        ranking = np.argsort(grad / hess)[::-1]\n",
    "        self.g = grad[ranking]\n",
    "        self.h = hess[ranking]\n",
    "        self.data = data.iloc[ranking].reset_index(drop=True)\n",
    "        self.target = target.iloc[ranking].reset_index(drop=True)\n",
    "        self.n = len(target)\n",
    "\n",
    "    def __call__(self, ext):\n",
    "        \"\"\"Objective value of an extension; to be provided by subclasses.\"\"\"\n",
    "        raise NotImplementedError()\n",
    "\n",
    "    def bound(self, ext):\n",
    "        \"\"\"Bound on the objective value; to be provided by subclasses.\"\"\"\n",
    "        raise NotImplementedError()\n",
    "\n",
    "    def search(self, method='greedy', verbose=False, **search_params):\n",
    "        \"\"\"Build a realkd search context from the sorted data and run the chosen search method.\n",
    "\n",
    "        :param method: key into realkd's ``search_methods``\n",
    "        :param verbose: forwarded to the search; values >= 2 also print the attribute count\n",
    "        :param search_params: forwarded to ``Context.from_df`` and to the search method\n",
    "        :return: whatever the search's ``run()`` returns\n",
    "        \"\"\"\n",
    "        from realkd.search import search_methods\n",
    "        ctx = Context.from_df(self.data, **search_params)\n",
    "        if verbose >= 2:\n",
    "            print(f'Created search context with {len(ctx.attributes)} attributes')\n",
    "        searcher = search_methods[method](ctx, self, self.bound, verbose=verbose, **search_params)\n",
    "        return searcher.run()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "eaec4413",
   "metadata": {},
   "outputs": [],
   "source": [
    "class OrthogonalBoostingObjective(ObjectFunction):\n",
    "    \"\"\"Objective scoring an extension by |summed gradient| relative to the norm of the part of its\n",
    "    indicator vector that is orthogonal to the basis of the rules selected so far.\"\"\"\n",
    "\n",
    "    def __init__(self, data, target, advantage, other_values, current, predictions=None, loss=SquaredLoss, reg=regular,\n",
    "                 rules=None,\n",
    "                 epsilon=1e-4, **kwargs):\n",
    "        \"\"\"\n",
    "        :param data: DataFrame of inputs\n",
    "        :param target: Series of targets\n",
    "        :param advantage: forwarded to the loss derivatives\n",
    "        :param other_values: forwarded to the loss derivatives\n",
    "        :param current: forwarded to the loss derivatives\n",
    "        :param predictions: current scores; zeros shaped like ``target`` when None\n",
    "        :param loss: loss object or name, resolved through loss_function\n",
    "        :param reg: regularisation strength, stored as given\n",
    "        :param rules: rules selected so far; None is treated as no rules\n",
    "        :param epsilon: added to the denominator of the objective\n",
    "        :param kwargs: must contain ``orth_basis`` (one row per data row) when rules is not empty\n",
    "        \"\"\"\n",
    "        super().__init__(data, target, predictions, loss, reg, advantage, other_values, current, rules)\n",
    "        self.rules = [] if rules is None else rules\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        self.epsilon = epsilon\n",
    "        predictions = np.zeros_like(\n",
    "            target) if predictions is None else predictions\n",
    "        g = np.array(self.loss.g(target, predictions, advantage, other_values, current))\n",
    "        h = np.array(self.loss.h(target, predictions, advantage, other_values, current)) + 1e-6\n",
    "        self.n = len(target)\n",
    "        # Rows are arranged by decreasing gradient.\n",
    "        order = np.argsort(g)[::-1]\n",
    "        self.g = g[order]\n",
    "        # Re-sort h with the same order: the base class sorted it by g / h, which would leave\n",
    "        # self.h misaligned with self.g and self.data.\n",
    "        self.h = h[order]\n",
    "        self.data = data.iloc[order].reset_index(drop=True)\n",
    "        self.target = target.iloc[order].reset_index(drop=True)\n",
    "        # Test the normalised self.rules so that the default rules=None does not break len().\n",
    "        if len(self.rules) != 0:\n",
    "            orth_basis = kwargs['orth_basis']\n",
    "            self.orth_basis = orth_basis[order]\n",
    "            # Remove from g its projection onto the basis columns. The parentheses avoid\n",
    "            # forming the n x n matrix basis @ basis.T.\n",
    "            self.g = self.g - self.orth_basis @ (self.orth_basis.T @ self.g)\n",
    "        else:\n",
    "            self.orth_basis = np.zeros(self.n)\n",
    "\n",
    "    def __call__(self, ext):\n",
    "        \"\"\"\n",
    "        :param ext: row indices (into the sorted data) covered by the candidate\n",
    "        :return: -inf for an empty extension; without rules |sum g| / sqrt(sum h); otherwise\n",
    "                 |sum g| / (orthogonal norm + epsilon), or 0 when that norm is at most 1e-4\n",
    "        \"\"\"\n",
    "        if len(ext) == 0:\n",
    "            return -inf\n",
    "        g_q = self.g[ext]\n",
    "        if len(self.rules) == 0:\n",
    "            h_q = self.h[ext]\n",
    "            return abs(g_q.sum()) / np.sqrt(h_q.sum())\n",
    "        length = self.fast_orth_norm(ext)\n",
    "        if length > 1e-4:\n",
    "            obj = abs(g_q.sum()) / (length + self.epsilon)\n",
    "        else:\n",
    "            obj = 0\n",
    "        return obj\n",
    "\n",
    "    def fast_orth_norm(self, ext):\n",
    "        \"\"\"Return sqrt(|len(ext) - sum_i (sum of basis column i over ext) ** 2|).\n",
    "\n",
    "        Assuming the basis columns are orthonormal, this is the norm of the indicator vector\n",
    "        of ``ext`` after removing its projection onto the basis.\n",
    "        \"\"\"\n",
    "        deltas = self.orth_basis[ext]\n",
    "        length = len(ext)\n",
    "        okqi = abs(np.sum(deltas, axis=0))\n",
    "        q_para_norms = (okqi ** 2).sum()\n",
    "        q_orth_norms_sq = np.abs(length - q_para_norms)\n",
    "        return np.sqrt(q_orth_norms_sq)\n",
    "\n",
    "    def fast_para_norms_prefix(self, ext):\n",
    "        \"\"\"Same quantity as fast_orth_norm, computed for every prefix of ``ext`` at once.\"\"\"\n",
    "        deltas = self.orth_basis[ext]\n",
    "        length = len(ext)\n",
    "        okqi = np.cumsum(deltas, axis=0)\n",
    "        q_para_norms = (okqi ** 2).sum(axis=1)\n",
    "        q_orth_norms_sq = np.abs(np.arange(1, length + 1) - q_para_norms)\n",
    "        q_orth_norms = np.sqrt(q_orth_norms_sq)\n",
    "        return q_orth_norms\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "626cceb7",
   "metadata": {},
   "outputs": [],
   "source": [
    "class GeneralRuleBoostingEstimator(BaseEstimator):\n",
    "    \"\"\"Boosting loop that alternates between searching a new rule and re-fitting all rule weights.\"\"\"\n",
    "\n",
    "    def __init__(self, num_rules, objective_function, weight_update_method, loss='squared', reg=regular,\n",
    "                 search='greedy', max_col_attr=10,\n",
    "                 search_params=None, verbose=False):\n",
    "        \"\"\"\n",
    "        :param num_rules: number of rules at which fit stops adding rules\n",
    "        :param objective_function: objective class instantiated once per boosting round\n",
    "        :param weight_update_method: object whose calc_weight re-fits the rule weights\n",
    "        :param loss: loss object or name, resolved through loss_function\n",
    "                     (NOTE(review): the default 'squared' is not among the losses registered\n",
    "                     in the visible part of this notebook)\n",
    "        :param reg: regularisation strength, also written to weight_update_method\n",
    "        :param search: name of the realkd search method\n",
    "        :param max_col_attr: used to build the default search_params\n",
    "        :param search_params: keyword arguments for the search; defaults are built when None\n",
    "        :param verbose: when true, every new rule is printed\n",
    "        \"\"\"\n",
    "        if search_params is None:\n",
    "            search_params = {'order': 'bestboundfirst', 'apx': 1.0, 'max_depth': None, 'discretization': qcut,\n",
    "                             'max_col_attr': max_col_attr}\n",
    "        self.num_rules = num_rules\n",
    "        self.num_components = 500\n",
    "        self.objective = objective_function\n",
    "        self.objective_function = objective_function\n",
    "        self.max_col_attr = max_col_attr\n",
    "        self.weight_update_method = weight_update_method\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        # Hand over the resolved loss object: calc_weight reads its g attribute, which a\n",
    "        # plain name string does not have.\n",
    "        self.weight_update_method.loss = self.loss\n",
    "        self.weight_update_method.reg = reg\n",
    "        self.verbose = verbose\n",
    "        self.search = search\n",
    "        self.rules_ = AdditiveRuleEnsemble([])\n",
    "        self.search_params = search_params\n",
    "        self.history = []\n",
    "        self.time = []\n",
    "\n",
    "    def set_reg(self, reg):\n",
    "        \"\"\"Set the regularisation strength on the estimator, the objective and the weight updater.\"\"\"\n",
    "        self.reg = reg\n",
    "        self.objective.reg = reg\n",
    "        self.weight_update_method.reg = reg\n",
    "\n",
    "    def fit(self, data, target, advantage, other_values, current, has_origin_rules=False, verbose=False):\n",
    "        \"\"\"\n",
    "        :param data: DataFrame of inputs\n",
    "        :param target: Series of targets\n",
    "        :param advantage: forwarded to the objective and the weight update\n",
    "        :param other_values: forwarded to the objective and the weight update\n",
    "        :param current: forwarded to the objective and the weight update\n",
    "        :param has_origin_rules: when False the ensemble, history and timings are cleared first;\n",
    "                                 when True the existing rules are kept and extended\n",
    "        :param verbose: forwarded to the rule search\n",
    "        :return: self\n",
    "        \"\"\"\n",
    "        if not has_origin_rules:\n",
    "            self.history = []\n",
    "            self.time = []\n",
    "            self.rules_.members = []\n",
    "            orth_basis = np.array([])\n",
    "        else:\n",
    "            # Rebuild the orthonormal basis from the outputs of the rules already present.\n",
    "            q_mat = np.column_stack(\n",
    "                [self.rules_[i].q(data) + np.zeros(len(data)) for i in range(len(self.rules_))])\n",
    "            orth_basis = orthonormalization(q_mat)\n",
    "        num_components = 0\n",
    "        while len(self.rules_) < self.num_rules and num_components < self.num_components:\n",
    "            start_time = datetime.now()\n",
    "            # Search for a rule\n",
    "            scores = self.rules_(data)\n",
    "            obj = self.objective(data, target, advantage, other_values, current, predictions=scores,\n",
    "                                 loss=self.loss, reg=self.reg, rules=self.rules_, orth_basis=orth_basis)\n",
    "            q = obj.search(method=self.search, verbose=verbose,\n",
    "                           **self.search_params)\n",
    "            if hasattr(self.objective, 'opt_weight') and callable(getattr(self.objective, 'opt_weight')):\n",
    "                y = obj.opt_weight(q)\n",
    "            else:\n",
    "                y = 1.0  # np.random.random()\n",
    "            q_vec = q(data)\n",
    "            num_components += (1 + len(q))\n",
    "            if len(orth_basis) == 0:\n",
    "                # Same 1e-6 guard as every other normalisation in this file, so a query that\n",
    "                # selects no row does not divide by zero.\n",
    "                basis = q_vec / (norm(q_vec) + 1e-6)\n",
    "                orth_basis = np.array([basis]).T\n",
    "            else:\n",
    "                # Keep only the part of the new query vector orthogonal to the current basis.\n",
    "                basis = q_vec - orth_basis.dot(orth_basis.T.dot(q_vec))\n",
    "                basis = basis / (norm(basis) + 1e-6)\n",
    "                orth_basis = np.hstack((orth_basis, np.array([basis]).T))\n",
    "            rule = Rule(q, y)\n",
    "            if self.verbose:\n",
    "                print(rule)\n",
    "            self.rules_.append(rule)\n",
    "            # Calculate weights\n",
    "            weights = self.weight_update_method.calc_weight(\n",
    "                data, target, self.rules_, advantage, other_values, current)\n",
    "            for i in range(len(self.rules_)):\n",
    "                self.rules_[i].y = weights[i]\n",
    "            # Record a snapshot of the ensemble after this round.\n",
    "            self.history.append(AdditiveRuleEnsemble(\n",
    "                [Rule(q=rule.q, y=rule.y) for rule in self.rules_.members]))\n",
    "            end_time = datetime.now()\n",
    "            self.time.append(str(end_time - start_time))\n",
    "        return self\n",
    "\n",
    "    def predict(self, data):\n",
    "        \"\"\"Map the ensemble scores through the loss's ``predictions`` method (the loss must provide one).\"\"\"\n",
    "        loss = loss_function(self.loss)\n",
    "        return loss.predictions(self.rules_(data))\n",
    "\n",
    "    def decision_function(self, data):\n",
    "        \"\"\"Return the raw ensemble scores for ``data``.\"\"\"\n",
    "        return self.rules_(data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "b50ce787",
   "metadata": {},
   "outputs": [],
   "source": [
    "# class Actor(nn.Module):\n",
    "#     def __init__(self, action_space, node=16):\n",
    "#         super(Actor, self).__init__()\n",
    "#         self.fc1 = nn.Linear(4, node)  \n",
    "# #         self.fc1_ = nn.Linear(node, node)\n",
    "#         self.fc2 = nn.Linear(node, action_space)\n",
    "\n",
    "#     def forward(self, state):\n",
    "#         x = F.relu(self.fc1(state))\n",
    "# #         x = F.relu(self.fc1_(x))\n",
    "#         x = self.fc2(x)\n",
    "#         return x"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "84b0ee0a",
   "metadata": {},
   "outputs": [],
   "source": [
    "def copy_rules(origin_rules):\n",
    "    \"\"\"Return a new AdditiveRuleEnsemble whose rules reuse the query and weight of every rule in ``origin_rules``.\"\"\"\n",
    "    duplicates = [Rule(q=origin_rules[idx].q, y=origin_rules[idx].y)\n",
    "                  for idx in range(len(origin_rules))]\n",
    "    return AdditiveRuleEnsemble(duplicates)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "bb3fcc8c",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ActorRule():\n",
    "    \"\"\"Rule-based actor: one boosted rule ensemble per action, plus a second ('best') set of ensembles.\"\"\"\n",
    "\n",
    "    def __init__(self, action_space=4, num_rules=number_rules):\n",
    "        \"\"\"\n",
    "        :param action_space: number of actions, i.e. number of ensembles in each set\n",
    "        :param num_rules: rule budget of every ensemble\n",
    "        \"\"\"\n",
    "        self.action_space = action_space\n",
    "        # Working ensembles, regularised with the notebook-wide strength.\n",
    "        self.model = []\n",
    "        for _ in range(action_space):\n",
    "            self.model.append(\n",
    "                GeneralRuleBoostingEstimator(num_rules=num_rules, objective_function=OrthogonalBoostingObjective,\n",
    "                                             weight_update_method=FullyCorrectiveA2C(), loss=PiLoss(),\n",
    "                                             reg=regular, search='greedy', max_col_attr=20, verbose=False))\n",
    "        # Second set of ensembles, created with reg=0.01.\n",
    "        self.best_model = []\n",
    "        for _ in range(action_space):\n",
    "            self.best_model.append(\n",
    "                GeneralRuleBoostingEstimator(num_rules=num_rules, objective_function=OrthogonalBoostingObjective,\n",
    "                                             weight_update_method=FullyCorrectiveA2C(), loss=PiLoss(),\n",
    "                                             reg=0.01, search='greedy', max_col_attr=20, verbose=False))\n",
    "\n",
    "    def __call__(self, state):\n",
    "        \"\"\"Return an array with the scores of every working ensemble for ``state`` (one row per action).\"\"\"\n",
    "        scores = []\n",
    "        for idx in range(len(self.model)):\n",
    "            scores.append(self.model[idx].rules_(state))\n",
    "        return np.array(scores)\n",
    "\n",
    "    def predict(self, state):\n",
    "        \"\"\"Return an array with the scores of every 'best' ensemble for ``state`` (one row per action).\"\"\"\n",
    "        scores = []\n",
    "        for idx in range(len(self.model)):\n",
    "            scores.append(self.best_model[idx].rules_(state))\n",
    "        return np.array(scores)\n",
    "\n",
    "\n",
    "def update_rules(estimator: GeneralRuleBoostingEstimator, x, y, adv, other_values, current):\n",
    "    \"\"\"Replace the weakest rule of an estimator and keep the result only if the risk does not grow.\n",
    "\n",
    "    Steps: snapshot the current ensemble and its risk; merge rules with the same query string by\n",
    "    summing their weights; drop the query with the smallest absolute merged weight; re-fit the\n",
    "    weights; let ``estimator.fit`` extend the reduced ensemble; re-fit the weights again; restore\n",
    "    the snapshot when the new risk exceeds the original one.\n",
    "\n",
    "    :param estimator: estimator whose ``rules_`` are updated in place\n",
    "    :param x: data handed to the rules, the weight update and ``fit``\n",
    "    :param y: actions handed to the loss, the weight update and ``fit``\n",
    "    :param adv: advantage values forwarded to the loss\n",
    "    :param other_values: scores of the other models, forwarded to the loss\n",
    "    :param current: index of the action scored by this estimator\n",
    "    :return: the same estimator object\n",
    "    \"\"\"\n",
    "    queries_lst = []\n",
    "    queries = {}\n",
    "    # Snapshot used both as the risk baseline and for a possible rollback.\n",
    "    original_rules = copy_rules(estimator.rules_)\n",
    "    origin_risk = calc_risk(PiLoss(), y, original_rules, x, estimator.reg, adv, other_values, current)\n",
    "    # Merge rules that share a query string by summing their weights.\n",
    "    for i in range(len(estimator.rules_)):\n",
    "        q_str = str(estimator.rules_[i].q)\n",
    "        if q_str not in queries:\n",
    "            queries[q_str] = estimator.rules_[i].y\n",
    "            queries_lst.append(estimator.rules_[i].q)\n",
    "        else:\n",
    "            queries[q_str] += estimator.rules_[i].y\n",
    "    for k in queries:\n",
    "        queries[k] = abs(queries[k])\n",
    "    # The query with the smallest absolute merged weight is the one to drop.\n",
    "    min_weight_query = min(queries, key=queries.get)\n",
    "    rules = []\n",
    "    for i in range(len(queries_lst)):\n",
    "        q_str = str(queries_lst[i])\n",
    "        if q_str != min_weight_query:\n",
    "            rules.append(Rule(q=queries_lst[i], y=queries[str(queries_lst[i])]))\n",
    "    # With a single distinct query nothing would remain, so that query is kept.\n",
    "    if len(rules) == 0:\n",
    "        rules = [Rule(q=queries_lst[0], y=queries[str(queries_lst[0])])]\n",
    "    new_rules = AdditiveRuleEnsemble(rules)\n",
    "    weights = FullyCorrectiveA2C(loss_function('pi_loss'), estimator.reg).calc_weight(x, y, new_rules, adv,\n",
    "                                                                                      other_values, current)\n",
    "    for i in range(len(new_rules)):\n",
    "        new_rules[i].y = weights[i]\n",
    "    estimator.rules_ = new_rules\n",
    "    # has_origin_rules=True makes fit keep the reduced ensemble and extend it.\n",
    "    estimator.fit(x, y, adv, other_values, current, has_origin_rules=True)\n",
    "    weights = FullyCorrectiveA2C(loss_function('pi_loss'), estimator.reg).calc_weight(x, y, estimator.rules_, adv,\n",
    "                                                                                      other_values, current)\n",
    "    for i in range(len(estimator.rules_)):\n",
    "        estimator.rules_[i].y = weights[i]\n",
    "    new_risk = calc_risk(PiLoss(), y, estimator.rules_, x, estimator.reg, adv, other_values, current)\n",
    "    # Roll back to the snapshot when the update made the risk worse.\n",
    "    if new_risk > origin_risk:\n",
    "        estimator.rules_ = copy_rules(original_rules)\n",
    "        print(\"origin\", origin_risk, 'new', new_risk, 'not updated')\n",
    "        # risk = sum(PiLoss.__call__(y, estimator.rules_[i].y))\n",
    "    return estimator"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "2824981f",
   "metadata": {},
   "outputs": [],
   "source": [
    "class Critic(nn.Module):\n",
    "    \"\"\"State-value network: one hidden ReLU layer followed by a single scalar output.\n",
    "\n",
    "    :param node: width of the hidden layer.\n",
    "    :param state_dim: number of input features per state (default 5, the size that used to be hard-coded).\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, node=16, state_dim=5):\n",
    "        super().__init__()\n",
    "        self.fc1 = nn.Linear(state_dim, node)\n",
    "        self.fc2 = nn.Linear(node, 1)\n",
    "\n",
    "    def forward(self, state):\n",
    "        \"\"\"Map a float tensor whose last dimension is state_dim to value estimates with last dimension 1.\"\"\"\n",
    "        hidden = F.relu(self.fc1(state))\n",
    "        return self.fc2(hidden)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "6b6e2dd7",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Discount factor applied to future rewards when computing returns.\n",
    "gamma = 0.99\n",
    "# Policy object whose per-action rule ensembles are fitted inside train().\n",
    "actor = ActorRule()\n",
    "# Value network and the optimizer that updates it inside train().\n",
    "critic = Critic().to(device)\n",
    "critic_optimizer = optim.AdamW(critic.parameters(), lr=0.001)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "24c116b8",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ActorNet(nn.Module):\n",
    "    \"\"\"Policy network that turns a state vector into unnormalised action logits.\n",
    "\n",
    "    :param hidden_dim: width of the hidden layer.\n",
    "    :param state_dim: number of input features per state (default 5, previously hard-coded).\n",
    "    :param n_actions: number of logits produced (default 4, previously hard-coded).\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, hidden_dim=16, state_dim=5, n_actions=4):\n",
    "        super().__init__()\n",
    "\n",
    "        self.hidden = nn.Linear(state_dim, hidden_dim)\n",
    "        self.output = nn.Linear(hidden_dim, n_actions)\n",
    "\n",
    "    def forward(self, s):\n",
    "        \"\"\"Return logits (no softmax applied) for a float tensor whose last dimension is state_dim.\"\"\"\n",
    "        hidden = F.relu(self.hidden(s))\n",
    "        return self.output(hidden)\n",
    "\n",
    "\n",
    "# Neural-network actor used by the policy-gradient loop in the following cell.\n",
    "actor_func = ActorNet().to(device)\n",
    "# Alias, not a copy: value_func and critic are the same module, so training one trains the other.\n",
    "value_func = critic"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "c565d5ef",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/fyan/.local/lib/python3.10/site-packages/gymnasium/utils/passive_env_checker.py:142: UserWarning: \u001b[33mWARN: The obs returned by the `reset()` method was expecting a tuple, actual type: <class 'numpy.ndarray'>\u001b[0m\n",
      "  logger.warn(f\"{pre} was expecting a tuple, actual type: {type(obs)}\")\n",
      "/home/fyan/.local/lib/python3.10/site-packages/gymnasium/utils/passive_env_checker.py:158: UserWarning: \u001b[33mWARN: The obs returned by the `reset()` method is not within the observation space.\u001b[0m\n",
      "  logger.warn(f\"{pre} is not within the observation space.\")\n",
      "/home/fyan/.local/lib/python3.10/site-packages/gymnasium/utils/passive_env_checker.py:142: UserWarning: \u001b[33mWARN: The obs returned by the `step()` method was expecting a tuple, actual type: <class 'numpy.ndarray'>\u001b[0m\n",
      "  logger.warn(f\"{pre} was expecting a tuple, actual type: {type(obs)}\")\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 0 with rewards -72\n",
      "Run episode 1 with rewards -159\n",
      "Run episode 2 with rewards 4\n",
      "Run episode 3 with rewards 22\n",
      "Run episode 4 with rewards -22\n",
      "Run episode 5 with rewards -45\n",
      "Run episode 6 with rewards -57\n",
      "Run episode 7 with rewards -31\n",
      "Run episode 8 with rewards -41\n",
      "Run episode 9 with rewards -55\n",
      "Run episode 10 with rewards -108\n",
      "Run episode 11 with rewards -46\n",
      "Run episode 12 with rewards -141\n",
      "Run episode 13 with rewards -103\n",
      "Run episode 14 with rewards -49\n",
      "Run episode 15 with rewards -32\n",
      "Run episode 16 with rewards 4\n",
      "Run episode 17 with rewards 9\n",
      "Run episode 18 with rewards -5\n",
      "Run episode 19 with rewards -34\n",
      "Run episode 20 with rewards 30\n",
      "Run episode 21 with rewards 23\n",
      "Run episode 22 with rewards -18\n",
      "Run episode 23 with rewards 28\n",
      "Run episode 24 with rewards -22\n",
      "Run episode 25 with rewards 19\n",
      "Run episode 26 with rewards -42\n",
      "Run episode 27 with rewards 23\n",
      "Run episode 28 with rewards 3\n",
      "Run episode 29 with rewards -87\n",
      "Run episode 30 with rewards -54\n",
      "Run episode 31 with rewards -180\n",
      "Run episode 32 with rewards -19\n",
      "Run episode 33 with rewards 25\n",
      "Run episode 34 with rewards -19\n",
      "Run episode 35 with rewards -53\n",
      "Run episode 36 with rewards -112\n",
      "Run episode 37 with rewards -68\n",
      "Run episode 38 with rewards -57\n",
      "Run episode 39 with rewards -37\n",
      "Run episode 40 with rewards 12\n",
      "Run episode 41 with rewards -36\n",
      "Run episode 42 with rewards -104\n",
      "Run episode 43 with rewards 9\n",
      "Run episode 44 with rewards -122\n",
      "Run episode 45 with rewards -31\n",
      "Run episode 46 with rewards -127\n",
      "Run episode 47 with rewards 26\n",
      "Run episode 48 with rewards 23\n",
      "Run episode 49 with rewards -130\n",
      "Run episode 50 with rewards 9\n",
      "Run episode 51 with rewards -4\n",
      "Run episode 52 with rewards 34\n",
      "Run episode 53 with rewards -37\n",
      "Run episode 54 with rewards -38\n",
      "Run episode 55 with rewards -27\n",
      "Run episode 56 with rewards -49\n",
      "Run episode 57 with rewards -21\n",
      "Run episode 58 with rewards 6\n",
      "Run episode 59 with rewards -16\n",
      "Run episode 60 with rewards 17\n",
      "Run episode 61 with rewards 31\n",
      "Run episode 62 with rewards 33\n",
      "Run episode 63 with rewards -47\n",
      "Run episode 64 with rewards -38\n",
      "Run episode 65 with rewards -8\n",
      "Run episode 66 with rewards 21\n",
      "Run episode 67 with rewards -7\n",
      "Run episode 68 with rewards 20\n",
      "Run episode 69 with rewards -22\n",
      "Run episode 70 with rewards 21\n",
      "Run episode 71 with rewards -28\n",
      "Run episode 72 with rewards -70\n",
      "Run episode 73 with rewards -28\n",
      "Run episode 74 with rewards 18\n",
      "Run episode 75 with rewards -66\n",
      "Run episode 76 with rewards 32\n",
      "Run episode 77 with rewards -57\n",
      "Run episode 78 with rewards -33\n",
      "Run episode 79 with rewards 21\n",
      "Run episode 80 with rewards -39\n",
      "Run episode 81 with rewards -42\n",
      "Run episode 82 with rewards 9\n",
      "Run episode 83 with rewards -37\n",
      "Run episode 84 with rewards -20\n",
      "Run episode 85 with rewards -56\n",
      "Run episode 86 with rewards 33\n",
      "Run episode 87 with rewards 12\n",
      "Run episode 88 with rewards 11\n",
      "Run episode 89 with rewards -115\n",
      "Run episode 90 with rewards 26\n",
      "Run episode 91 with rewards -10\n",
      "Run episode 92 with rewards 11\n",
      "Run episode 93 with rewards -25\n",
      "Run episode 94 with rewards -44\n",
      "Run episode 95 with rewards -18\n",
      "Run episode 96 with rewards -26\n",
      "Run episode 97 with rewards -12\n",
      "Run episode 98 with rewards -38\n",
      "Run episode 99 with rewards -10\n",
      "Run episode 100 with rewards 26\n",
      "Run episode 101 with rewards 36\n"
     ]
    }
   ],
   "source": [
    "# opt1 updates the value network (value_func); opt2 updates the neural actor (actor_func).\n",
    "opt1 = torch.optim.AdamW(value_func.parameters(), lr=0.001)\n",
    "opt2 = torch.optim.AdamW(actor_func.parameters(), lr=0.001)\n",
    "def pick_sample(s):\n",
    "    \"\"\"Sample one action index from the neural actor's softmax policy for a single state ``s``.\"\"\"\n",
    "    with torch.no_grad():\n",
    "        # Add a leading batch axis so the network receives a batch holding this one state.\n",
    "        batch = torch.tensor(np.expand_dims(s, axis=0), dtype=torch.float).to(device)\n",
    "        # Remove the batch axis again, leaving one logit per action.\n",
    "        logits = actor_func(batch).squeeze(dim=0)\n",
    "        probs = F.softmax(logits, dim=-1)\n",
    "        # Draw a single action index according to those probabilities.\n",
    "        return torch.multinomial(probs, num_samples=1).tolist()[0]\n",
    "reward_records = []\n",
    "for i in range(200):\n",
    "    # Roll out one episode (at most 201 steps) with the current stochastic policy.\n",
    "    done = False\n",
    "    states = []\n",
    "    actions = []\n",
    "    rewards = []\n",
    "    s, _ = env.reset(seed=np.random.randint(0, 1e6))\n",
    "    num_steps = 0\n",
    "    while not done and num_steps <= 200:\n",
    "        states.append(s.tolist())\n",
    "        a = pick_sample(s)\n",
    "        s, r, term, trunc, _ = env.step(a)\n",
    "        done = term or trunc\n",
    "        actions.append(a)\n",
    "        rewards.append(r)\n",
    "        num_steps += 1\n",
    "\n",
    "    # Discounted reward-to-go for every step. The buffer is explicitly float: np.zeros_like(rewards)\n",
    "    # would take the dtype of the reward list, so integer rewards would truncate each discounted value.\n",
    "    reward_len = len(rewards)\n",
    "    cum_rewards = np.zeros(reward_len, dtype=np.float64)\n",
    "    for j in reversed(range(reward_len)):\n",
    "        cum_rewards[j] = rewards[j] + (cum_rewards[j+1]*gamma if j+1 < reward_len else 0)\n",
    "\n",
    "    # Critic update: regress the value estimates onto the discounted returns.\n",
    "    opt1.zero_grad()\n",
    "    states = torch.tensor(states, dtype=torch.float).to(device)\n",
    "    cum_rewards = torch.tensor(cum_rewards, dtype=torch.float).to(device)\n",
    "    values = value_func(states)\n",
    "    values = values.squeeze(dim=1)\n",
    "    vf_loss = F.mse_loss(\n",
    "        values,\n",
    "        cum_rewards,\n",
    "        reduction=\"none\")\n",
    "    vf_loss.sum().backward()\n",
    "    opt1.step()\n",
    "\n",
    "    # Actor update: policy-gradient step weighted by the advantage (return minus critic value).\n",
    "    # The values are recomputed without gradients so the actor loss does not reach the critic.\n",
    "    with torch.no_grad():\n",
    "        values = value_func(states).squeeze(dim=1)\n",
    "    opt2.zero_grad()\n",
    "    actions = torch.tensor(actions, dtype=torch.int64).to(device)\n",
    "    advantages = cum_rewards - values\n",
    "    logits = actor_func(states)\n",
    "    log_probs = -F.cross_entropy(logits, actions, reduction=\"none\")\n",
    "    pi_loss = -log_probs * advantages\n",
    "    pi_loss.sum().backward()\n",
    "    opt2.step()\n",
    "\n",
    "    # Report the undiscounted episode reward and stop early on a good episode after warm-up.\n",
    "    episode_reward = sum(rewards)\n",
    "    print(\"Run episode {} with rewards {}\".format(i, episode_reward))\n",
    "    reward_records.append(episode_reward)\n",
    "    if episode_reward > 35 and i > 80:\n",
    "        break"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "f28c7004",
   "metadata": {},
   "outputs": [],
   "source": [
    "def manhattan_distance(location1, location2):\n",
    "    \"\"\"\n",
    "    :param location1: Indexable pair (x, y) giving the first grid location.\n",
    "    :param location2: Indexable pair (x, y) giving the second grid location.\n",
    "    :return: Sum of the absolute coordinate differences between the two locations.\n",
    "    :functionality: Computes the Manhattan (L1) distance between two points of a 2D grid.\n",
    "    \"\"\"\n",
    "    horizontal_gap = abs(location1[0] - location2[0])\n",
    "    vertical_gap = abs(location1[1] - location2[1])\n",
    "    return horizontal_gap + vertical_gap"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "id": "a3a7c7ce",
   "metadata": {},
   "outputs": [],
   "source": [
    "def accuracy_test(env, agent, test_num=10):\n",
    "    \"\"\"\n",
    "    :param env: Environment whose reset() returns (state, info) and whose step(action) returns\n",
    "                (next_state, reward, done, trunc, info).\n",
    "    :param agent: Policy callable. It receives a one-row DataFrame of the current state (columns\n",
    "                  column_names) and returns one score per action; the highest-scoring action is taken.\n",
    "    :param test_num: Integer representing the number of test episodes to run.\n",
    "    :return: Float in [0, 1]: the share of test episodes whose counted steps stay within three times\n",
    "             the reference path length.\n",
    "    :functionality: Runs greedy episodes of at most 99 steps each and compares the number of counted\n",
    "                    steps with 3 * actual_length, where actual_length is derived from the initial state.\n",
    "    \"\"\"\n",
    "\n",
    "    accuracy = 0\n",
    "\n",
    "    for _ in range(test_num):\n",
    "        # Start a fresh episode with newly generated locations\n",
    "        state, _ = env.reset()\n",
    "\n",
    "        # Reference length: agent -> item, item -> goal, plus one extra step.\n",
    "        # NOTE(review): column_names labels state[2] and state[3] as offsets ('x3-x1', 'x4-x2'), yet they are\n",
    "        # used here as absolute coordinates, and the goal is hard-coded as (4, 4) - confirm against GridWorldEnv.\n",
    "        actual_length = manhattan_distance((state[0], state[1]), (state[2], state[3])) + manhattan_distance(\n",
    "            (state[2], state[3]), (4, 4)) + 1\n",
    "\n",
    "        num_steps = 0\n",
    "        for _step in range(99):  # Limit the number of time steps\n",
    "            # Score the actions with the policy that was passed in (not a notebook-level global)\n",
    "            action_probs = agent(pd.DataFrame(np.array([state]), columns=column_names))\n",
    "            # Select action based on the highest score\n",
    "            action = np.argmax(action_probs)\n",
    "            # Take the chosen action\n",
    "            next_state, reward, done, trunc, _ = env.step(action)\n",
    "            if done or trunc:\n",
    "                # The finishing step is deliberately not counted, matching the original bookkeeping\n",
    "                break\n",
    "            # Update state\n",
    "            state = next_state\n",
    "            num_steps += 1\n",
    "        # NOTE(review): an episode that ends through trunc is treated the same as one that ends\n",
    "        # through done - confirm that this is intended.\n",
    "        if num_steps <= 3*actual_length:\n",
    "            accuracy += 1\n",
    "\n",
    "    # Calculate and return the accuracy ratio\n",
    "    return accuracy / test_num\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "id": "73589768",
   "metadata": {},
   "outputs": [],
   "source": [
    "def softmax(logits):\n",
    "    \"\"\"Return the softmax over all entries of ``logits`` as a flat 1-D array.\n",
    "\n",
    "    The largest logit is subtracted before exponentiating. This leaves the result mathematically\n",
    "    unchanged but keeps np.exp from overflowing to inf (which would turn the output into nan).\n",
    "\n",
    "    :param logits: array-like of scores; every entry takes part in one joint normalisation.\n",
    "    :return: 1-D numpy array of probabilities summing to 1 (empty when ``logits`` is empty).\n",
    "    \"\"\"\n",
    "    logits = np.asarray(logits)\n",
    "    if logits.size == 0:\n",
    "        # np.max is undefined on empty input; keep returning an empty flat array in that case.\n",
    "        return np.exp(logits).reshape([-1])\n",
    "    exp_logits = np.exp(logits - np.max(logits))\n",
    "    sum_logits = np.sum(exp_logits)\n",
    "    return (exp_logits / sum_logits).reshape([-1])\n",
    "\n",
    "def pick_sample(s):\n",
    "    \"\"\"Sample one action index from the rule-based actor's softmax policy for a single state ``s``.\n",
    "\n",
    "    This definition replaces the neural-network pick_sample defined in an earlier cell.\n",
    "    \"\"\"\n",
    "    with torch.no_grad():\n",
    "        # The rule actor expects a DataFrame, so wrap the state as a single named row.\n",
    "        frame = pd.DataFrame(np.expand_dims(s, axis=0), columns=column_names)\n",
    "        probs = softmax(actor(frame))\n",
    "        sampled = torch.multinomial(torch.tensor(probs), num_samples=1)\n",
    "        return sampled.tolist()[0]\n",
    "\n",
    "\n",
    "def _discounted_returns(rewards, discount):\n",
    "    \"\"\"Return the discounted reward-to-go of each step of one episode as a float64 array.\"\"\"\n",
    "    # Explicit float dtype: np.zeros_like on a list of integer rewards yields an integer array,\n",
    "    # which silently truncates every discounted value written into it.\n",
    "    returns = np.zeros(len(rewards), dtype=np.float64)\n",
    "    running = 0.0\n",
    "    for j in reversed(range(len(rewards))):\n",
    "        running = rewards[j] + discount * running\n",
    "        returns[j] = running\n",
    "    return returns\n",
    "\n",
    "\n",
    "def train():\n",
    "    \"\"\"Train the rule-based actor and the critic network on batches of sampled rollouts.\n",
    "\n",
    "    Each of up to 150 iterations collects 10 rollouts (each capped at 201 steps) with the current\n",
    "    stochastic policy, evaluates the greedy policy with accuracy_test, copies the rule ensembles into\n",
    "    actor.best_model when the accuracy is at least the best seen so far, takes one critic gradient step\n",
    "    on the discounted returns, and finally fits or updates every per-action rule ensemble on the advantages.\n",
    "    Training stops early once the five most recent accuracies average at least 0.99.\n",
    "\n",
    "    Relies on the notebook globals env, actor, critic, critic_optimizer, gamma, device and column_names,\n",
    "    and closes env before returning.\n",
    "\n",
    "    :return: list with, for each completed iteration, the undiscounted reward sum of its last rollout.\n",
    "    \"\"\"\n",
    "    reward_records = []\n",
    "    accuracies = []\n",
    "    best_accuracy = 0\n",
    "    for i in range(150):\n",
    "        # Transitions of all 10 rollouts of this iteration are pooled into one batch.\n",
    "        states = []\n",
    "        actions = []\n",
    "        rewards = []\n",
    "        cum_rwds = np.array([])\n",
    "        for _ in range(10):\n",
    "            s, _ = env.reset(seed=np.random.randint(0, 1e6))\n",
    "            print('init state', s)\n",
    "            num_steps = 0\n",
    "            done = False\n",
    "            rewards = []\n",
    "            while not done and num_steps <= 200:\n",
    "                states.append(s.tolist())\n",
    "                a = pick_sample(s)\n",
    "                s, r, term, trunc, _ = env.step(a)\n",
    "                done = term or trunc\n",
    "                actions.append(a)\n",
    "                rewards.append(r)\n",
    "                num_steps += 1\n",
    "            cum_rewards = _discounted_returns(rewards, gamma)\n",
    "            cum_rwds = np.hstack([cum_rwds, cum_rewards])\n",
    "            print(cum_rwds.shape, cum_rewards.shape)\n",
    "\n",
    "        print('============', i, '===========')\n",
    "        avg_accuracy = accuracy_test(env, actor)\n",
    "        accuracies.append(avg_accuracy)\n",
    "        # Note: the reward reported here is that of the last of the 10 rollouts only.\n",
    "        print(\"Run episode {} with rewards {}, accuracy {}\".format(i, sum(rewards), avg_accuracy))\n",
    "        if avg_accuracy >= best_accuracy:\n",
    "            best_accuracy = avg_accuracy\n",
    "            # Snapshot the current rules into best_model as fresh Rule objects.\n",
    "            for rr in range(actor.action_space):\n",
    "                rules = []\n",
    "                for n in range(len(actor.model[rr].rules_)):\n",
    "                    rule = actor.model[rr].rules_[n]\n",
    "                    rules.append(Rule(q=rule.q, y=rule.y))\n",
    "                actor.best_model[rr].rules_ = AdditiveRuleEnsemble(rules)\n",
    "            print('best')\n",
    "        # Early stop on the five most recent evaluations. The slice must be [-5:]; [:-5] selects\n",
    "        # everything except the last five and is empty (mean = nan plus a warning) early on.\n",
    "        if len(accuracies) >= 5 and np.average(accuracies[-5:]) >= 0.99:\n",
    "            break\n",
    "\n",
    "        # Critic update: regress the value estimates onto the pooled discounted returns.\n",
    "        critic_optimizer.zero_grad()\n",
    "        states = torch.tensor(states, dtype=torch.float).to(device)\n",
    "        cum_rewards = torch.tensor(cum_rwds, dtype=torch.float).to(device)\n",
    "        values = critic(states)\n",
    "        values = values.squeeze(dim=1)\n",
    "        vf_loss = F.mse_loss(\n",
    "            values,\n",
    "            cum_rewards,\n",
    "            reduction=\"none\")\n",
    "        vf_loss.sum().backward()\n",
    "        critic_optimizer.step()\n",
    "\n",
    "        # Rule-based actor update, driven by advantages from the freshly updated critic.\n",
    "        with torch.no_grad():\n",
    "            values = critic(states).squeeze(dim=1)\n",
    "        actions = torch.tensor(actions, dtype=torch.int64).to(device)\n",
    "        advantages = cum_rewards - values\n",
    "        states_array = states.cpu().detach().numpy()\n",
    "        x = pd.DataFrame(states_array, columns=column_names)\n",
    "        y = pd.Series(actions.cpu().detach().numpy())\n",
    "        adv = pd.Series(advantages.cpu().detach().numpy())\n",
    "        outputs = actor(x).T\n",
    "        for j in range(len(actor.model)):\n",
    "            m = actor.model[j]\n",
    "            # other_values holds the outputs of every action except j, one row per sample.\n",
    "            masks = np.ones_like(outputs, dtype=bool)\n",
    "            masks[:, j] = False\n",
    "            other_values = outputs[masks].reshape(-1, outputs.shape[1] - 1)\n",
    "\n",
    "            if len(m.rules_) == 0:\n",
    "                m.fit(x, y, adv, other_values, j)\n",
    "            else:\n",
    "                update_rules(m, x, y, adv, other_values, j)\n",
    "            print('-----------------',j,'--------------')\n",
    "            print(m.rules_)\n",
    "\n",
    "        reward_records.append(sum(rewards))\n",
    "    print(\"\\nDone\")\n",
    "    env.close()\n",
    "    return reward_records"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "id": "b411aa5d",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "init state [ 2  3 -2 -2  0]\n",
      "(201,) (201,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(338,) (137,)\n",
      "init state [ 2  2  0 -1  0]\n",
      "(378,) (40,)\n",
      "init state [ 0  3  3 -1  0]\n",
      "(458,) (80,)\n",
      "init state [ 2  1 -2  0  0]\n",
      "(506,) (48,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(603,) (97,)\n",
      "init state [ 3  0 -1  3  0]\n",
      "(682,) (79,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(735,) (53,)\n",
      "init state [ 3  1 -2  0  0]\n",
      "(758,) (23,)\n",
      "init state [ 1  3  1 -1  0]\n",
      "(764,) (6,)\n",
      "============ 0 ===========\n",
      "Run episode 0 with rewards 36, accuracy 0.0\n",
      "best\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/lib/function_base.py:518: RuntimeWarning: Mean of empty slice.\n",
      "  avg = a.mean(axis, **keepdims_kw)\n",
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/core/_methods.py:190: RuntimeWarning: invalid value encountered in double_scalars\n",
      "  ret = ret.dtype.type(ret / rcount)\n",
      "/tmp/ipykernel_377/4131041232.py:32: RuntimeWarning: invalid value encountered in sqrt\n",
      "  return abs(g_q.sum()) / np.sqrt(h_q.sum())\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 0 --------------\n",
      "   -0.5622 if c>=1.0 & x2>=3.0\n",
      "   -0.4231 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.6964 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4277 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.6320 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.3062 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   -0.1266 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.2692 if c<=0.0 & x2<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.3546 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.1597 if c>=1.0 & x2<=0.0 & x3-x1<=-3.0 & x4-x2<=0.0\n",
      "   +0.5329 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.2169 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=1.0\n",
      "   -0.2791 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.1175 if c>=1.0 & x1>=2.0 & x4-x2<=-3.0\n",
      "   +0.2351 if c>=1.0 & x1<=2.0 & x3-x1>=3.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.1784 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_377/4131041232.py:32: RuntimeWarning: invalid value encountered in sqrt\n",
      "  return abs(g_q.sum()) / np.sqrt(h_q.sum())\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   +0.9518 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.9500 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.3362 if c>=1.0 & x1>=2.0 & x2>=3.0 & x3-x1>=1.0\n",
      "   +0.9160 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.5193 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.3173 if x1>=1.0 & x2>=3.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   -0.7879 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2682 if c>=1.0 & x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.6211 if x1<=0.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.4240 if x1<=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1856 if c<=0.0 & x1<=1.0 & x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.8598 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.1716 if x1>=2.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.2516 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0679 if x1>=2.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1848 if x1<=0.0 & x2>=1.0 & x4-x2>=1.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_377/4131041232.py:32: RuntimeWarning: invalid value encountered in sqrt\n",
      "  return abs(g_q.sum()) / np.sqrt(h_q.sum())\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   -0.6699 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.5798 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.3474 if x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3424 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.3143 if c<=0.0 & x1>=3.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.7211 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.5286 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.4170 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.0850 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.8206 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.1187 if c<=0.0 & x1<=0.0 & x2<=1.0 & x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.2177 if c<=0.0 & x1<=0.0 & x2<=0.0 & x3-x1<=2.0\n",
      "   -0.4008 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.5704 if x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0736 if c>=1.0 & x4-x2>=3.0\n",
      "   -0.2223 if x2<=2.0 & x2>=2.0 & x3-x1>=3.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_377/4131041232.py:32: RuntimeWarning: invalid value encountered in sqrt\n",
      "  return abs(g_q.sum()) / np.sqrt(h_q.sum())\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.1631 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5975 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.5213 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   -0.7301 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.3684 if c<=0.0 & x1<=1.0 & x1<=2.0 & x2>=2.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.4066 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.2453 if c>=1.0 & x2<=0.0 & x3-x1<=-3.0 & x4-x2<=0.0\n",
      "   -0.2482 if c<=0.0 & x1>=3.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2003 if c>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.3835 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.3935 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.0231 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.1938 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.2337 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3158 if x3-x1>=3.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.0279 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "init state [ 0  2  3 -1  0]\n",
      "(26,) (26,)\n",
      "init state [ 3  1 -3  2  0]\n",
      "(41,) (15,)\n",
      "init state [ 2  0 -1  1  0]\n",
      "(60,) (19,)\n",
      "init state [ 3  0 -2  3  0]\n",
      "(77,) (17,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(91,) (14,)\n",
      "init state [ 0  2  3 -1  0]\n",
      "(137,) (46,)\n",
      "init state [0 2 0 1 0]\n",
      "(172,) (35,)\n",
      "init state [0 1 2 1 0]\n",
      "(189,) (17,)\n",
      "init state [ 2  3  1 -1  0]\n",
      "(202,) (13,)\n",
      "init state [2 2 0 1 0]\n",
      "(217,) (15,)\n",
      "============ 1 ===========\n",
      "Run episode 1 with rewards 27, accuracy 0.0\n",
      "best\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/lib/function_base.py:518: RuntimeWarning: Mean of empty slice.\n",
      "  avg = a.mean(axis, **keepdims_kw)\n",
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/core/_methods.py:190: RuntimeWarning: invalid value encountered in double_scalars\n",
      "  ret = ret.dtype.type(ret / rcount)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 0 --------------\n",
      "   -0.3332 if c>=1.0 & x2>=3.0\n",
      "   +0.0054 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.2827 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0436 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4717 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.0000 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   +0.1643 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   +0.0000 if c<=0.0 & x2<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.0000 if c>=1.0 & x2<=0.0 & x3-x1<=-3.0 & x4-x2<=0.0\n",
      "   +0.6719 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.4236 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=1.0\n",
      "   -0.2749 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.0248 if c>=1.0 & x1<=2.0 & x3-x1>=3.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.5616 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5563 if x1<=1.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.7713 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.3081 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.0705 if c>=1.0 & x1>=2.0 & x2>=3.0 & x3-x1>=1.0\n",
      "   +0.1985 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1861 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.1005 if x1>=1.0 & x2>=3.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   -0.7694 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2331 if c>=1.0 & x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2230 if x1<=0.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0000 if x1<=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.1350 if c<=0.0 & x1<=1.0 & x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.6212 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.2335 if x1>=2.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   +0.0696 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.1137 if x1<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.6211 if x1<=2.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.5558 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.2374 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.0596 if x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2179 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.3066 if c<=0.0 & x1>=3.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2011 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.5159 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2781 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.0784 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3920 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x2<=1.0 & x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x2<=0.0 & x3-x1<=2.0\n",
      "   -0.0129 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.3390 if x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0275 if x2<=2.0 & x2>=2.0 & x3-x1>=3.0\n",
      "   -0.3707 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3946 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1180 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0000 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   -0.3848 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x1<=2.0 & x2>=2.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0040 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.0000 if c>=1.0 & x2<=0.0 & x3-x1<=-3.0 & x4-x2<=0.0\n",
      "   -0.4694 if c<=0.0 & x1>=3.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1098 if c>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.4719 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.4848 if x1>=2.0 & x4-x2>=1.0\n",
      "   +0.0699 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.1699 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.2069 if x3-x1>=3.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.5955 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "init state [ 3  0 -2  2  0]\n",
      "(20,) (20,)\n",
      "init state [ 2  1 -2  0  0]\n",
      "(32,) (12,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(72,) (40,)\n",
      "init state [ 2  2 -2 -1  0]\n",
      "(104,) (32,)\n",
      "init state [ 2  2  0 -1  0]\n",
      "(140,) (36,)\n",
      "init state [0 2 0 1 0]\n",
      "(169,) (29,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(202,) (33,)\n",
      "init state [ 3  1  0 -1  0]\n",
      "(213,) (11,)\n",
      "init state [ 3  2 -1 -1  0]\n",
      "(251,) (38,)\n",
      "init state [1 2 1 1 0]\n",
      "(280,) (29,)\n",
      "============ 2 ===========\n",
      "Run episode 2 with rewards 13, accuracy 0.2\n",
      "best\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/lib/function_base.py:518: RuntimeWarning: Mean of empty slice.\n",
      "  avg = a.mean(axis, **keepdims_kw)\n",
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/core/_methods.py:190: RuntimeWarning: invalid value encountered in double_scalars\n",
      "  ret = ret.dtype.type(ret / rcount)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 0 --------------\n",
      "   -0.4209 if c>=1.0 & x2>=3.0\n",
      "   +0.0418 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.1792 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1443 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.5553 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.0831 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   -0.1150 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.0881 if c<=0.0 & x2<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.0405 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.3252 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.0519 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=1.0\n",
      "   -0.0066 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.0000 if c>=1.0 & x1<=2.0 & x3-x1>=3.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.0463 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0425 if x1<=1.0 & x4-x2>=2.0\n",
      "   +0.9742 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.2136 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.3416 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.0000 if c>=1.0 & x1>=2.0 & x2>=3.0 & x3-x1>=1.0\n",
      "   +0.3648 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.2038 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=1.0 & x2>=3.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   -0.2933 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0308 if c>=1.0 & x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2223 if x1<=0.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0899 if c<=0.0 & x1<=1.0 & x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.6991 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0169 if x1>=2.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   +0.1079 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.1290 if x1<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.1158 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.0211 if x4-x2<=-3.0\n",
      "----------------- 2 --------------\n",
      "   -0.5574 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.1407 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1524 if x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2130 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.3010 if c<=0.0 & x1>=3.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1540 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.5899 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2355 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.0228 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.8057 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x2<=0.0 & x3-x1<=2.0\n",
      "   -0.2925 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0563 if x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x2<=2.0 & x2>=2.0 & x3-x1>=3.0\n",
      "   +0.2760 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   +1.0037 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.2861 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1733 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.2227 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   -0.2910 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x1<=2.0 & x2>=2.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1272 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.0000 if c>=1.0 & x2<=0.0 & x3-x1<=-3.0 & x4-x2<=0.0\n",
      "   +0.0157 if c<=0.0 & x1>=3.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0926 if c>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.5073 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.2861 if x1>=2.0 & x4-x2>=1.0\n",
      "   +0.0069 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0947 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.0000 if x3-x1>=3.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.4024 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.3998 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "init state [ 3  1 -3  0  0]\n",
      "(13,) (13,)\n",
      "init state [2 1 0 2 0]\n",
      "(18,) (5,)\n",
      "init state [1 2 1 1 0]\n",
      "(21,) (3,)\n",
      "init state [0 0 2 3 0]\n",
      "(49,) (28,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(79,) (30,)\n",
      "init state [0 1 1 1 0]\n",
      "(102,) (23,)\n",
      "init state [1 0 2 1 0]\n",
      "(127,) (25,)\n",
      "init state [ 2  2  0 -1  0]\n",
      "(171,) (44,)\n",
      "init state [ 0  2  3 -1  0]\n",
      "(183,) (12,)\n",
      "init state [1 1 2 0 0]\n",
      "(212,) (29,)\n",
      "============ 3 ===========\n",
      "Run episode 3 with rewards 13, accuracy 0.5\n",
      "best\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/lib/function_base.py:518: RuntimeWarning: Mean of empty slice.\n",
      "  avg = a.mean(axis, **keepdims_kw)\n",
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/core/_methods.py:190: RuntimeWarning: invalid value encountered in double_scalars\n",
      "  ret = ret.dtype.type(ret / rcount)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 0 --------------\n",
      "   -0.0728 if c>=1.0 & x2>=3.0\n",
      "   +0.0945 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0124 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3091 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3700 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.2221 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   -0.1315 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.0816 if c<=0.0 & x2<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.2854 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.6486 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=1.0\n",
      "   -0.3119 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.2854 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0492 if x1<=1.0 & x4-x2>=2.0\n",
      "   +0.5434 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.6745 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.3766 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.4133 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.1034 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1684 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=1.0 & x2>=3.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   -0.8363 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.0531 if c>=1.0 & x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.3068 if x1<=0.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0633 if c<=0.0 & x1<=1.0 & x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +1.3970 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3690 if x1>=2.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.0501 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0708 if x1<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.0472 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.0000 if x4-x2<=-3.0\n",
      "   -0.5979 if x1>=2.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.6041 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.2738 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.0096 if x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1319 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.4031 if c<=0.0 & x1>=3.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2063 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.9984 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0549 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.1220 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.5945 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.2512 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0951 if x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1331 if x2<=2.0 & x2>=2.0 & x3-x1>=3.0\n",
      "   +0.3709 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.0492 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.3876 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.5760 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0579 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.1928 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   -0.1556 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x1<=2.0 & x2>=2.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1435 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.0346 if c<=0.0 & x1>=3.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1073 if c>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.0020 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.5645 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.0619 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.2032 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.1594 if x3-x1>=3.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.7040 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.4072 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "init state [ 0  1  0 -1  0]\n",
      "(24,) (24,)\n",
      "init state [ 1  0 -1  1  0]\n",
      "(38,) (14,)\n",
      "init state [3 0 0 2 0]\n",
      "(41,) (3,)\n",
      "init state [ 3  1 -3 -1  0]\n",
      "(90,) (49,)\n",
      "init state [ 0  2  3 -1  0]\n",
      "(100,) (10,)\n",
      "init state [0 0 1 0 0]\n",
      "(158,) (58,)\n",
      "init state [0 0 3 1 0]\n",
      "(177,) (19,)\n",
      "init state [0 0 1 2 0]\n",
      "(206,) (29,)\n",
      "init state [ 3  1 -1  1  0]\n",
      "(224,) (18,)\n",
      "init state [ 2  2 -2  0  0]\n",
      "(256,) (32,)\n",
      "============ 4 ===========\n",
      "Run episode 4 with rewards 10, accuracy 0.2\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/lib/function_base.py:518: RuntimeWarning: Mean of empty slice.\n",
      "  avg = a.mean(axis, **keepdims_kw)\n",
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/core/_methods.py:190: RuntimeWarning: invalid value encountered in double_scalars\n",
      "  ret = ret.dtype.type(ret / rcount)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 0 --------------\n",
      "   -0.4946 if c>=1.0 & x2>=3.0\n",
      "   -0.0625 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.1364 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0424 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4597 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.1438 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.1720 if c<=0.0 & x2<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.3225 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=1.0\n",
      "   -0.0952 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.6056 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "   +0.1773 if x1<=1.0 & x4-x2>=2.0\n",
      "   +0.0076 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4025 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.6670 if x4-x2<=-3.0\n",
      "----------------- 1 --------------\n",
      "   +0.6056 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.2661 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.2547 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1499 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.3598 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0100 if c>=1.0 & x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1632 if x1<=0.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +1.1760 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0240 if x1>=2.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.0997 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0409 if x1<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.2828 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.1065 if x4-x2<=-3.0\n",
      "   -0.0664 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0549 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   -0.3462 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.2405 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1901 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if c<=0.0 & x1>=3.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2352 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.6831 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.4317 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.1290 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.6545 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.0275 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.2334 if x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0396 if x2<=2.0 & x2>=2.0 & x3-x1>=3.0\n",
      "   +0.6792 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.0951 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.2535 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.4638 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.6505 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2201 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.1302 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   -0.1396 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.0918 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.4211 if c<=0.0 & x1>=3.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0506 if c>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.1901 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.6193 if x1>=2.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0037 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.0493 if x3-x1>=3.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.0912 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.3184 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.1230 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.6961 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "init state [ 0  3  3 -3  0]\n",
      "(31,) (31,)\n",
      "init state [0 2 0 1 0]\n",
      "(44,) (13,)\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(71,) (27,)\n",
      "init state [0 1 0 1 0]\n",
      "(107,) (36,)\n",
      "init state [ 0  2  2 -2  0]\n",
      "(149,) (42,)\n",
      "init state [ 3  0 -2  2  0]\n",
      "(165,) (16,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(219,) (54,)\n",
      "init state [ 2  0 -1  2  0]\n",
      "(229,) (10,)\n",
      "init state [1 1 1 1 0]\n",
      "(242,) (13,)\n",
      "init state [ 1  2  0 -2  0]\n",
      "(363,) (121,)\n",
      "============ 5 ===========\n",
      "Run episode 5 with rewards -79, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.3890 if c>=1.0 & x2>=3.0\n",
      "   -0.1932 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.0470 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0644 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3129 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.0604 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   -0.3976 if c<=0.0 & x2<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.4041 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.1596 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=1.0\n",
      "   -0.3052 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.3942 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0045 if x1<=1.0 & x4-x2>=2.0\n",
      "   +0.1946 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3621 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.4315 if x4-x2<=-3.0\n",
      "   +0.4228 if x1>=3.0 & x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.3242 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   -0.2404 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +1.0359 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.2141 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.4261 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.0000 if c>=1.0 & x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0597 if x1<=0.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.4231 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0686 if x1>=2.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.1048 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.1551 if x1<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.1040 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.0737 if x4-x2<=-3.0\n",
      "   -0.2661 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.1822 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "   +0.3803 if x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.6654 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.1068 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1897 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.2094 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.7761 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2716 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.0917 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.8363 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.6741 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.2362 if x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0131 if x2<=2.0 & x2>=2.0 & x3-x1>=3.0\n",
      "   +0.5648 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.0852 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.0830 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.0064 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.0852 if x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.6259 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2478 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.0428 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   +0.2310 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.2183 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.0694 if c<=0.0 & x1>=3.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0000 if c>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.4415 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.6259 if x1>=2.0 & x4-x2>=1.0\n",
      "   +0.0498 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.0360 if x3-x1>=3.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.3062 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1411 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.0862 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.1573 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.4099 if x3-x1<=-3.0 & x4-x2>=1.0\n",
      "init state [0 0 3 1 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(20,) (20,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(89,) (69,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(101,) (12,)\n",
      "init state [2 1 1 0 0]\n",
      "(108,) (7,)\n",
      "init state [ 2  0 -1  2  0]\n",
      "(122,) (14,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(140,) (18,)\n",
      "init state [ 3  1 -3  2  0]\n",
      "(182,) (42,)\n",
      "init state [ 2  3  1 -2  0]\n",
      "(235,) (53,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(262,) (27,)\n",
      "init state [1 0 2 0 0]\n",
      "(297,) (35,)\n",
      "============ 6 ===========\n",
      "Run episode 6 with rewards 7, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.4441 if c>=1.0 & x2>=3.0\n",
      "   +0.0000 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.0300 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1443 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2380 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.0000 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   -0.3759 if c<=0.0 & x2<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.8064 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.2909 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=1.0\n",
      "   -0.1463 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.3927 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "   +0.2440 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0197 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1631 if x4-x2<=-3.0\n",
      "   +0.4506 if x1>=3.0 & x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.3405 if x1<=1.0 & x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.6899 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.4257 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.7041 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1273 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.3686 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2278 if x1<=0.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.5135 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0362 if x1>=2.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   +0.0958 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.2403 if x1<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.1948 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.4941 if x4-x2<=-3.0\n",
      "   +0.2055 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1867 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "   +0.3628 if x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.5262 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.0207 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.4477 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.2477 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0078 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.8948 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1964 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1968 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.0580 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0737 if x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1636 if x2<=2.0 & x2>=2.0 & x3-x1>=3.0\n",
      "   +0.5984 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.0416 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.4059 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.1920 if x4-x2>=-2.0\n",
      "   -0.2727 if x1>=2.0 & x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.5001 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0000 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.0000 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   -0.2729 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.2477 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.0000 if c<=0.0 & x1>=3.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.3121 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.6754 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.0020 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.0393 if x3-x1>=3.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.2995 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1301 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.4996 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.3122 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0226 if x3-x1<=-3.0 & x4-x2>=1.0\n",
      "   +0.4513 if c<=0.0 & x1<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "init state [0 0 0 1 0]\n",
      "(19,) (19,)\n",
      "init state [ 2  3  0 -3  0]\n",
      "(39,) (20,)\n",
      "init state [ 3  1 -1  1  0]\n",
      "(48,) (9,)\n",
      "init state [ 1  3  1 -1  0]\n",
      "(62,) (14,)\n",
      "init state [1 0 2 2 0]\n",
      "(78,) (16,)\n",
      "init state [2 0 1 1 0]\n",
      "(108,) (30,)\n",
      "init state [1 0 1 1 0]\n",
      "(128,) (20,)\n",
      "init state [ 2  1 -1 -1  0]\n",
      "(141,) (13,)\n",
      "init state [0 0 1 3 0]\n",
      "(149,) (8,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(165,) (16,)\n",
      "============ 7 ===========\n",
      "Run episode 7 with rewards 26, accuracy 0.6\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.5424 if c>=1.0 & x2>=3.0\n",
      "   +0.0102 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.1347 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3016 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3668 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.1496 if c<=0.0 & x2<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.0740 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=1.0\n",
      "   -0.1554 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.1240 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "   +0.2035 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0822 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0301 if x4-x2<=-3.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.2500 if x1<=1.0 & x4-x2>=3.0\n",
      "   +0.6461 if c<=0.0 & x1>=1.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.6424 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.5351 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.8931 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1691 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0656 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2427 if x1<=0.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.6632 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.4325 if x1<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.3633 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.2220 if x4-x2<=-3.0\n",
      "   +0.3500 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0810 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "   +0.5178 if x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2224 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.8587 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.1729 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1278 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.4353 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.9329 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2514 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.3739 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.2107 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0098 if x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0666 if x2<=2.0 & x2>=2.0 & x3-x1>=3.0\n",
      "   +0.1559 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.0324 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.1497 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.5749 if x4-x2>=-2.0\n",
      "   -0.1739 if x1>=2.0 & x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3059 if x4-x2>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.3604 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0989 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0873 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.0631 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.0000 if c<=0.0 & x1>=3.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2720 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.3293 if x1>=2.0 & x4-x2>=1.0\n",
      "   +0.1429 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.0586 if x3-x1>=3.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.7404 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0426 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.2023 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   -0.1468 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.0000 if x3-x1<=-3.0 & x4-x2>=1.0\n",
      "   +0.3984 if c<=0.0 & x1<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.3804 if x2>=1.0 & x4-x2>=2.0\n",
      "init state [ 1  0 -1  0  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(36,) (36,)\n",
      "init state [2 1 0 1 0]\n",
      "(39,) (3,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(67,) (28,)\n",
      "init state [ 1  3  1 -1  0]\n",
      "(86,) (19,)\n",
      "init state [2 0 1 2 0]\n",
      "(96,) (10,)\n",
      "init state [ 1  1 -1  2  0]\n",
      "(137,) (41,)\n",
      "init state [ 1  3 -1 -2  0]\n",
      "(178,) (41,)\n",
      "init state [0 0 2 3 0]\n",
      "(190,) (12,)\n",
      "init state [1 1 2 1 0]\n",
      "(203,) (13,)\n",
      "init state [ 0  3  0 -2  0]\n",
      "(233,) (30,)\n",
      "============ 8 ===========\n",
      "Run episode 8 with rewards 12, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.3861 if c>=1.0 & x2>=3.0\n",
      "   -0.1176 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.1138 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2286 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1242 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.0000 if c<=0.0 & x2<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.2928 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.3259 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.0752 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "   +0.5523 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4094 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0193 if x4-x2<=-3.0\n",
      "   -0.1745 if x1>=3.0 & x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.5182 if x1<=1.0 & x4-x2>=3.0\n",
      "   +0.1807 if c<=0.0 & x1>=1.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.4973 if x3-x1>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.5343 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.0444 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.5649 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0746 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.6552 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0416 if x1<=0.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +1.0567 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.2943 if x1<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.0423 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.1289 if x4-x2<=-3.0\n",
      "   -0.2666 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.1576 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "   +0.3373 if x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4326 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -1.1973 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.4793 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.1652 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0897 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.4045 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.6120 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0573 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.3984 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.1583 if x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0658 if x2<=2.0 & x2>=2.0 & x3-x1>=3.0\n",
      "   +0.1773 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   +0.3281 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.1104 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.5762 if x4-x2>=-2.0\n",
      "   -0.1353 if x1>=2.0 & x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3373 if x4-x2>=3.0\n",
      "   +0.5278 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.3487 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0452 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.3714 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.7062 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.1293 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.2004 if x1>=2.0 & x4-x2>=1.0\n",
      "   +0.1235 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.0000 if x3-x1>=3.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.6891 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0113 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.4877 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.6418 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.1268 if x3-x1<=-3.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.3409 if x2>=1.0 & x4-x2>=2.0\n",
      "   +0.5837 if c<=0.0 & x1<=1.0 & x2<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(42,) (42,)\n",
      "init state [0 0 1 1 0]\n",
      "(61,) (19,)\n",
      "init state [ 2  3  0 -1  0]\n",
      "(69,) (8,)\n",
      "init state [ 3  1 -1 -1  0]\n",
      "(98,) (29,)\n",
      "init state [ 0  2  3 -1  0]\n",
      "(139,) (41,)\n",
      "init state [2 2 1 0 0]\n",
      "(145,) (6,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(158,) (13,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(170,) (12,)\n",
      "init state [ 1  1 -1  0  0]\n",
      "(216,) (46,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(269,) (53,)\n",
      "============ 9 ===========\n",
      "Run episode 9 with rewards -11, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.2224 if c>=1.0 & x2>=3.0\n",
      "   -0.2056 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0086 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0964 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2536 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.2405 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.2908 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.1149 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "   +0.2756 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1929 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.3244 if x4-x2<=-3.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1<=1.0 & x4-x2>=3.0\n",
      "   +0.2699 if c<=0.0 & x1>=1.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0623 if x3-x1>=3.0\n",
      "   -0.7853 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.4405 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.0565 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.5170 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.4953 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.5125 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.4367 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0362 if x1<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.0882 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.3590 if x4-x2<=-3.0\n",
      "   +0.0553 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.3535 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "   +0.0089 if x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3312 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.8587 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.4926 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.2848 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.0147 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.1142 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +1.2644 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.3964 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.7042 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.0834 if x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0414 if x2<=2.0 & x2>=2.0 & x3-x1>=3.0\n",
      "   +0.4847 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.1299 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.1179 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.6413 if x4-x2>=-2.0\n",
      "   +0.1485 if x1>=2.0 & x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +0.3459 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   +0.5500 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   -0.0931 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3462 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.0615 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.2593 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.0931 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0931 if x1>=2.0 & x4-x2>=1.0\n",
      "   +0.0114 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.0688 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1718 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.2548 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.6364 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0102 if x3-x1<=-3.0 & x4-x2>=1.0\n",
      "   +0.3434 if c<=0.0 & x1<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0000 if x2>=1.0 & x4-x2>=2.0\n",
      "   +0.3282 if c<=0.0 & x1<=1.0 & x2<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.5694 if x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "init state [ 1  0 -1  0  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(44,) (44,)\n",
      "init state [1 1 2 0 0]\n",
      "(75,) (31,)\n",
      "init state [0 1 2 0 0]\n",
      "(104,) (29,)\n",
      "init state [1 0 0 1 0]\n",
      "(109,) (5,)\n",
      "init state [1 2 2 0 0]\n",
      "(113,) (4,)\n",
      "init state [ 3  1 -3 -1  0]\n",
      "(187,) (74,)\n",
      "init state [0 1 1 0 0]\n",
      "(218,) (31,)\n",
      "init state [0 0 3 2 0]\n",
      "(227,) (9,)\n",
      "init state [ 0  3  0 -3  0]\n",
      "(267,) (40,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(296,) (29,)\n",
      "============ 10 ===========\n",
      "Run episode 10 with rewards 13, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.6114 if c>=1.0 & x2>=3.0\n",
      "   -0.0159 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.2889 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0742 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3679 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.2122 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.2705 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.2230 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1287 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3832 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1770 if x4-x2<=-3.0\n",
      "   +0.0000 if x1<=1.0 & x4-x2>=3.0\n",
      "   +0.0000 if c<=0.0 & x1>=1.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.0620 if x3-x1>=3.0\n",
      "   -0.3288 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -0.3044 if x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.4627 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.7249 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.7430 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1508 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.5678 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.3041 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0000 if x1<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.2113 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.0351 if x4-x2<=-3.0\n",
      "   +0.6552 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0000 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "   +0.3783 if x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3307 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3612 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.4387 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.5598 if x3-x1>=2.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.2791 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0304 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.1392 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +1.4496 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2486 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.2724 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.0197 if x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0157 if x2<=2.0 & x2>=2.0 & x3-x1>=3.0\n",
      "   +0.4527 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.2974 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.0727 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.6649 if x4-x2>=-2.0\n",
      "   +0.0000 if x1>=2.0 & x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   +0.3555 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.4523 if c<=0.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   -0.0475 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0410 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.3671 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.1760 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.0043 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.0305 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.2275 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.2389 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.3730 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.2758 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x3-x1<=-3.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0362 if c<=0.0 & x1<=1.0 & x2<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.2297 if x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.3766 if x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=2.0\n",
      "init state [ 3  2  0 -2  0]\n",
      "(71,) (71,)\n",
      "init state [ 3  2  0 -2  0]\n",
      "(81,) (10,)\n",
      "init state [ 3  0 -1  2  0]\n",
      "(101,) (20,)\n",
      "init state [1 0 2 0 0]\n",
      "(115,) (14,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(133,) (18,)\n",
      "init state [ 3  1 -2 -1  0]\n",
      "(166,) (33,)\n",
      "init state [ 3  0 -2  3  0]\n",
      "(188,) (22,)\n",
      "init state [ 3  1 -2  2  0]\n",
      "(205,) (17,)\n",
      "init state [ 1  2  0 -1  0]\n",
      "(240,) (35,)\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(298,) (58,)\n",
      "============ 11 ===========\n",
      "Run episode 11 with rewards -16, accuracy 0.1\n",
      "----------------- 0 --------------\n",
      "   -0.4778 if c>=1.0 & x2>=3.0\n",
      "   -0.0660 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0476 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1685 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.5214 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.6740 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.0395 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0503 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.6195 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.2079 if x4-x2<=-3.0\n",
      "   +0.2101 if c<=0.0 & x1>=1.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.1048 if x3-x1>=3.0\n",
      "   -0.1731 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -0.3671 if x4-x2>=2.0\n",
      "   +0.7734 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.0200 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.4236 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.5980 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1843 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.4394 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.1812 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0555 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.0864 if x4-x2<=-3.0\n",
      "   +0.4633 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0364 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "   +0.0756 if x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1894 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4483 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1423 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0000 if x3-x1>=2.0 & x4-x2>=2.0\n",
      "   +0.2320 if x3-x1>=3.0\n",
      "----------------- 2 --------------\n",
      "   -0.0862 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.1708 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0454 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +1.3165 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2970 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.5119 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.0082 if x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x2<=2.0 & x2>=2.0 & x3-x1>=3.0\n",
      "   +0.0255 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.0478 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.3865 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.2713 if x4-x2>=-2.0\n",
      "   +0.0652 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   +0.5950 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.3191 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.3959 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.1693 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0391 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.1245 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.4122 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.1766 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.1693 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.1005 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.2690 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.3247 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.1406 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.1987 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x2<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.2865 if x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.0437 if x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=2.0\n",
      "   -0.2649 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "init state [ 0  3  2 -3  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(41,) (41,)\n",
      "init state [0 0 2 2 0]\n",
      "(50,) (9,)\n",
      "init state [ 3  2 -3 -2  0]\n",
      "(94,) (44,)\n",
      "init state [0 0 2 3 0]\n",
      "(110,) (16,)\n",
      "init state [ 2  3 -2  0  0]\n",
      "(117,) (7,)\n",
      "init state [ 1  3  1 -1  0]\n",
      "(121,) (4,)\n",
      "init state [ 0  3  0 -2  0]\n",
      "(152,) (31,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(196,) (44,)\n",
      "init state [ 0  3  1 -1  0]\n",
      "(203,) (7,)\n",
      "init state [1 1 1 1 0]\n",
      "(217,) (14,)\n",
      "============ 12 ===========\n",
      "Run episode 12 with rewards 28, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.6829 if c>=1.0 & x2>=3.0\n",
      "   -0.1440 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.2456 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1099 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4294 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.2058 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.4123 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.0112 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4509 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2808 if x4-x2<=-3.0\n",
      "   -0.2290 if c<=0.0 & x1>=1.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   -0.1410 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -0.3386 if x4-x2>=2.0\n",
      "   +0.5338 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.7105 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.6184 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.5410 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.7496 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.1573 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1355 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.4758 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0709 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.1221 if x4-x2<=-3.0\n",
      "   +0.2685 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.1446 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "   -0.3635 if x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1232 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0982 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   -0.4000 if x3-x1>=2.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.4670 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0706 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.4107 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +1.4502 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0967 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.1557 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.2982 if x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.5081 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.0522 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.1706 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.4633 if x4-x2>=-2.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   +0.1903 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.5536 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.5887 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.2858 if x3-x1>=0.0 & x4-x2<=-3.0\n",
      "----------------- 3 --------------\n",
      "   +0.2400 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4350 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.3750 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.2012 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.3987 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.2400 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.1027 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.3864 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.5564 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.2407 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.1755 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1978 if c<=0.0 & x1<=1.0 & x2<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0443 if x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.0074 if x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=2.0\n",
      "   -0.1100 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.4395 if c<=0.0 & x2>=2.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "init state [ 3  2  0 -2  0]\n",
      "(24,) (24,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(88,) (64,)\n",
      "init state [1 2 0 1 0]\n",
      "(103,) (15,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(133,) (30,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(137,) (4,)\n",
      "init state [ 0  3  2 -2  0]\n",
      "(148,) (11,)\n",
      "init state [0 1 3 0 0]\n",
      "(154,) (6,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(170,) (16,)\n",
      "init state [ 1  2  1 -1  0]\n",
      "(180,) (10,)\n",
      "init state [0 0 1 2 0]\n",
      "(186,) (6,)\n",
      "============ 13 ===========\n",
      "Run episode 13 with rewards 36, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.6380 if c>=1.0 & x2>=3.0\n",
      "   +0.1400 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.2619 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1324 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4578 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.0230 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.2649 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.4593 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.9910 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0630 if x4-x2<=-3.0\n",
      "   +0.0000 if c<=0.0 & x1>=1.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.2667 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -0.2362 if x4-x2>=2.0\n",
      "   -0.1275 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4854 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.7032 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.6581 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.8789 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.5654 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.1786 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.1131 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.4812 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0898 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.2062 if x4-x2<=-3.0\n",
      "   +0.2426 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.2026 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "   +0.3716 if x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2582 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4821 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1083 if x3-x1>=3.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2>=2.0\n",
      "   -0.3539 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.2628 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.1170 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.2242 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +1.1198 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2587 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.3380 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.0000 if x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3674 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   +0.0047 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.0658 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.4772 if x4-x2>=-2.0\n",
      "   -0.0445 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.1716 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.0798 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +0.0508 if x3-x1>=0.0 & x4-x2<=-3.0\n",
      "   -0.4352 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3653 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1484 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.1690 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.4083 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.3653 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.3653 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.2170 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.0732 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.4458 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.1654 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.7592 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1684 if c<=0.0 & x1<=1.0 & x2<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0397 if x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.1406 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x2>=2.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0904 if x4-x2>=3.0\n",
      "init state [ 3  0 -2  0  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(32,) (32,)\n",
      "init state [1 0 1 2 0]\n",
      "(41,) (9,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(89,) (48,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(129,) (40,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(182,) (53,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(242,) (60,)\n",
      "init state [1 0 1 1 0]\n",
      "(259,) (17,)\n",
      "init state [ 1  3  2 -3  0]\n",
      "(280,) (21,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(300,) (20,)\n",
      "init state [0 2 3 0 0]\n",
      "(306,) (6,)\n",
      "============ 14 ===========\n",
      "Run episode 14 with rewards 36, accuracy 0.6\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.4644 if c>=1.0 & x2>=3.0\n",
      "   +0.0733 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.1006 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1249 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3616 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.3049 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.2013 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.4129 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4859 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2342 if x4-x2<=-3.0\n",
      "   -0.2596 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.0728 if x4-x2>=2.0\n",
      "   +0.2519 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.1060 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.5243 if c<=0.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-2.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.3710 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.8913 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.2114 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.2228 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.4319 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +1.1283 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0526 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.4341 if x4-x2<=-3.0\n",
      "   -0.1167 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.3500 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "   +0.1958 if x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2274 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.9070 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.2062 if x3-x1>=3.0\n",
      "   -0.2429 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.2974 if x3-x1>=2.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.3611 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.1828 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.1096 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +1.2377 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0521 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.6334 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.4995 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   +0.0139 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.1047 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.2906 if x4-x2>=-2.0\n",
      "   +0.2840 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.3003 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.0318 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.0471 if x3-x1>=0.0 & x4-x2<=-3.0\n",
      "   -0.3282 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.4168 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.2191 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0387 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.2645 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.2153 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.0226 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.2191 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.2434 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.5010 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.0340 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.4920 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0807 if c<=0.0 & x1<=1.0 & x2<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.1912 if x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.1908 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +0.8435 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "init state [1 2 0 1 0]\n",
      "(12,) (12,)\n",
      "init state [0 0 2 1 0]\n",
      "(46,) (34,)\n",
      "init state [ 3  1 -2  1  0]\n",
      "(65,) (19,)\n",
      "init state [0 2 1 1 0]\n",
      "(73,) (8,)\n",
      "init state [ 0  3  0 -3  0]\n",
      "(96,) (23,)\n",
      "init state [ 3  1 -3  2  0]\n",
      "(132,) (36,)\n",
      "init state [0 2 1 1 0]\n",
      "(150,) (18,)\n",
      "init state [0 0 1 2 0]\n",
      "(162,) (12,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(170,) (8,)\n",
      "init state [ 0  3  0 -3  0]\n",
      "(180,) (10,)\n",
      "============ 15 ===========\n",
      "Run episode 15 with rewards 32, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.4624 if c>=1.0 & x2>=3.0\n",
      "   -0.0163 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.2820 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.4819 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1515 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.4408 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.1115 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.6695 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1937 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.3290 if x4-x2<=-3.0\n",
      "   -0.0037 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.5945 if x4-x2>=2.0\n",
      "   +0.0578 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1926 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.3644 if c<=0.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-2.0 & x4-x2>=0.0\n",
      "   +0.0110 if x3-x1<=-3.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.0533 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.2015 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.5134 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.2222 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.2144 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.7571 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.2291 if x4-x2<=-3.0\n",
      "   -0.4847 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1174 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "   -0.0415 if x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4588 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4909 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   +0.0777 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2>=2.0\n",
      "   +0.3394 if c<=0.0 & x1>=2.0 & x3-x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.5602 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0223 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.1331 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +1.0054 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0977 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.5582 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.2494 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   +0.3015 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.3880 if x4-x2>=-2.0\n",
      "   +0.5289 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.5536 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.3736 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +0.1054 if x3-x1>=0.0 & x4-x2<=-3.0\n",
      "   -0.2481 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.0115 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.3394 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.3080 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0495 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.0400 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.0264 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.4504 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.3080 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.1168 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.2094 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1040 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.0933 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   -0.0781 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.0056 if c<=0.0 & x1<=1.0 & x2<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.1855 if x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.4061 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.3657 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.0137 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "init state [0 3 1 0 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(11,) (11,)\n",
      "init state [2 0 1 1 0]\n",
      "(30,) (19,)\n",
      "init state [0 0 2 1 0]\n",
      "(99,) (69,)\n",
      "init state [ 2  0 -1  2  0]\n",
      "(110,) (11,)\n",
      "init state [2 1 1 1 0]\n",
      "(138,) (28,)\n",
      "init state [ 2  3  0 -3  0]\n",
      "(150,) (12,)\n",
      "init state [ 2  1 -2  1  0]\n",
      "(162,) (12,)\n",
      "init state [ 2  3  0 -1  0]\n",
      "(174,) (12,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(187,) (13,)\n",
      "init state [0 0 1 1 0]\n",
      "(204,) (17,)\n",
      "============ 16 ===========\n",
      "Run episode 16 with rewards 25, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.3673 if c>=1.0 & x2>=3.0\n",
      "   -0.2577 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.3129 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.4244 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.5591 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.3666 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.1133 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.8725 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1927 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.3141 if x4-x2<=-3.0\n",
      "   -0.0900 if x4-x2>=2.0\n",
      "   -0.3677 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.7167 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0219 if c<=0.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-2.0 & x4-x2>=0.0\n",
      "   +0.0000 if x3-x1<=-3.0 & x4-x2>=2.0\n",
      "   -0.5523 if x1>=3.0 & x2>=3.0 & x3-x1<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.0901 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.2403 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.3419 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0678 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.5918 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.7928 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0491 if x4-x2<=-3.0\n",
      "   -0.2830 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0136 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "   +0.1650 if x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4506 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5352 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.3828 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2>=2.0\n",
      "   -0.0008 if c<=0.0 & x1>=2.0 & x3-x1>=1.0\n",
      "   +0.7299 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.1499 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0841 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.0324 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.7286 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0965 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.5545 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +1.0706 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   +0.1004 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.3376 if x4-x2>=-2.0\n",
      "   +0.5635 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.2282 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.3200 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +0.1241 if x3-x1>=0.0 & x4-x2<=-3.0\n",
      "   -0.0297 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   +0.0000 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   -0.6505 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.5448 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5721 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.2628 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0131 if x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.3746 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.1298 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.0236 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.3529 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.2824 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.2554 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.2010 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1765 if x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.7173 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.2884 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.0175 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.2154 if x3-x1<=-3.0\n",
      "init state [2 0 1 1 0]\n",
      "(9,) (9,)\n",
      "init state [0 1 1 2 0]\n",
      "(24,) (15,)\n",
      "init state [ 0  2  1 -2  0]\n",
      "(46,) (22,)\n",
      "init state [ 0  3  2 -2  0]\n",
      "(70,) (24,)\n",
      "init state [ 3  1 -2  2  0]\n",
      "(91,) (21,)\n",
      "init state [ 2  3 -2  0  0]\n",
      "(102,) (11,)\n",
      "init state [ 3  1 -2 -1  0]\n",
      "(142,) (40,)\n",
      "init state [ 2  0 -1  0  0]\n",
      "(148,) (6,)\n",
      "init state [2 1 0 2 0]\n",
      "(158,) (10,)\n",
      "init state [2 1 0 1 0]\n",
      "(163,) (5,)\n",
      "============ 17 ===========\n",
      "Run episode 17 with rewards 37, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.3890 if c>=1.0 & x2>=3.0\n",
      "   -0.2512 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.1423 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0651 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3757 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.0481 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.0152 if c<=0.0 & x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.6662 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0401 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2707 if x4-x2<=-3.0\n",
      "   -0.2484 if x4-x2>=2.0\n",
      "   -0.1695 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.8040 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.2123 if c<=0.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-2.0 & x4-x2>=0.0\n",
      "   -0.3184 if x1>=3.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.0642 if x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.0464 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   -0.1426 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.4335 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0678 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.5894 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.7996 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.5935 if x4-x2<=-3.0\n",
      "   -0.0649 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1921 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x3-x1<=2.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2944 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.7695 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.5511 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1734 if c<=0.0 & x1>=2.0 & x3-x1>=1.0\n",
      "   +0.5615 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.5313 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.3224 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.1367 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0191 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.6925 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2177 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.4111 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.5866 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   +0.0121 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.3536 if x4-x2>=-2.0\n",
      "   +0.2128 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.3655 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.3880 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.0872 if x3-x1>=0.0 & x4-x2<=-3.0\n",
      "   -0.0607 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.2478 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.5983 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.5810 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0567 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.1014 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.4334 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.4024 if x1>=2.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.8053 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.2773 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.0850 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   -0.3427 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1046 if x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.0667 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.0019 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.1557 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0000 if x3-x1<=-3.0\n",
      "   +0.5067 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "init state [1 0 2 2 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(9,) (9,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(30,) (21,)\n",
      "init state [ 1  3 -1 -3  0]\n",
      "(61,) (31,)\n",
      "init state [2 0 1 1 0]\n",
      "(69,) (8,)\n",
      "init state [ 2  1  0 -1  0]\n",
      "(108,) (39,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(185,) (77,)\n",
      "init state [0 0 2 2 0]\n",
      "(204,) (19,)\n",
      "init state [ 2  3  1 -2  0]\n",
      "(255,) (51,)\n",
      "init state [ 0  1  3 -1  0]\n",
      "(285,) (30,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(325,) (40,)\n",
      "============ 18 ===========\n",
      "Run episode 18 with rewards 2, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.4209 if c>=1.0 & x2>=3.0\n",
      "   -0.1227 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.1080 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0736 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.1698 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.1567 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1496 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1658 if x4-x2<=-3.0\n",
      "   -0.2565 if x4-x2>=2.0\n",
      "   -0.3698 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6256 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.3966 if c<=0.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-2.0 & x4-x2>=0.0\n",
      "   -0.4265 if x1>=3.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +0.4396 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.2964 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   -0.0713 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.6776 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.3990 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.5404 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.7688 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4424 if x4-x2<=-3.0\n",
      "   +0.4215 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.2159 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "   -0.2230 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2744 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.5274 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.5467 if c<=0.0 & x1>=2.0 & x3-x1>=1.0\n",
      "   +0.6696 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.2156 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.4600 if x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   -0.1948 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.1511 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.0760 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.5292 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2850 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.3720 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +1.5792 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.1810 if x4-x2>=-2.0\n",
      "   +0.0417 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.6164 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.2867 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +0.0374 if x3-x1>=0.0 & x4-x2<=-3.0\n",
      "   +0.2773 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.6020 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.5722 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.5774 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.2204 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2413 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0483 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.2050 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0148 if x1>=2.0 & x4-x2>=1.0\n",
      "   +0.4010 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0659 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.0602 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   -0.0190 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.2450 if x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.0868 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.1007 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.1626 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.2860 if x3-x1<=-3.0\n",
      "   +0.6807 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.6890 if x2>=3.0\n",
      "init state [ 3  1 -2 -1  0]\n",
      "(55,) (55,)\n",
      "init state [ 3  1 -3  2  0]\n",
      "(102,) (47,)\n",
      "init state [1 2 1 1 0]\n",
      "(113,) (11,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(135,) (22,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(141,) (6,)\n",
      "init state [1 1 2 1 0]\n",
      "(147,) (6,)\n",
      "init state [1 1 1 0 0]\n",
      "(185,) (38,)\n",
      "init state [2 2 1 0 0]\n",
      "(191,) (6,)\n",
      "init state [2 0 0 2 0]\n",
      "(200,) (9,)\n",
      "init state [1 0 1 0 0]\n",
      "(206,) (6,)\n",
      "============ 19 ===========\n",
      "Run episode 19 with rewards 36, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.4884 if c>=1.0 & x2>=3.0\n",
      "   -0.2222 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.1912 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0354 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3565 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.1848 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.5400 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2671 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1818 if x4-x2<=-3.0\n",
      "   +0.2057 if x4-x2>=2.0\n",
      "   +0.1902 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4573 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.3125 if c<=0.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-2.0 & x4-x2>=0.0\n",
      "   -0.0569 if x1>=3.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   +0.2382 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.3386 if x2<=2.0 & x3-x1<=-3.0\n",
      "----------------- 1 --------------\n",
      "   +0.2526 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.7982 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0927 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.3072 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.0478 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3413 if x4-x2<=-3.0\n",
      "   +0.5622 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0010 if x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-2.0\n",
      "   +0.1085 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4307 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.4250 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.2263 if c<=0.0 & x1>=2.0 & x3-x1>=1.0\n",
      "   +0.2852 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.7602 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1052 if x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.6281 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.2114 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0497 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0454 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.8957 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1616 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.3461 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.3540 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.4913 if x4-x2>=-2.0\n",
      "   +0.3114 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.5793 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.2197 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.0334 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.4654 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.6700 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0000 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0140 if c<=0.0 & x2<=2.0 & x3-x1>=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.2388 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4023 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.2822 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0059 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.1122 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x2>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.0170 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.4816 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.3035 if x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.4103 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.0229 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.2302 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.1669 if x3-x1<=-3.0\n",
      "   +0.7407 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.3013 if x2>=3.0\n",
      "   -0.1470 if x3-x1>=2.0\n",
      "init state [0 2 1 1 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(19,) (19,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(32,) (13,)\n",
      "init state [ 1  2  0 -2  0]\n",
      "(70,) (38,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(92,) (22,)\n",
      "init state [0 0 0 2 0]\n",
      "(161,) (69,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(175,) (14,)\n",
      "init state [2 1 1 1 0]\n",
      "(180,) (5,)\n",
      "init state [ 1  3  0 -3  0]\n",
      "(209,) (29,)\n",
      "init state [0 0 0 3 0]\n",
      "(239,) (30,)\n",
      "init state [ 1  3  0 -3  0]\n",
      "(258,) (19,)\n",
      "============ 20 ===========\n",
      "Run episode 20 with rewards 23, accuracy 0.1\n",
      "----------------- 0 --------------\n",
      "   -0.6046 if c>=1.0 & x2>=3.0\n",
      "   -0.0000 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.2172 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2745 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.2309 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.6941 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2279 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.4016 if x4-x2<=-3.0\n",
      "   +0.0155 if x4-x2>=2.0\n",
      "   +0.0829 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6485 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0491 if c<=0.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-2.0 & x4-x2>=0.0\n",
      "   -0.1648 if x1>=3.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.2474 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0003 if x2<=2.0 & x3-x1<=-3.0\n",
      "   -0.4600 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.0000 if x2>=1.0 & x3-x1>=1.0 & x3-x1>=2.0\n",
      "   +0.6796 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.1727 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.6294 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.1351 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3315 if x4-x2<=-3.0\n",
      "   +0.0898 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.3933 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.8722 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.0221 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.2429 if c<=0.0 & x1>=2.0 & x3-x1>=1.0\n",
      "   +0.6845 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.2919 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1680 if x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.3162 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.7759 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.1702 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.0598 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.3586 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2383 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.3924 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.1496 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.1394 if x4-x2>=-2.0\n",
      "   +0.4581 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.1569 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.2818 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.0335 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.7159 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.5507 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.3912 if c<=0.0 & x2<=2.0 & x3-x1>=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.6008 if c<=0.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.4812 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.3035 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.1021 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.4399 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.3727 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.5175 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.0905 if x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.0139 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.0263 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.5510 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0277 if x3-x1<=-3.0\n",
      "   +0.2025 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.4973 if x2>=3.0\n",
      "   +0.0000 if x3-x1>=2.0\n",
      "   +0.9236 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "init state [1 2 2 0 0]\n",
      "(5,) (5,)\n",
      "init state [ 1  3 -1 -3  0]\n",
      "(53,) (48,)\n",
      "init state [1 1 0 2 0]\n",
      "(57,) (4,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(84,) (27,)\n",
      "init state [0 2 0 1 0]\n",
      "(102,) (18,)\n",
      "init state [0 3 2 0 0]\n",
      "(106,) (4,)\n",
      "init state [ 1  3  0 -2  0]\n",
      "(136,) (30,)\n",
      "init state [1 2 2 0 0]\n",
      "(143,) (7,)\n",
      "init state [1 0 1 3 0]\n",
      "(157,) (14,)\n",
      "init state [ 1  1 -1  1  0]\n",
      "(176,) (19,)\n",
      "============ 21 ===========\n",
      "Run episode 21 with rewards 23, accuracy 0.1\n",
      "----------------- 0 --------------\n",
      "   -0.4589 if c>=1.0 & x2>=3.0\n",
      "   -0.0628 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2686 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.3828 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.4562 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3896 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0368 if x4-x2<=-3.0\n",
      "   +0.0405 if x4-x2>=2.0\n",
      "   +0.3659 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1684 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.1824 if c<=0.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-2.0 & x4-x2>=0.0\n",
      "   -0.1066 if x1>=3.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.0193 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.1808 if x2<=2.0 & x3-x1<=-3.0\n",
      "   -0.1311 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   -0.2764 if x3-x1>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.1961 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.2754 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.5124 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.4476 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0225 if x4-x2<=-3.0\n",
      "   -0.1732 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.1691 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.7860 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1653 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.4243 if c<=0.0 & x1>=2.0 & x3-x1>=1.0\n",
      "   -0.1125 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.8601 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0000 if x3-x1<=2.0 & x3-x1>=1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.0960 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.7268 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3336 if x3-x1>=3.0\n",
      "----------------- 2 --------------\n",
      "   -0.1259 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0481 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.3362 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1546 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.1560 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.0674 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.7594 if x4-x2>=-2.0\n",
      "   +0.0901 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.0507 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.1565 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.3043 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   +0.0014 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.1040 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0000 if c<=0.0 & x2<=2.0 & x3-x1>=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.0652 if c<=0.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.2280 if x3-x1>=2.0 & x4-x2>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.2214 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.3144 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.1047 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.3655 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0072 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.6046 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.1391 if x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.3478 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.1265 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0600 if x3-x1<=-3.0\n",
      "   +0.4675 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.7214 if x2>=3.0\n",
      "   +0.4698 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.4897 if x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "init state [ 3  0 -3  1  0]\n",
      "(18,) (18,)\n",
      "init state [1 0 2 1 0]\n",
      "(93,) (75,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(148,) (55,)\n",
      "init state [ 0  3  2 -2  0]\n",
      "(345,) (197,)\n",
      "init state [ 2  3  0 -3  0]\n",
      "(439,) (94,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(489,) (50,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(526,) (37,)\n",
      "init state [2 1 0 1 0]\n",
      "(529,) (3,)\n",
      "init state [ 2  3  1 -3  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(571,) (42,)\n",
      "init state [1 3 1 0 0]\n",
      "(573,) (2,)\n",
      "============ 22 ===========\n",
      "Run episode 22 with rewards 40, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.0488 if c>=1.0 & x2>=3.0\n",
      "   +0.1023 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0046 if c>=1.0 & x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.2855 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.0666 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3335 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.5336 if x4-x2<=-3.0\n",
      "   -0.0204 if x4-x2>=2.0\n",
      "   -0.8639 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1277 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.1731 if c<=0.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-2.0 & x4-x2>=0.0\n",
      "   -0.5689 if x1>=3.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   +0.2450 if x2<=2.0 & x3-x1<=-3.0\n",
      "   -0.2594 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   -0.0321 if x3-x1>=3.0\n",
      "   +0.7486 if x3-x1<=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.6517 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.3560 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1655 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0826 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.6546 if x4-x2<=-3.0\n",
      "   -0.3023 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.1883 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3125 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.3670 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.2037 if c<=0.0 & x1>=2.0 & x3-x1>=1.0\n",
      "   +0.1106 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.5129 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0988 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.7597 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0359 if x3-x1>=3.0\n",
      "   +0.3013 if x2<=0.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.4745 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0707 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +1.8013 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +2.5415 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.9485 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +3.8580 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   +0.3154 if x4-x2>=-2.0\n",
      "   +0.5186 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.5226 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.0758 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +0.1687 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.7722 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.1681 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.7146 if c<=0.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2>=3.0\n",
      "   +0.1834 if c<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.0618 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1451 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.2449 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -1.3383 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.2333 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.3424 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.0545 if x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.6570 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.1847 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.3119 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.1801 if x3-x1<=-3.0\n",
      "   +0.6568 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -1.2040 if x2>=3.0\n",
      "   -0.6369 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.2891 if x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.4553 if c<=0.0 & x1<=0.0 & x4-x2>=1.0\n",
      "init state [ 3  2 -3  1  0]\n",
      "(20,) (20,)\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(56,) (36,)\n",
      "init state [ 2  0 -1  1  0]\n",
      "(172,) (116,)\n",
      "init state [ 2  3 -1 -1  0]\n",
      "(202,) (30,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(250,) (48,)\n",
      "init state [1 1 0 2 0]\n",
      "(383,) (133,)\n",
      "init state [1 0 2 1 0]\n",
      "(397,) (14,)\n",
      "init state [ 3  2 -3  0  0]\n",
      "(408,) (11,)\n",
      "init state [1 1 1 0 0]\n",
      "(416,) (8,)\n",
      "init state [ 3  2 -3 -2  0]\n",
      "(476,) (60,)\n",
      "============ 23 ===========\n",
      "Run episode 23 with rewards -18, accuracy 0.0\n",
      "----------------- 0 --------------\n",
      "   -0.3578 if c>=1.0 & x2>=3.0\n",
      "   +0.1945 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2062 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.1996 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2804 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2337 if x4-x2<=-3.0\n",
      "   +0.1603 if x4-x2>=2.0\n",
      "   -0.2149 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4007 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0506 if c<=0.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-2.0 & x4-x2>=0.0\n",
      "   +0.0011 if x1>=3.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   +0.5623 if x2<=2.0 & x3-x1<=-3.0\n",
      "   +0.1144 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.1310 if x3-x1>=3.0\n",
      "   +0.5057 if x3-x1<=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.7708 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.4556 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0730 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.5987 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.6656 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4544 if x4-x2<=-3.0\n",
      "   -0.2025 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0597 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4579 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.0593 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0007 if c<=0.0 & x1>=2.0 & x3-x1>=1.0\n",
      "   +0.0722 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.6893 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1420 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5467 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0566 if x2<=0.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.2116 if x2>=2.0 & x3-x1<=-3.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.8932 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0384 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.8918 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.5203 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.4774 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.7684 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.4653 if x4-x2>=-2.0\n",
      "   +0.2018 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.3031 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.1930 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +0.0250 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.0544 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.0121 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0340 if c<=0.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.4941 if c<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0\n",
      "   -0.3111 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.7247 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.4710 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.6145 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0407 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.1904 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.8475 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.6536 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.3270 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.7161 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.3103 if x3-x1<=-3.0\n",
      "   +0.2839 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.0491 if x2>=3.0\n",
      "   +0.4070 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.2131 if x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0788 if c<=0.0 & x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0079 if x1>=3.0 & x3-x1>=0.0 & x4-x2<=0.0\n",
      "init state [ 0  1  2 -1  0]\n",
      "(46,) (46,)\n",
      "init state [ 0  3  1 -3  0]\n",
      "(119,) (73,)\n",
      "init state [ 3  0 -1  0  0]\n",
      "(134,) (15,)\n",
      "init state [0 0 3 0 0]\n",
      "(223,) (89,)\n",
      "init state [3 1 0 1 0]\n",
      "(227,) (4,)\n",
      "init state [ 1  2 -1 -1  0]\n",
      "(261,) (34,)\n",
      "init state [ 0  2  0 -1  0]\n",
      "(316,) (55,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(348,) (32,)\n",
      "init state [0 1 0 2 0]\n",
      "(356,) (8,)\n",
      "init state [ 3  2 -3  0  0]\n",
      "(375,) (19,)\n",
      "============ 24 ===========\n",
      "Run episode 24 with rewards 23, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.0212 if c>=1.0 & x2>=3.0\n",
      "   -0.0806 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.8470 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.5972 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4588 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1220 if x4-x2<=-3.0\n",
      "   -0.0185 if x4-x2>=2.0\n",
      "   -0.0762 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1850 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0812 if c<=0.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-2.0 & x4-x2>=0.0\n",
      "   +0.0595 if x2<=2.0 & x3-x1<=-3.0\n",
      "   -0.4977 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.0605 if x3-x1>=3.0\n",
      "   +0.0691 if x3-x1<=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2617 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.4231 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   -0.0461 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.1449 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.7294 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2829 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.1710 if x4-x2<=-3.0\n",
      "   -0.2562 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.4886 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.6763 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.0213 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1302 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0755 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.9422 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0836 if x2<=0.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.3500 if x2>=2.0 & x3-x1<=-3.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.5358 if x1>=3.0 & x2<=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.3349 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.4130 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.6241 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1056 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.6639 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.0723 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.4185 if x4-x2>=-2.0\n",
      "   +0.2761 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.3796 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.0204 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.1738 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.4140 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.5630 if c<=0.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.1725 if c<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0\n",
      "   +0.0900 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   +0.8178 if x3-x1>=-2.0 & x4-x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.7357 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1578 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.3517 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0059 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0011 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0\n",
      "   +0.2793 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1279 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0053 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.5689 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.1958 if x3-x1<=-3.0\n",
      "   +0.5238 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.6943 if x2>=3.0\n",
      "   +0.1332 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.2229 if x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.2796 if c<=0.0 & x1<=0.0 & x4-x2>=1.0\n",
      "   -0.5906 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "init state [2 2 1 0 0]\n",
      "(2,) (2,)\n",
      "init state [ 1  2 -1 -2  0]\n",
      "(24,) (22,)\n",
      "init state [ 2  2 -2  1  0]\n",
      "(38,) (14,)\n",
      "init state [0 3 1 0 0]\n",
      "(42,) (4,)\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(114,) (72,)\n",
      "init state [0 0 1 1 0]\n",
      "(129,) (15,)\n",
      "init state [0 1 1 1 0]\n",
      "(143,) (14,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(151,) (8,)\n",
      "init state [1 2 1 1 0]\n",
      "(175,) (24,)\n",
      "init state [ 1  3  1 -1  0]\n",
      "(179,) (4,)\n",
      "============ 25 ===========\n",
      "Run episode 25 with rewards 38, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.2442 if c>=1.0 & x2>=3.0\n",
      "   -0.4283 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2317 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.5888 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1496 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0494 if x4-x2<=-3.0\n",
      "   -0.2593 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6274 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.3413 if c<=0.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-2.0 & x4-x2>=0.0\n",
      "   -0.4099 if x2<=2.0 & x3-x1<=-3.0\n",
      "   -0.0737 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   -0.0000 if x3-x1>=3.0\n",
      "   +0.5050 if x3-x1<=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3678 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.2676 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.8310 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.3220 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.2686 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.6116 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.8378 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0589 if x4-x2<=-3.0\n",
      "   -0.4213 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.3131 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.6165 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.0627 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0141 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1629 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5880 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1594 if x2<=0.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.1881 if x2>=2.0 & x3-x1<=-3.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0811 if x1>=3.0 & x2<=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.3880 if x3-x1>=1.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.0257 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.1225 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.8617 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0993 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.2687 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.1805 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.4061 if x4-x2>=-2.0\n",
      "   +0.3819 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.0732 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.0752 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.5679 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.0028 if c<=0.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   -0.2079 if c<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0\n",
      "   -0.2456 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.0142 if x3-x1>=-2.0 & x4-x2<=0.0\n",
      "   -0.4774 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.7911 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.3713 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.3752 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.8222 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0538 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.4127 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.3899 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.6548 if x3-x1<=-3.0\n",
      "   +0.5039 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.0368 if x2>=3.0\n",
      "   +0.3752 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.4374 if x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.2474 if c<=0.0 & x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2753 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.4078 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "init state [0 0 2 1 0]\n",
      "(23,) (23,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(52,) (29,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(65,) (13,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(99,) (34,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(139,) (40,)\n",
      "init state [ 1  3  2 -3  0]\n",
      "(171,) (32,)\n",
      "init state [ 3  0 -2  1  0]\n",
      "(186,) (15,)\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(243,) (57,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(259,) (16,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(289,) (30,)\n",
      "============ 26 ===========\n",
      "Run episode 26 with rewards 12, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.2647 if c>=1.0 & x2>=3.0\n",
      "   -0.0644 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3082 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.9825 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4427 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.3388 if x4-x2<=-3.0\n",
      "   +0.0285 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1926 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0117 if c<=0.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-2.0 & x4-x2>=0.0\n",
      "   +0.1140 if x2<=2.0 & x3-x1<=-3.0\n",
      "   +0.0279 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.3377 if x3-x1<=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0226 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.1621 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.3045 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.3653 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.7952 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.4226 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1859 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.3299 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4746 if x4-x2<=-3.0\n",
      "   +0.0777 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.4105 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5807 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1317 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1024 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5674 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0189 if x2<=0.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.1505 if x2>=2.0 & x3-x1<=-3.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0971 if x1>=3.0 & x2<=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2>=2.0\n",
      "   -0.5491 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   -0.0381 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.1141 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +1.1298 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0976 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.3584 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.5173 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   +0.0180 if x4-x2>=-2.0\n",
      "   +0.2236 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.0155 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.3352 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.2239 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.1186 if c<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0\n",
      "   -0.0224 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.0793 if x3-x1>=-2.0 & x4-x2<=0.0\n",
      "   +0.0155 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.6742 if x2<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.1052 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2665 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.1052 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.3607 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1337 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.0085 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.4833 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.1050 if x3-x1<=-3.0\n",
      "   +1.1109 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.2666 if x2>=3.0\n",
      "   +0.5250 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.2561 if x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0356 if c<=0.0 & x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2661 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.3968 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.5361 if x1<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=2.0\n",
      "init state [ 1  3 -1 -3  0]\n",
      "(34,) (34,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(108,) (74,)\n",
      "init state [ 2  0 -2  1  0]\n",
      "(130,) (22,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(134,) (4,)\n",
      "init state [ 0  3  0 -3  0]\n",
      "(180,) (46,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(184,) (4,)\n",
      "init state [ 2  2  0 -2  0]\n",
      "(198,) (14,)\n",
      "init state [0 0 2 3 0]\n",
      "(218,) (20,)\n",
      "init state [ 1  2  1 -1  0]\n",
      "(229,) (11,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(240,) (11,)\n",
      "============ 27 ===========\n",
      "Run episode 27 with rewards 31, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.2574 if c>=1.0 & x2>=3.0\n",
      "   -0.2741 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3791 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.7899 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5744 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0219 if x4-x2<=-3.0\n",
      "   +0.1344 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3880 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.1799 if x2<=2.0 & x3-x1<=-3.0\n",
      "   +0.2202 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   -0.0299 if x3-x1<=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3844 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.1139 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.4508 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2126 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.3697 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.2927 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.2822 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.4073 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.3541 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0102 if x4-x2<=-3.0\n",
      "   +0.0232 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0937 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5214 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.3913 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.2391 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4964 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0185 if x2<=0.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0000 if x2>=2.0 & x3-x1<=-3.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0000 if x1>=3.0 & x2<=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1679 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.5589 if x1<=2.0 & x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.0209 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0481 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +1.1773 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.5577 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.2665 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.0065 if c<=0.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.1329 if x4-x2>=-2.0\n",
      "   -0.1155 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.2066 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.4814 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.3747 if c<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0\n",
      "   -0.1608 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.0393 if x3-x1>=-2.0 & x4-x2<=0.0\n",
      "   +0.1016 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2960 if x2<=1.0\n",
      "   +0.1258 if x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4291 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.3941 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.1059 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.3507 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1610 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.2394 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2326 if x3-x1<=-3.0\n",
      "   +0.9874 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.1907 if x2>=3.0\n",
      "   +0.1059 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0272 if x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0575 if c<=0.0 & x1<=0.0 & x4-x2>=1.0\n",
      "   -0.5493 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.3130 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0276 if x1<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=2.0\n",
      "   +0.2616 if x1>=3.0 & x4-x2>=3.0\n",
      "init state [ 1  0 -1  0  0]\n",
      "(59,) (59,)\n",
      "init state [ 0  3  3 -1  0]\n",
      "(81,) (22,)\n",
      "init state [0 2 1 0 0]\n",
      "(91,) (10,)\n",
      "init state [1 2 2 0 0]\n",
      "(108,) (17,)\n",
      "init state [ 2  3  1 -1  0]\n",
      "(112,) (4,)\n",
      "init state [ 3  2 -1 -1  0]\n",
      "(137,) (25,)\n",
      "init state [0 0 3 0 0]\n",
      "(193,) (56,)\n",
      "init state [ 2  1 -2  0  0]\n",
      "(233,) (40,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(246,) (13,)\n",
      "init state [ 3  2 -3  1  0]\n",
      "(311,) (65,)\n",
      "============ 28 ===========\n",
      "Run episode 28 with rewards -23, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.1241 if c>=1.0 & x2>=3.0\n",
      "   +0.1246 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0392 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.5739 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5441 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.6322 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0862 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0249 if x2<=2.0 & x3-x1<=-3.0\n",
      "   -0.2453 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.0054 if x3-x1<=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3834 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.2270 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.4667 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.1053 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0112 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.1690 if x1>=1.0 & x2>=2.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.2062 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.3052 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.2638 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2130 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0096 if x4-x2<=-3.0\n",
      "   -0.0174 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.1769 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3947 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.7582 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0398 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.6606 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0152 if x2<=0.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0301 if x2>=2.0 & x3-x1<=-3.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3051 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.0116 if x1<=2.0 & x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.5097 if c<=0.0 & x1>=1.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.1978 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.1689 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +1.0627 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0891 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.0509 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.3709 if x4-x2>=-2.0\n",
      "   +0.2332 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.0108 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.3218 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.0717 if c<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0\n",
      "   -0.0718 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.1454 if x3-x1>=-2.0 & x4-x2<=0.0\n",
      "   -0.0204 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3293 if x2<=1.0\n",
      "   -0.4393 if x4-x2>=-1.0\n",
      "   +0.9002 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.2524 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4283 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0976 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.0836 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0457 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0245 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.3732 if x3-x1<=-3.0\n",
      "   +0.8015 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3836 if x2>=3.0\n",
      "   +0.1730 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.1657 if c<=0.0 & x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0292 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.1404 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0088 if x1<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=2.0\n",
      "   -0.0000 if x1>=3.0 & x4-x2>=3.0\n",
      "   -0.8139 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "init state [ 0  3  0 -2  0]\n",
      "(15,) (15,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(46,) (31,)\n",
      "init state [0 3 2 0 0]\n",
      "(49,) (3,)\n",
      "init state [ 2  0 -2  0  0]\n",
      "(224,) (175,)\n",
      "init state [2 1 1 1 0]\n",
      "(228,) (4,)\n",
      "init state [ 1  1 -1  0  0]\n",
      "(235,) (7,)\n",
      "init state [0 2 2 0 0]\n",
      "(259,) (24,)\n",
      "init state [1 0 2 0 0]\n",
      "(288,) (29,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(362,) (74,)\n",
      "init state [ 2  3  1 -1  0]\n",
      "(367,) (5,)\n",
      "============ 29 ===========\n",
      "Run episode 29 with rewards 37, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.2600 if c>=1.0 & x2>=3.0\n",
      "   -0.0807 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2858 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.3966 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.7222 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0655 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1814 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.1018 if x2<=2.0 & x3-x1<=-3.0\n",
      "   -0.0218 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.4182 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.2199 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.4415 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0119 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0000 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   +0.0000 if x1>=1.0 & x2>=2.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.2743 if c<=0.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.3132 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.3601 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.6191 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.9348 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0668 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.2401 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.8031 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.2473 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1814 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2921 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0194 if x2<=0.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0000 if x2>=2.0 & x3-x1<=-3.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3166 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.0000 if x1<=2.0 & x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.0141 if c<=0.0 & x1>=1.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.3497 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.1318 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.1561 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.4176 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0503 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.4174 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.7750 if x4-x2>=-2.0\n",
      "   +0.7935 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.3989 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +4.0402 if c<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0\n",
      "   +2.7506 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.0195 if x3-x1>=-2.0 & x4-x2<=0.0\n",
      "   -0.3041 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3722 if x2<=1.0\n",
      "   -0.7721 if x4-x2>=-1.0\n",
      "   +0.1660 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0228 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3428 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3006 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.0000 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.2049 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.6525 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0436 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.3824 if x3-x1<=-3.0\n",
      "   +1.0695 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.0724 if x2>=3.0\n",
      "   -0.0000 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0000 if c<=0.0 & x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2384 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.1389 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0384 if x1<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=2.0\n",
      "   +0.3607 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2204 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "init state [3 1 0 1 0]\n",
      "(5,) (5,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(21,) (16,)\n",
      "init state [ 0  3  1 -3  0]\n",
      "(39,) (18,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(73,) (34,)\n",
      "init state [ 2  0 -1  1  0]\n",
      "(87,) (14,)\n",
      "init state [ 1  2 -1  0  0]\n",
      "(92,) (5,)\n",
      "init state [ 3  0 -1  0  0]\n",
      "(107,) (15,)\n",
      "init state [0 0 1 2 0]\n",
      "(117,) (10,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(157,) (40,)\n",
      "init state [ 2  1 -2  0  0]\n",
      "(218,) (61,)\n",
      "============ 30 ===========\n",
      "Run episode 30 with rewards -19, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.2969 if c>=1.0 & x2>=3.0\n",
      "   +0.3998 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.4651 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.1366 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5033 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0438 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1231 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.1733 if x2<=2.0 & x3-x1<=-3.0\n",
      "   -0.1602 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.2832 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.0239 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.2705 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0000 if x1>=1.0 & x2>=2.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.6609 if c<=0.0 & x2<=0.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.5795 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.3559 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.5598 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.3954 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1955 if x1>=2.0 & x4-x2>=0.0\n",
      "   +1.0718 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.8613 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.0284 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0152 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5563 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0861 if x2<=0.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x2>=2.0 & x3-x1<=-3.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0184 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.0000 if c<=0.0 & x1>=1.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.2190 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.4068 if x1>=3.0 & x4-x2<=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.3459 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.0697 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.8821 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2440 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.5067 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.1371 if x4-x2>=-2.0\n",
      "   +0.2417 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.0808 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.2746 if c<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0\n",
      "   +0.1074 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   +0.1857 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0824 if x2<=1.0\n",
      "   -0.4835 if x4-x2>=-1.0\n",
      "   -0.2306 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0167 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.5333 if x1<=0.0 & x2<=2.0 & x3-x1<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.2587 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0393 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.1028 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.3708 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.5052 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.1107 if x3-x1<=-3.0\n",
      "   +0.7307 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.1149 if x2>=3.0\n",
      "   -0.4173 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.0103 if c<=0.0 & x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1128 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.4611 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1>=2.0\n",
      "   -0.0198 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1670 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.6031 if c<=0.0 & x1<=1.0 & x1>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "init state [ 2  2 -2 -1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(51,) (51,)\n",
      "init state [ 3  2 -3 -2  0]\n",
      "(77,) (26,)\n",
      "init state [ 3  0 -2  0  0]\n",
      "(94,) (17,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(133,) (39,)\n",
      "init state [ 1  3  0 -2  0]\n",
      "(158,) (25,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(203,) (45,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(228,) (25,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(286,) (58,)\n",
      "init state [0 1 1 2 0]\n",
      "(291,) (5,)\n",
      "init state [ 3  1 -3  2  0]\n",
      "(338,) (47,)\n",
      "============ 31 ===========\n",
      "Run episode 31 with rewards -5, accuracy 0.1\n",
      "----------------- 0 --------------\n",
      "   -0.3789 if c>=1.0 & x2>=3.0\n",
      "   -0.0864 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.4205 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.3258 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3394 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1209 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4025 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.1684 if x2<=2.0 & x3-x1<=-3.0\n",
      "   -0.3161 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.5430 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.2668 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.0539 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0000 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0000 if c<=0.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.0000 if c<=0.0 & x2<=0.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.6260 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.3288 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0906 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.5574 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.0609 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0888 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.3350 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5357 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1919 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0644 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5970 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0106 if x2<=0.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.0458 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.0411 if c<=0.0 & x1>=1.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.4387 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.4614 if x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.4505 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   -0.2188 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0634 if c>=1.0 & x1>=3.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +1.3918 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3529 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.2027 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.1857 if x4-x2>=-2.0\n",
      "   +0.4126 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.0642 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.0714 if c<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0\n",
      "   +0.1919 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.1704 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4011 if x2<=1.0\n",
      "   -0.4619 if x4-x2>=-1.0\n",
      "   -0.5105 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.1542 if x1<=0.0 & x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3682 if x1<=0.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.2580 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1471 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.0070 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.6216 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1515 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.1976 if x3-x1<=-3.0\n",
      "   +0.7228 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.1837 if x2>=3.0\n",
      "   +0.3251 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.0643 if c<=0.0 & x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1554 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.3452 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1924 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1297 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2599 if c<=0.0 & x1<=1.0 & x1>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +1.0244 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "init state [0 2 1 0 0]\n",
      "(9,) (9,)\n",
      "init state [ 3  0 -1  0  0]\n",
      "(49,) (40,)\n",
      "init state [3 1 0 1 0]\n",
      "(51,) (2,)\n",
      "init state [ 2  2  0 -1  0]\n",
      "(78,) (27,)\n",
      "init state [0 0 3 1 0]\n",
      "(121,) (43,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(142,) (21,)\n",
      "init state [0 3 1 0 0]\n",
      "(168,) (26,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(206,) (38,)\n",
      "init state [1 1 2 0 0]\n",
      "(235,) (29,)\n",
      "init state [1 0 2 1 0]\n",
      "(249,) (14,)\n",
      "============ 32 ===========\n",
      "Run episode 32 with rewards 28, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.3436 if c>=1.0 & x2>=3.0\n",
      "   -0.0534 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1829 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.0653 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4718 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0518 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1298 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0569 if x2<=2.0 & x3-x1<=-3.0\n",
      "   -0.1380 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.2051 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.2632 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.4251 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0802 if c<=0.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x2<=0.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.0000 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.4778 if c<=0.0 & x1>=3.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.4575 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0133 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.3461 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2436 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.2536 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.1795 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4582 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.2143 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1337 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5727 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1719 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.3186 if c<=0.0 & x1>=1.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.0127 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.2789 if x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.0534 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.7303 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.0243 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.9939 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1812 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.6411 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.2916 if x4-x2>=-2.0\n",
      "   -0.0218 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.2557 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.1076 if c<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0\n",
      "   +0.0877 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.0539 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2366 if x2<=1.0\n",
      "   -0.2972 if x4-x2>=-1.0\n",
      "   -0.2679 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0445 if x1<=0.0 & x2<=2.0 & x3-x1<=0.0\n",
      "   -0.0844 if x1<=0.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.7694 if x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.3548 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.3484 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.9916 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1453 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.1907 if x3-x1<=-3.0\n",
      "   +0.4597 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.1612 if x2>=3.0\n",
      "   -0.0000 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0239 if c<=0.0 & x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2223 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0000 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4805 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.1046 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.1839 if c<=0.0 & x1<=1.0 & x1>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3737 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2065 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-2.0\n",
      "init state [ 0  3  1 -1  0]\n",
      "(8,) (8,)\n",
      "init state [ 2  3 -2 -1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(50,) (42,)\n",
      "init state [2 0 0 2 0]\n",
      "(75,) (25,)\n",
      "init state [ 1  1 -1  0  0]\n",
      "(99,) (24,)\n",
      "init state [1 0 2 1 0]\n",
      "(120,) (21,)\n",
      "init state [ 3  0 -1  1  0]\n",
      "(142,) (22,)\n",
      "init state [ 1  3  0 -3  0]\n",
      "(184,) (42,)\n",
      "init state [ 3  2 -1  0  0]\n",
      "(212,) (28,)\n",
      "init state [0 1 1 1 0]\n",
      "(223,) (11,)\n",
      "init state [ 3  0 -2  1  0]\n",
      "(252,) (29,)\n",
      "============ 33 ===========\n",
      "Run episode 33 with rewards 13, accuracy 0.1\n",
      "----------------- 0 --------------\n",
      "   -0.4645 if c>=1.0 & x2>=3.0\n",
      "   -0.3092 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1194 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.4146 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1511 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0939 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4229 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.1121 if x2<=2.0 & x3-x1<=-3.0\n",
      "   -0.0724 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.0837 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.3569 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.3636 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0000 if c<=0.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.1695 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.0966 if c<=0.0 & x1>=3.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.1967 if x3-x1>=3.0 & x4-x2<=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.4000 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0466 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.4860 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2491 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0763 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.2859 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.7289 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1359 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.2918 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4185 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0022 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.1502 if c<=0.0 & x1>=1.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   -0.1014 if x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.2427 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2364 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.1872 if x3-x1<=-1.0 & x4-x2<=-3.0\n",
      "----------------- 2 --------------\n",
      "   +0.1252 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.7287 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0512 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.5550 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.1099 if x4-x2>=-2.0\n",
      "   -0.2564 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.0224 if c<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0\n",
      "   +0.0340 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   +0.1111 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4033 if x2<=1.0\n",
      "   +0.0799 if x4-x2>=-1.0\n",
      "   +0.0066 if x1>=3.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.2665 if x1<=0.0 & x2<=2.0 & x3-x1<=0.0\n",
      "   -0.1278 if x1<=0.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.6651 if x4-x2>=0.0\n",
      "   +0.4237 if x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.6110 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.5405 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.5110 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1881 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.3332 if x3-x1<=-3.0\n",
      "   +0.4415 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.1292 if x2>=3.0\n",
      "   -0.0476 if c<=0.0 & x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3040 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.1483 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.5209 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2973 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.1203 if c<=0.0 & x1<=1.0 & x1>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.8880 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if c>=1.0 & x3-x1<=-3.0 & x4-x2<=-2.0\n",
      "   -0.0487 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "init state [ 2  1 -1  0  0]\n",
      "(30,) (30,)\n",
      "init state [ 3  1 -1  1  0]\n",
      "(34,) (4,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(64,) (30,)\n",
      "init state [2 1 1 0 0]\n",
      "(70,) (6,)\n",
      "init state [ 2  2 -2 -1  0]\n",
      "(87,) (17,)\n",
      "init state [2 0 1 0 0]\n",
      "(103,) (16,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(116,) (13,)\n",
      "init state [0 3 1 0 0]\n",
      "(119,) (3,)\n",
      "init state [ 1  2  0 -1  0]\n",
      "(138,) (19,)\n",
      "init state [1 1 1 0 0]\n",
      "(159,) (21,)\n",
      "============ 34 ===========\n",
      "Run episode 34 with rewards 21, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.2822 if c>=1.0 & x2>=3.0\n",
      "   -0.0930 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0230 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.6508 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.6276 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0951 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2773 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.2665 if x2<=2.0 & x3-x1<=-3.0\n",
      "   -0.2905 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.1307 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.2300 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.7123 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.1605 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.0000 if c<=0.0 & x1>=3.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0283 if x3-x1>=3.0 & x4-x2<=-1.0\n",
      "   +0.0810 if x1>=2.0 & x4-x2<=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.0843 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.2031 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.3398 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.7163 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.2777 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0891 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.8473 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.5528 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1727 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2055 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0000 if c<=0.0 & x1>=1.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   -0.1178 if x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.3692 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3115 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0000 if x3-x1<=-1.0 & x4-x2<=-3.0\n",
      "   +0.4079 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   -0.0524 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.7843 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1612 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.4030 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.0512 if x4-x2>=-2.0\n",
      "   -0.1084 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.3379 if c<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0\n",
      "   +0.2358 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.0691 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3127 if x2<=1.0\n",
      "   -0.1977 if x4-x2>=-1.0\n",
      "   -0.0153 if x1<=0.0 & x2<=2.0 & x3-x1<=0.0\n",
      "   -0.1931 if x1<=0.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.5666 if x4-x2>=0.0\n",
      "   +0.4244 if x4-x2<=-1.0\n",
      "   -0.3777 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.5561 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2197 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.6122 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.0096 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0800 if x3-x1<=-3.0\n",
      "   +0.9340 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.0952 if x2>=3.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1591 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.2866 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2576 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x1>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.5119 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0916 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.5708 if x1<=2.0 & x4-x2>=-2.0\n",
      "init state [ 0  3  0 -3  0]\n",
      "(47,) (47,)\n",
      "init state [ 0  3  0 -2  0]\n",
      "(62,) (15,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(75,) (13,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(86,) (11,)\n",
      "init state [2 0 0 3 0]\n",
      "(93,) (7,)\n",
      "init state [ 2  3 -1 -1  0]\n",
      "(99,) (6,)\n",
      "init state [ 1  0 -1  2  0]\n",
      "(122,) (23,)\n",
      "init state [ 3  1 -1  2  0]\n",
      "(128,) (6,)\n",
      "init state [ 1  3  2 -3  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(154,) (26,)\n",
      "init state [ 1  1 -1  0  0]\n",
      "(178,) (24,)\n",
      "============ 35 ===========\n",
      "Run episode 35 with rewards 18, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.1602 if c>=1.0 & x2>=3.0\n",
      "   +0.1317 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2961 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.8068 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3533 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2519 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1942 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0484 if x2<=2.0 & x3-x1<=-3.0\n",
      "   -0.2548 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.1917 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.6159 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.3172 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0000 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.0579 if x3-x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.0786 if x1>=2.0 & x4-x2<=-2.0\n",
      "   -0.2412 if x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.2494 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.2197 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.4506 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.3987 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.2641 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1133 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -1.1032 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.2999 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3842 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5137 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.5247 if x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.0215 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1625 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.1309 if x3-x1<=-1.0 & x4-x2<=-3.0\n",
      "   +0.0978 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   +0.4428 if x3-x1>=0.0 & x4-x2>=3.0\n",
      "----------------- 2 --------------\n",
      "   -0.0844 if x1<=2.0 & x4-x2>=1.0\n",
      "   +1.1379 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1856 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.5545 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.4797 if x4-x2>=-2.0\n",
      "   -0.3846 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.2255 if c<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0\n",
      "   +0.2727 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.1427 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3060 if x2<=1.0\n",
      "   -0.2383 if x4-x2>=-1.0\n",
      "   +0.0023 if x1<=0.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.8235 if x4-x2>=0.0\n",
      "   +0.6128 if x4-x2<=-1.0\n",
      "   +0.1022 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.6507 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.5239 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2199 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.1998 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1327 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.1116 if x3-x1<=-3.0\n",
      "   +0.7210 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.0985 if x2>=3.0\n",
      "   -0.2522 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0341 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0699 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0000 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.0000 if c<=0.0 & x1<=1.0 & x1>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.5730 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2158 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -1.1020 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.6020 if x4-x2<=2.0 & x4-x2>=-2.0\n",
      "init state [ 1  2  0 -2  0]\n",
      "(20,) (20,)\n",
      "init state [0 1 3 0 0]\n",
      "(40,) (20,)\n",
      "init state [2 0 0 3 0]\n",
      "(51,) (11,)\n",
      "init state [0 0 2 2 0]\n",
      "(62,) (11,)\n",
      "init state [0 2 2 1 0]\n",
      "(73,) (11,)\n",
      "init state [ 1  2  0 -2  0]\n",
      "(85,) (12,)\n",
      "init state [ 2  2  0 -2  0]\n",
      "(93,) (8,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(127,) (34,)\n",
      "init state [ 1  3  2 -1  0]\n",
      "(153,) (26,)\n",
      "init state [0 0 2 0 0]\n",
      "(177,) (24,)\n",
      "============ 36 ===========\n",
      "Run episode 36 with rewards 18, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.0744 if c>=1.0 & x2>=3.0\n",
      "   -0.3123 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.4715 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3881 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1279 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3319 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0000 if x2<=2.0 & x3-x1<=-3.0\n",
      "   -0.2544 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.5795 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.1204 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.1217 if x3-x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.3341 if x1>=2.0 & x4-x2<=-2.0\n",
      "   -0.1939 if x4-x2>=3.0\n",
      "   +0.5240 if x1>=3.0 & x2>=3.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.0000 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.2956 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.3578 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.5766 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.5777 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0953 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.7516 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1951 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.5698 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2404 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.4651 if x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.1007 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0000 if x3-x1<=-1.0 & x4-x2<=-3.0\n",
      "   -0.2116 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   +0.2929 if x3-x1>=0.0 & x4-x2>=3.0\n",
      "   +0.5411 if x3-x1>=2.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.0325 if x1<=2.0 & x4-x2>=1.0\n",
      "   +1.0947 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3445 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.4203 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.0341 if x4-x2>=-2.0\n",
      "   -0.0954 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0\n",
      "   +0.0000 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.0112 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0351 if x2<=1.0\n",
      "   -0.5693 if x4-x2>=-1.0\n",
      "   -0.5494 if x4-x2>=0.0\n",
      "   +0.5153 if x4-x2<=-1.0\n",
      "   -0.1185 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.3565 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4341 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.3545 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2681 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.6810 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1491 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0000 if x3-x1<=-3.0\n",
      "   +0.9455 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.0215 if x2>=3.0\n",
      "   -0.0000 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.1077 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0769 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0292 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.3545 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0000 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -1.0781 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.7102 if x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.4555 if x1<=2.0 & x4-x2>=2.0\n",
      "init state [ 1  1 -1  2  0]\n",
      "(23,) (23,)\n",
      "init state [0 0 2 1 0]\n",
      "(45,) (22,)\n",
      "init state [0 1 3 1 0]\n",
      "(52,) (7,)\n",
      "init state [0 0 1 0 0]\n",
      "(76,) (24,)\n",
      "init state [ 2  1 -2  1  0]\n",
      "(89,) (13,)\n",
      "init state [ 1  3  1 -2  0]\n",
      "(99,) (10,)\n",
      "init state [ 3  1 -1 -1  0]\n",
      "(117,) (18,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(134,) (17,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(143,) (9,)\n",
      "init state [0 1 1 1 0]\n",
      "(159,) (16,)\n",
      "============ 37 ===========\n",
      "Run episode 37 with rewards 26, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.6914 if c>=1.0 & x2>=3.0\n",
      "   -0.5233 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1572 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.9127 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3746 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1495 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4787 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.1574 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.1846 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.5305 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.4379 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0000 if x3-x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.1416 if x1>=2.0 & x4-x2<=-2.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +0.4904 if x1>=3.0 & x2>=3.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5329 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   +0.6798 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0954 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.2679 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.0475 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.3451 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.4001 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2185 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.4341 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0870 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2404 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.4274 if x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.4342 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.1410 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x3-x1>=0.0 & x4-x2>=3.0\n",
      "   +0.0874 if x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.3063 if x3-x1>=3.0\n",
      "----------------- 2 --------------\n",
      "   -0.2390 if x1<=2.0 & x4-x2>=1.0\n",
      "   +1.0225 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3752 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.3463 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.1605 if x4-x2>=-2.0\n",
      "   -0.0529 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.2310 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.2712 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4577 if x2<=1.0\n",
      "   -0.1432 if x4-x2>=-1.0\n",
      "   -0.6578 if x4-x2>=0.0\n",
      "   +0.4187 if x4-x2<=-1.0\n",
      "   -0.1915 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.2455 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3630 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5895 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.1558 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.5495 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.3945 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.2128 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5499 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.2434 if x2>=3.0\n",
      "   +0.0634 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.1900 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1575 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.2494 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.6333 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2653 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.6053 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1510 if x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.0107 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.9404 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "init state [0 0 1 0 0]\n",
      "(11,) (11,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(38,) (27,)\n",
      "init state [0 0 1 1 0]\n",
      "(47,) (9,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(104,) (57,)\n",
      "init state [2 1 1 0 0]\n",
      "(113,) (9,)\n",
      "init state [ 2  2 -2  0  0]\n",
      "(136,) (23,)\n",
      "init state [1 2 2 0 0]\n",
      "(153,) (17,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(162,) (9,)\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(186,) (24,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(197,) (11,)\n",
      "============ 38 ===========\n",
      "Run episode 38 with rewards 31, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.2331 if c>=1.0 & x2>=3.0\n",
      "   -0.3458 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0842 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.8174 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3331 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2099 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0138 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0307 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.3454 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.2911 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.4241 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0479 if x1>=2.0 & x4-x2<=-2.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +0.0714 if x1>=3.0 & x2>=3.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3773 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.6606 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.4127 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0682 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.2126 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2278 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.3880 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.4981 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.6007 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.4046 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0566 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.6125 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.5758 if x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.1043 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.1816 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   -0.0305 if x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.0330 if x3-x1>=3.0\n",
      "   -0.4400 if x1>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.2368 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.3690 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0895 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.1653 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.3838 if x4-x2>=-2.0\n",
      "   +0.3547 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.2680 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3326 if x2<=1.0\n",
      "   -0.1197 if x4-x2>=-1.0\n",
      "   -0.3883 if x4-x2>=0.0\n",
      "   +0.2565 if x4-x2<=-1.0\n",
      "   +0.1385 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.0078 if c<=0.0 & x1<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.1203 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2312 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   +0.5182 if c<=0.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.0688 if x1>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.3263 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.2825 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.2160 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5950 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.3488 if x2>=3.0\n",
      "   -0.5816 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.2544 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3245 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.2029 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.4337 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.4446 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.2600 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.1965 if x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.7984 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.2557 if x3-x1<=-3.0 & x4-x2<=0.0\n",
      "init state [ 0  2  2 -1  0]\n",
      "(23,) (23,)\n",
      "init state [ 2  0 -2  1  0]\n",
      "(40,) (17,)\n",
      "init state [0 0 2 2 0]\n",
      "(58,) (18,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(67,) (9,)\n",
      "init state [0 1 1 1 0]\n",
      "(90,) (23,)\n",
      "init state [ 1  2  1 -1  0]\n",
      "(106,) (16,)\n",
      "init state [ 1  3  0 -2  0]\n",
      "(116,) (10,)\n",
      "init state [1 0 1 2 0]\n",
      "(129,) (13,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(143,) (14,)\n",
      "init state [1 0 2 1 0]\n",
      "(153,) (10,)\n",
      "============ 39 ===========\n",
      "Run episode 39 with rewards 32, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.0653 if c>=1.0 & x2>=3.0\n",
      "   -0.1499 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.5161 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.6560 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4306 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1447 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2456 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0701 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.1530 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.0480 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.7494 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.2365 if x1>=2.0 & x4-x2<=-2.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.6428 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.6745 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   -0.1744 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.1560 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.4101 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.4448 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.4536 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.2567 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.3128 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4712 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.3380 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.5231 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2552 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1313 if x1>=3.0 & x4-x2<=-1.0\n",
      "   +0.3169 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.1535 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   +0.0049 if x1>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.4189 if x4-x2>=2.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   -0.3198 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.3780 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3034 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.3543 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.1608 if x4-x2>=-2.0\n",
      "   +0.0000 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.3465 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4283 if x2<=1.0\n",
      "   +0.0397 if x4-x2>=-1.0\n",
      "   -0.5863 if x4-x2>=0.0\n",
      "   +0.4255 if x4-x2<=-1.0\n",
      "   -0.1133 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.1677 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   +0.1222 if c<=0.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1293 if x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   -0.2082 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.1917 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0858 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.9345 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.1625 if x2>=3.0\n",
      "   -0.3706 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.2998 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0854 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.2355 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.6147 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2378 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.5963 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.0767 if x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.3807 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1896 if x3-x1<=-3.0 & x4-x2<=0.0\n",
      "   -0.2163 if x1<=2.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "init state [ 2  0 -2  0  0]\n",
      "(28,) (28,)\n",
      "init state [1 0 2 2 0]\n",
      "(35,) (7,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(55,) (20,)\n",
      "init state [1 0 2 0 0]\n",
      "(95,) (40,)\n",
      "init state [0 1 1 0 0]\n",
      "(101,) (6,)\n",
      "init state [ 1  1 -1  1  0]\n",
      "(122,) (21,)\n",
      "init state [1 2 0 1 0]\n",
      "(162,) (40,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(188,) (26,)\n",
      "init state [ 2  1 -2  2  0]\n",
      "(210,) (22,)\n",
      "init state [0 0 2 2 0]\n",
      "(229,) (19,)\n",
      "============ 40 ===========\n",
      "Run episode 40 with rewards 23, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.3802 if c>=1.0 & x2>=3.0\n",
      "   +0.1551 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.4807 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.2082 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5109 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2237 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0794 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0623 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.4959 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.7166 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.6217 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0324 if x1>=2.0 & x4-x2<=-2.0\n",
      "   +0.2272 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.3576 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   -0.5905 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.1294 if x1>=3.0 & x4-x2<=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.4024 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.3196 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.2026 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.1668 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.2817 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.1434 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.9238 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.0589 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.2326 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.7212 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0451 if x1>=3.0 & x4-x2<=-1.0\n",
      "   +0.7655 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.3048 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   +0.3715 if x1>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0532 if x4-x2>=2.0\n",
      "   +0.4026 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.5922 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.3813 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.3544 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.5524 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.1837 if x4-x2>=-2.0\n",
      "   +0.1327 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.3665 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4026 if x2<=1.0\n",
      "   -0.2630 if x4-x2>=-1.0\n",
      "   -0.4661 if x4-x2>=0.0\n",
      "   +0.1135 if x4-x2<=-1.0\n",
      "   +0.1251 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.1050 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4882 if c<=0.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1019 if x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.1152 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.1264 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.6014 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0902 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.3921 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.1580 if x2>=3.0\n",
      "   -0.3530 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.3425 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1580 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.4147 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.8014 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.3730 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.4871 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4611 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1718 if x3-x1<=-3.0 & x4-x2<=0.0\n",
      "   -0.0340 if x1<=2.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.4735 if c>=1.0 & x2>=2.0 & x3-x1>=-2.0\n",
      "init state [ 3  1 -2  0  0]\n",
      "(6,) (6,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(36,) (30,)\n",
      "init state [ 1  2  1 -2  0]\n",
      "(43,) (7,)\n",
      "init state [0 1 0 1 0]\n",
      "(59,) (16,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(87,) (28,)\n",
      "init state [ 3  2 -3  0  0]\n",
      "(159,) (72,)\n",
      "init state [1 0 1 0 0]\n",
      "(166,) (7,)\n",
      "init state [0 0 1 2 0]\n",
      "(178,) (12,)\n",
      "init state [1 1 0 1 0]\n",
      "(184,) (6,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(215,) (31,)\n",
      "============ 41 ===========\n",
      "Run episode 41 with rewards 11, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.3025 if c>=1.0 & x2>=3.0\n",
      "   -0.0314 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3507 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.3304 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1559 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2475 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2249 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0446 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.1759 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.0134 if x1>=2.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.3884 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2514 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.7971 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   -0.0997 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1371 if x1>=3.0 & x4-x2<=-2.0\n",
      "   +0.6298 if c<=0.0 & x2<=1.0 & x3-x1<=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.3596 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.3007 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1650 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.1750 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.1214 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.2197 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -1.0409 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.2792 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.5842 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2298 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0007 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0000 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   +0.0691 if x1>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.3784 if x4-x2>=2.0\n",
      "   +0.2714 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.7944 if c<=0.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.2959 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.6783 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1977 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.2777 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.0745 if x4-x2>=-2.0\n",
      "   +1.2005 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.3851 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.9671 if x2<=1.0\n",
      "   +0.0102 if x4-x2>=-1.0\n",
      "   -0.5973 if x4-x2>=0.0\n",
      "   +0.8461 if x4-x2<=-1.0\n",
      "   -0.1244 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.2122 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5846 if c<=0.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3709 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0627 if c<=0.0 & x2>=3.0 & x3-x1>=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   -0.2495 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.5484 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.3752 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.7130 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.1870 if x2>=3.0\n",
      "   -0.2755 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.3713 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2002 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0654 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.5768 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.5141 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.2630 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4674 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1194 if x3-x1<=-3.0 & x4-x2<=0.0\n",
      "   +0.5001 if c>=1.0 & x2>=2.0 & x3-x1>=-2.0\n",
      "   -0.6900 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "init state [ 1  2  2 -1  0]\n",
      "(9,) (9,)\n",
      "init state [ 3  0 -2  2  0]\n",
      "(26,) (17,)\n",
      "init state [0 0 1 1 0]\n",
      "(38,) (12,)\n",
      "init state [1 0 1 2 0]\n",
      "(51,) (13,)\n",
      "init state [ 0  3  3 -1  0]\n",
      "(56,) (5,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(79,) (23,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(103,) (24,)\n",
      "init state [3 0 0 1 0]\n",
      "(107,) (4,)\n",
      "init state [0 0 1 2 0]\n",
      "(113,) (6,)\n",
      "init state [ 2  0 -2  0  0]\n",
      "(131,) (18,)\n",
      "============ 42 ===========\n",
      "Run episode 42 with rewards 24, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.2928 if c>=1.0 & x2>=3.0\n",
      "   -0.4328 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1177 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.3505 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4164 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0101 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1050 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1>=2.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.1796 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.3724 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0789 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.6460 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.2026 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0000 if x1>=3.0 & x4-x2<=-2.0\n",
      "   +0.7559 if c<=0.0 & x2<=1.0 & x3-x1<=-2.0\n",
      "   -0.3269 if x3-x1>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.1410 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0000 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0111 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.3849 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1519 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.3557 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -1.0306 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.3831 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.4600 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2967 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0957 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.1496 if x1>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2995 if x4-x2>=2.0\n",
      "   +0.2538 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.4699 if c<=0.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.7454 if x3-x1>=3.0\n",
      "----------------- 2 --------------\n",
      "   -0.2656 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0000 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2959 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.0136 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.0109 if x4-x2>=-2.0\n",
      "   -0.0000 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.3477 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.6363 if x2<=1.0\n",
      "   -1.0014 if x4-x2>=0.0\n",
      "   +0.7297 if x4-x2<=-1.0\n",
      "   -0.1443 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.6200 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0000 if c<=0.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0951 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1999 if c<=0.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.2098 if x2>=3.0 & x3-x1>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.0204 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.5561 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0414 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.6920 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.1631 if x2>=3.0\n",
      "   -0.0550 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.3628 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0735 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +1.0392 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.3517 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.6360 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5539 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0525 if x3-x1<=-3.0 & x4-x2<=0.0\n",
      "   +0.5267 if c>=1.0 & x2>=2.0 & x3-x1>=-2.0\n",
      "   -0.5941 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.5246 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "init state [ 1  1 -1  0  0]\n",
      "(16,) (16,)\n",
      "init state [1 0 2 2 0]\n",
      "(34,) (18,)\n",
      "init state [0 1 2 2 0]\n",
      "(44,) (10,)\n",
      "init state [ 1  0 -1  3  0]\n",
      "(52,) (8,)\n",
      "init state [ 1  2 -1 -1  0]\n",
      "(76,) (24,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(102,) (26,)\n",
      "init state [ 0  3  1 -1  0]\n",
      "(111,) (9,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(131,) (20,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(168,) (37,)\n",
      "init state [ 3  0 -2  3  0]\n",
      "(190,) (22,)\n",
      "============ 43 ===========\n",
      "Run episode 43 with rewards 20, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.1588 if c>=1.0 & x2>=3.0\n",
      "   -0.2919 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.4785 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.5975 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0330 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0315 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1286 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0414 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.0324 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0000 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.4835 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.3458 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.2721 if x1>=3.0 & x4-x2<=-2.0\n",
      "   +0.3988 if c<=0.0 & x2<=1.0 & x3-x1<=-2.0\n",
      "   +0.8380 if x3-x1>=3.0\n",
      "   -0.7354 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.1829 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0098 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2639 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1476 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1599 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.7969 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1131 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.2512 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4242 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2159 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0719 if x1>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0030 if x4-x2>=2.0\n",
      "   +0.1544 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.2793 if c<=0.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.0158 if x3-x1>=3.0\n",
      "   +0.5341 if x2>=1.0 & x3-x1>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.1897 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.2878 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1073 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.1088 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.0717 if x4-x2>=-2.0\n",
      "   -0.0405 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   -0.4424 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4407 if x2<=1.0\n",
      "   -0.7021 if x4-x2>=0.0\n",
      "   +0.6304 if x4-x2<=-1.0\n",
      "   -0.0110 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.4206 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1405 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0358 if c<=0.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1>=3.0\n",
      "   -0.2131 if x3-x1>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.3616 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.2129 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.7942 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.0651 if x2>=3.0\n",
      "   -0.2546 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0252 if x2>=1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0962 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.9735 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2119 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.2799 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4820 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.2612 if x3-x1<=-3.0 & x4-x2<=0.0\n",
      "   +0.2029 if c>=1.0 & x2>=2.0 & x3-x1>=-2.0\n",
      "   -0.8711 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.0266 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.6262 if x1<=1.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "init state [ 1  3  0 -1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(17,) (17,)\n",
      "init state [ 3  2 -3  1  0]\n",
      "(32,) (15,)\n",
      "init state [ 3  1  0 -1  0]\n",
      "(50,) (18,)\n",
      "init state [0 2 2 0 0]\n",
      "(78,) (28,)\n",
      "init state [ 3  2 -1  1  0]\n",
      "(83,) (5,)\n",
      "init state [0 0 0 3 0]\n",
      "(91,) (8,)\n",
      "init state [ 2  1  0 -1  0]\n",
      "(102,) (11,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(115,) (13,)\n",
      "init state [ 0  3  3 -2  0]\n",
      "(127,) (12,)\n",
      "init state [0 2 2 1 0]\n",
      "(131,) (4,)\n",
      "============ 44 ===========\n",
      "Run episode 44 with rewards 38, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.3314 if c>=1.0 & x2>=3.0\n",
      "   +0.0028 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2389 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.3669 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2129 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0535 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0903 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.4757 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1447 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.2008 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.1625 if x1>=3.0 & x4-x2<=-2.0\n",
      "   +0.2135 if c<=0.0 & x2<=1.0 & x3-x1<=-2.0\n",
      "   +0.3620 if x3-x1>=3.0\n",
      "   -0.5131 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.1833 if x3-x1<=-3.0\n",
      "----------------- 1 --------------\n",
      "   +0.2829 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0286 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.3841 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.6821 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.3700 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.6360 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.2335 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1033 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.6633 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1664 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0000 if x1>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.4013 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.1706 if c<=0.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.0086 if x3-x1>=3.0\n",
      "   +0.4126 if x2>=1.0 & x3-x1>=2.0\n",
      "   -1.1118 if x2<=2.0 & x3-x1<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.4061 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.8439 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1303 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.1741 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.1663 if x4-x2>=-2.0\n",
      "   +0.0000 if c<=0.0 & x2>=2.0 & x3-x1<=-2.0 & x4-x2<=0.0\n",
      "   +0.4593 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1644 if x2<=1.0\n",
      "   -0.1217 if x4-x2>=0.0\n",
      "   +0.0003 if x4-x2<=-1.0\n",
      "   -0.0967 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.4021 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2352 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0273 if c<=0.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.0928 if x3-x1>=-2.0\n",
      "   -0.7453 if x1<=2.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   -0.3157 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1613 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.9178 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.1064 if x2>=3.0\n",
      "   -0.1499 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0314 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.2588 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0573 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.1025 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5735 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0000 if x3-x1<=-3.0 & x4-x2<=0.0\n",
      "   +0.1157 if c>=1.0 & x2>=2.0 & x3-x1>=-2.0\n",
      "   -0.7412 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0041 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.4341 if x1<=1.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.8715 if x3-x1>=-1.0 & x4-x2>=1.0\n",
      "init state [0 1 3 1 0]\n",
      "(15,) (15,)\n",
      "init state [0 0 0 3 0]\n",
      "(26,) (11,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(36,) (10,)\n",
      "init state [ 2  1 -2  2  0]\n",
      "(48,) (12,)\n",
      "init state [0 0 2 2 0]\n",
      "(68,) (20,)\n",
      "init state [0 0 0 2 0]\n",
      "(75,) (7,)\n",
      "init state [1 1 0 1 0]\n",
      "(91,) (16,)\n",
      "init state [2 2 1 0 0]\n",
      "(93,) (2,)\n",
      "init state [ 3  1 -3  2  0]\n",
      "(104,) (11,)\n",
      "init state [ 3  2 -1  1  0]\n",
      "(108,) (4,)\n",
      "============ 45 ===========\n",
      "Run episode 45 with rewards 38, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.4075 if c>=1.0 & x2>=3.0\n",
      "   +0.3398 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.5118 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.0271 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1427 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.2831 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1934 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0847 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.3661 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   -0.0031 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0000 if x1>=3.0 & x4-x2<=-2.0\n",
      "   +0.4828 if c<=0.0 & x2<=1.0 & x3-x1<=-2.0\n",
      "   -0.0680 if x3-x1>=3.0\n",
      "   -0.5983 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.1816 if x3-x1<=-3.0\n",
      "   +0.3967 if c<=0.0 & x1>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.1279 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0185 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.4051 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4067 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1415 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -1.0523 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.2880 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.2493 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5830 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0493 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.1285 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.1716 if c<=0.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.1595 if x3-x1>=3.0\n",
      "   +0.0789 if x2>=1.0 & x3-x1>=2.0\n",
      "   -0.8588 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.3702 if x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.2578 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.5245 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2950 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.1731 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.2609 if x4-x2>=-2.0\n",
      "   +0.0808 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0315 if x2<=1.0\n",
      "   -0.2592 if x4-x2>=0.0\n",
      "   -0.0017 if x4-x2<=-1.0\n",
      "   -0.0605 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.1585 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1530 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4068 if c<=0.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.2143 if x3-x1>=-2.0\n",
      "   +0.1013 if x1<=2.0 & x4-x2>=-1.0\n",
      "   -0.3072 if x3-x1<=-1.0\n",
      "----------------- 3 --------------\n",
      "   -0.3098 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.1203 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.3097 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.0881 if x2>=3.0\n",
      "   +0.0000 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.2649 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0933 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3598 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.0551 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3143 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.3539 if c>=1.0 & x2>=2.0 & x3-x1>=-2.0\n",
      "   -0.3162 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1759 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0730 if x1<=1.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.7328 if x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.4917 if c>=1.0 & x2<=1.0\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(55,) (55,)\n",
      "init state [3 0 0 1 0]\n",
      "(65,) (10,)\n",
      "init state [ 1  0 -1  2  0]\n",
      "(77,) (12,)\n",
      "init state [ 3  0 -2  0  0]\n",
      "(118,) (41,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(146,) (28,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(176,) (30,)\n",
      "init state [ 3  2 -1  1  0]\n",
      "(179,) (3,)\n",
      "init state [ 3  1 -2  1  0]\n",
      "(194,) (15,)\n",
      "init state [2 2 0 1 0]\n",
      "(204,) (10,)\n",
      "init state [1 2 2 0 0]\n",
      "(210,) (6,)\n",
      "============ 46 ===========\n",
      "Run episode 46 with rewards 36, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.3084 if c>=1.0 & x2>=3.0\n",
      "   -0.0791 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.7962 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.2232 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3163 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.4781 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3340 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.1390 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2035 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.3481 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1357 if c<=0.0 & x2<=1.0 & x3-x1<=-2.0\n",
      "   -0.0048 if x3-x1>=3.0\n",
      "   -0.7538 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.0247 if x3-x1<=-3.0\n",
      "   +0.1052 if c<=0.0 & x1>=3.0\n",
      "   +0.6894 if x1>=1.0 & x2>=2.0 & x4-x2>=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   +0.4702 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.5550 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3174 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.2813 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.7466 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.0609 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0965 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2468 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.4910 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.6659 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.0877 if c<=0.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0156 if x3-x1>=3.0\n",
      "   +0.8409 if x2>=1.0 & x3-x1>=2.0\n",
      "   -0.6989 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.0728 if x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.5101 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "----------------- 2 --------------\n",
      "   -0.3993 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.9465 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0385 if x1>=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   -0.4371 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.0527 if x4-x2>=-2.0\n",
      "   -0.2484 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   +0.4116 if x2<=1.0\n",
      "   -0.8458 if x4-x2>=0.0\n",
      "   +0.0968 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.2901 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2059 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1505 if c<=0.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.2040 if x3-x1>=-2.0\n",
      "   -0.0744 if x1<=2.0 & x4-x2>=-1.0\n",
      "   -0.1243 if x3-x1<=-1.0\n",
      "   +0.6447 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.1760 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1160 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0839 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.3882 if x2>=3.0\n",
      "   -0.3911 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.2524 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2922 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.0534 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3776 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1020 if c>=1.0 & x2>=2.0 & x3-x1>=-2.0\n",
      "   +0.2516 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.0835 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.2485 if x1<=1.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.0099 if x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.2532 if c>=1.0 & x2<=1.0\n",
      "   +0.6024 if x1<=1.0 & x2<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "init state [ 1  2  2 -1  0]\n",
      "(11,) (11,)\n",
      "init state [1 0 0 1 0]\n",
      "(39,) (28,)\n",
      "init state [ 2  1 -1  1  0]\n",
      "(44,) (5,)\n",
      "init state [2 2 0 1 0]\n",
      "(53,) (9,)\n",
      "init state [0 1 2 2 0]\n",
      "(64,) (11,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(84,) (20,)\n",
      "init state [ 1  2  2 -2  0]\n",
      "(96,) (12,)\n",
      "init state [ 3  0 -2  1  0]\n",
      "(113,) (17,)\n",
      "init state [ 3  0 -1  0  0]\n",
      "(120,) (7,)\n",
      "init state [0 1 2 1 0]\n",
      "(129,) (9,)\n",
      "============ 47 ===========\n",
      "Run episode 47 with rewards 33, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.0235 if c>=1.0 & x2>=3.0\n",
      "   +0.2082 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.5359 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.0042 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4920 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1436 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1302 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.2504 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.5546 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.2742 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1667 if c<=0.0 & x2<=1.0 & x3-x1<=-2.0\n",
      "   -0.5581 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x3-x1<=-3.0\n",
      "   -0.0098 if c<=0.0 & x1>=3.0\n",
      "   +0.5184 if x1>=1.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.3017 if c<=0.0 & x1>=3.0 & x3-x1>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.4559 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.4120 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.1157 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.1966 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5977 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.2211 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1567 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2496 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1713 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.2558 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.1688 if c<=0.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.7343 if x2>=1.0 & x3-x1>=2.0\n",
      "   -0.4324 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.0290 if x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.0338 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.3519 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "----------------- 2 --------------\n",
      "   -0.4146 if x1<=2.0 & x4-x2>=1.0\n",
      "   +1.2647 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.5147 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.0511 if x4-x2>=-2.0\n",
      "   -0.1674 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0486 if x2<=1.0\n",
      "   -0.9078 if x4-x2>=0.0\n",
      "   -0.0237 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.4682 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3307 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2327 if c<=0.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.1393 if x3-x1>=-2.0\n",
      "   -0.0154 if x1<=2.0 & x4-x2>=-1.0\n",
      "   -0.0151 if x3-x1<=-1.0\n",
      "   +0.2259 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.1468 if x1>=3.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   -0.3340 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0396 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2301 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.5830 if x2>=3.0\n",
      "   -0.2933 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.2170 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2928 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.0805 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.7321 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1992 if c>=1.0 & x2>=2.0 & x3-x1>=-2.0\n",
      "   +0.1279 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1994 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.4288 if x1<=1.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.3960 if c>=1.0 & x2<=1.0\n",
      "   +0.3369 if x1<=1.0 & x2<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.6064 if x1<=2.0 & x1>=2.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "init state [ 1  1  2 -1  0]\n",
      "(18,) (18,)\n",
      "init state [ 3  0 -2  0  0]\n",
      "(63,) (45,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(81,) (18,)\n",
      "init state [1 1 0 1 0]\n",
      "(85,) (4,)\n",
      "init state [ 1  3  1 -3  0]\n",
      "(93,) (8,)\n",
      "init state [ 0  3  3 -2  0]\n",
      "(110,) (17,)\n",
      "init state [0 0 2 2 0]\n",
      "(116,) (6,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(138,) (22,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(168,) (30,)\n",
      "init state [0 2 1 0 0]\n",
      "(172,) (4,)\n",
      "============ 48 ===========\n",
      "Run episode 48 with rewards 38, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.0987 if c>=1.0 & x2>=3.0\n",
      "   +0.1609 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1051 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.0983 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3308 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1044 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0138 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.1101 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4989 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.2781 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.2569 if c<=0.0 & x2<=1.0 & x3-x1<=-2.0\n",
      "   -0.6100 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.4457 if c<=0.0 & x1>=3.0\n",
      "   +0.1873 if x1>=1.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   +0.1725 if c<=0.0 & x1>=3.0 & x3-x1>=0.0\n",
      "   +0.4944 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.2016 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.6062 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1394 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.1555 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.7129 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.5385 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.7196 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2366 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3337 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.1102 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.0213 if c<=0.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.1362 if x2>=1.0 & x3-x1>=2.0\n",
      "   -0.8697 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.0217 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.0488 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.3364 if x3-x1>=2.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.1655 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.6662 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.5224 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.0006 if x4-x2>=-2.0\n",
      "   -0.3907 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0527 if x2<=1.0\n",
      "   -0.6896 if x4-x2>=0.0\n",
      "   -0.0759 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.4644 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4166 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1269 if c<=0.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   +0.0215 if x3-x1>=-2.0\n",
      "   +0.0538 if x1<=2.0 & x4-x2>=-1.0\n",
      "   +0.5034 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.1522 if x1>=3.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   -0.2603 if c<=0.0 & x1>=2.0 & x1>=3.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=-2.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.3813 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1007 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.0895 if x2>=3.0\n",
      "   -0.0791 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.7295 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1519 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.1893 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5170 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.3117 if c>=1.0 & x2>=2.0 & x3-x1>=-2.0\n",
      "   +0.1092 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.2090 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.0111 if x1<=1.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.2444 if c>=1.0 & x2<=1.0\n",
      "   +0.2874 if x1<=1.0 & x2<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0015 if x1<=2.0 & x1>=2.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.7310 if x2<=2.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "init state [0 1 1 0 0]\n",
      "(8,) (8,)\n",
      "init state [ 2  1 -2  0  0]\n",
      "(40,) (32,)\n",
      "init state [0 1 0 1 0]\n",
      "(47,) (7,)\n",
      "init state [ 3  1 -2  1  0]\n",
      "(60,) (13,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(71,) (11,)\n",
      "init state [ 0  3  2 -3  0]\n",
      "(92,) (21,)\n",
      "init state [0 0 2 1 0]\n",
      "(107,) (15,)\n",
      "init state [0 0 2 3 0]\n",
      "(127,) (20,)\n",
      "init state [2 2 1 0 0]\n",
      "(129,) (2,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(136,) (7,)\n",
      "============ 49 ===========\n",
      "Run episode 49 with rewards 35, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.1504 if c>=1.0 & x2>=3.0\n",
      "   +0.7996 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1424 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.0106 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0942 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1904 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0743 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.6019 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.1699 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.7261 if c<=0.0 & x2<=1.0 & x3-x1<=-2.0\n",
      "   -0.6650 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.1855 if c<=0.0 & x1>=3.0\n",
      "   +0.4250 if x1>=1.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1>=3.0 & x3-x1>=0.0\n",
      "   +0.0384 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.3011 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.8701 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.5539 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0410 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.2490 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.8740 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1192 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.7991 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3621 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3124 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.1331 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.0987 if x2>=1.0 & x3-x1>=2.0\n",
      "   -0.7711 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.2976 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.0490 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   -0.0872 if x3-x1>=2.0 & x4-x2>=2.0\n",
      "   +0.8319 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.6080 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.6203 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3089 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.4049 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4751 if x2<=1.0\n",
      "   -0.6620 if x4-x2>=0.0\n",
      "   -0.0736 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.0083 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2075 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1518 if c<=0.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   +0.0757 if x3-x1>=-2.0\n",
      "   +0.0540 if x1<=2.0 & x4-x2>=-1.0\n",
      "   +0.0617 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.1199 if x1>=3.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x1>=3.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2<=-2.0\n",
      "   -0.6457 if c>=1.0 & x2>=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.7818 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.3553 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.0435 if x2>=3.0\n",
      "   -0.2399 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.1653 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1488 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.0989 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5750 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1196 if c>=1.0 & x2>=2.0 & x3-x1>=-2.0\n",
      "   -0.4414 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.2444 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0644 if x1<=1.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.4617 if c>=1.0 & x2<=1.0\n",
      "   +0.1371 if x1<=1.0 & x2<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.4031 if x2<=2.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.6527 if x2<=2.0 & x3-x1>=2.0\n",
      "init state [ 1  3  1 -2  0]\n",
      "(20,) (20,)\n",
      "init state [ 2  3  1 -3  0]\n",
      "(52,) (32,)\n",
      "init state [0 0 0 3 0]\n",
      "(64,) (12,)\n",
      "init state [3 0 0 2 0]\n",
      "(67,) (3,)\n",
      "init state [ 1  2 -1  1  0]\n",
      "(82,) (15,)\n",
      "init state [0 1 3 1 0]\n",
      "(101,) (19,)\n",
      "init state [1 2 1 0 0]\n",
      "(106,) (5,)\n",
      "init state [ 3  1 -1 -1  0]\n",
      "(131,) (25,)\n",
      "init state [1 1 1 1 0]\n",
      "(151,) (20,)\n",
      "init state [ 2  3 -1  0  0]\n",
      "(168,) (17,)\n",
      "============ 50 ===========\n",
      "Run episode 50 with rewards 25, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.1382 if c>=1.0 & x2>=3.0\n",
      "   +0.1252 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0504 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.3003 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1664 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0736 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5193 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.3328 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.0242 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0000 if c<=0.0 & x2<=1.0 & x3-x1<=-2.0\n",
      "   -0.5563 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.2635 if c<=0.0 & x1>=3.0\n",
      "   +0.0591 if x1>=1.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   +0.3154 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0163 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4772 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.3138 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.7122 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.2778 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.8411 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1608 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3292 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2981 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0912 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.2279 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.3049 if x2>=1.0 & x3-x1>=2.0\n",
      "   -0.5317 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3900 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.0899 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2>=2.0\n",
      "   +0.2120 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   +0.4397 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.1928 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.1045 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1754 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.3522 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1193 if x2<=1.0\n",
      "   -0.6339 if x4-x2>=0.0\n",
      "   -0.1191 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.2509 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2098 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0285 if c<=0.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.0890 if x3-x1>=-2.0\n",
      "   +0.1615 if x1<=2.0 & x4-x2>=-1.0\n",
      "   +0.0688 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.2026 if x1>=3.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   -0.4387 if c>=1.0 & x2>=2.0\n",
      "   +0.6787 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "----------------- 3 --------------\n",
      "   -0.1005 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.5233 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.0057 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.5525 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2184 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.2468 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.7523 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.2668 if c>=1.0 & x2>=2.0 & x3-x1>=-2.0\n",
      "   -0.1327 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.0997 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.3847 if x1<=1.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.0582 if c>=1.0 & x2<=1.0\n",
      "   -0.0222 if x1<=1.0 & x2<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.2896 if x2<=2.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.3950 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.7908 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "init state [ 0  2  3 -2  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(27,) (27,)\n",
      "init state [0 0 1 1 0]\n",
      "(34,) (7,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(67,) (33,)\n",
      "init state [ 3  2 -2 -2  0]\n",
      "(134,) (67,)\n",
      "init state [ 0  2  2 -1  0]\n",
      "(147,) (13,)\n",
      "init state [ 1  2 -1 -2  0]\n",
      "(190,) (43,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(215,) (25,)\n",
      "init state [ 1  3 -1 -1  0]\n",
      "(274,) (59,)\n",
      "init state [ 0  3  3 -1  0]\n",
      "(296,) (22,)\n",
      "init state [0 1 2 2 0]\n",
      "(301,) (5,)\n",
      "============ 51 ===========\n",
      "Run episode 51 with rewards 37, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.2805 if c>=1.0 & x2>=3.0\n",
      "   -0.4103 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1949 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.3098 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2443 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2488 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1357 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4260 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   -0.3823 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.5107 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.3566 if c<=0.0 & x1>=3.0\n",
      "   -0.0859 if x1>=1.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.2001 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1717 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3144 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.7383 if c<=0.0 & x1<=2.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.6440 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.3045 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3631 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.8501 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.5597 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0213 if c<=0.0 & x1<=2.0 & x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3822 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1142 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.0527 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.3034 if x2>=1.0 & x3-x1>=2.0\n",
      "   -0.8617 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.0361 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.1435 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.2719 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   +0.1633 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.6132 if x3-x1>=1.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.2057 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.2975 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.4940 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.1452 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3395 if x2<=1.0\n",
      "   -0.6265 if x4-x2>=0.0\n",
      "   +0.3304 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.4269 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2270 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1014 if x3-x1>=-2.0\n",
      "   -0.2382 if x1<=2.0 & x4-x2>=-1.0\n",
      "   +0.2849 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.0232 if x1>=3.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   -0.5185 if c>=1.0 & x2>=2.0\n",
      "   +0.0749 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.3675 if x1<=0.0 & x2<=0.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.0078 if x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.5251 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +1.0460 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.4338 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.3364 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.7489 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1602 if c>=1.0 & x2>=2.0 & x3-x1>=-2.0\n",
      "   -0.1381 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.1024 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.0609 if x1<=1.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.4055 if c>=1.0 & x2<=1.0\n",
      "   -0.1362 if x1<=1.0 & x2<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.6012 if x2<=2.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1103 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.6104 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.7015 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "init state [1 2 1 1 0]\n",
      "(11,) (11,)\n",
      "init state [ 0  2  2 -2  0]\n",
      "(47,) (36,)\n",
      "init state [0 0 0 2 0]\n",
      "(58,) (11,)\n",
      "init state [ 2  0 -1  0  0]\n",
      "(64,) (6,)\n",
      "init state [0 1 2 2 0]\n",
      "(72,) (8,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(81,) (9,)\n",
      "init state [ 2  1 -1  2  0]\n",
      "(91,) (10,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(114,) (23,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(167,) (53,)\n",
      "init state [1 1 2 0 0]\n",
      "(178,) (11,)\n",
      "============ 52 ===========\n",
      "Run episode 52 with rewards 31, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.3716 if c>=1.0 & x2>=3.0\n",
      "   -0.0669 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0328 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.2634 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.8036 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1599 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2238 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1599 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   -0.3846 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.4904 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.1168 if c<=0.0 & x1>=3.0\n",
      "   -0.2311 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.1563 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1066 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.7546 if c<=0.0 & x1<=2.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.3662 if x3-x1>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.4955 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.3243 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3659 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5593 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.6019 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.6551 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0314 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.3180 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.4237 if x2>=1.0 & x3-x1>=2.0\n",
      "   -0.6803 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.2698 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.0705 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.6803 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   +0.0342 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.3429 if x3-x1>=1.0 & x4-x2>=2.0\n",
      "   -0.6739 if c<=0.0 & x1>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.0842 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.5113 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.5220 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.1957 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0319 if x2<=1.0\n",
      "   -0.0803 if x4-x2>=0.0\n",
      "   -0.0141 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.1319 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1226 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1730 if x3-x1>=-2.0\n",
      "   -0.1986 if x1<=2.0 & x4-x2>=-1.0\n",
      "   -0.2777 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.6852 if c>=1.0 & x2>=2.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.2651 if x1<=0.0 & x2<=0.0 & x4-x2>=1.0\n",
      "   -0.1329 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.1299 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5305 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2507 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.3734 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.6231 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.2194 if c>=1.0 & x2>=2.0 & x3-x1>=-2.0\n",
      "   -0.3243 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.3221 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0739 if x1<=1.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.2863 if c>=1.0 & x2<=1.0\n",
      "   +0.0415 if x1<=1.0 & x2<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.3890 if x2<=2.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.4853 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.4378 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.3990 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.7731 if x1>=1.0 & x2<=1.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "init state [0 0 1 2 0]\n",
      "(15,) (15,)\n",
      "init state [ 3  1 -1  2  0]\n",
      "(28,) (13,)\n",
      "init state [0 3 2 0 0]\n",
      "(31,) (3,)\n",
      "init state [ 0  2  1 -2  0]\n",
      "(70,) (39,)\n",
      "init state [1 3 1 0 0]\n",
      "(73,) (3,)\n",
      "init state [ 2  3 -1 -2  0]\n",
      "(89,) (16,)\n",
      "init state [ 2  2 -2  1  0]\n",
      "(107,) (18,)\n",
      "init state [ 0  2  2 -2  0]\n",
      "(120,) (13,)\n",
      "init state [ 2  2 -2  0  0]\n",
      "(246,) (126,)\n",
      "init state [1 0 0 2 0]\n",
      "(258,) (12,)\n",
      "============ 53 ===========\n",
      "Run episode 53 with rewards 30, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.1285 if c>=1.0 & x2>=3.0\n",
      "   -0.0670 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1067 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3859 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0854 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1493 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0817 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.1891 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -1.0140 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.7333 if c<=0.0 & x1>=3.0\n",
      "   -0.0742 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.2224 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0007 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.8020 if c<=0.0 & x1<=2.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   +0.4100 if x2<=0.0 & x3-x1>=2.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   +0.4218 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.8030 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1997 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.9901 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.5232 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.2132 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3470 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.0208 if x2>=1.0 & x3-x1>=2.0\n",
      "   -0.3252 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.2050 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.0000 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2<=-2.0\n",
      "   +0.3092 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   -0.1787 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1683 if x3-x1>=1.0 & x4-x2>=2.0\n",
      "   -0.1099 if c<=0.0 & x1>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.6724 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.3227 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.1498 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2354 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.3096 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   +0.4197 if x2<=1.0\n",
      "   -0.4211 if x4-x2>=0.0\n",
      "   -0.0235 if x1>=3.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.3476 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1747 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3650 if x3-x1>=-2.0\n",
      "   -0.3077 if x1<=2.0 & x4-x2>=-1.0\n",
      "   -0.2298 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.3804 if c>=1.0 & x2>=2.0\n",
      "   +0.2780 if x1<=0.0 & x2<=0.0 & x4-x2>=1.0\n",
      "   +0.0821 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +1.2628 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3116 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.1899 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2828 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.2048 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2461 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0636 if c>=1.0 & x2>=2.0 & x3-x1>=-2.0\n",
      "   -0.1179 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.4458 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.1081 if x1<=1.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.1818 if c>=1.0 & x2<=1.0\n",
      "   -0.3350 if x2<=2.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.2441 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.3293 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.4042 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.1520 if x1>=1.0 & x2<=1.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.8569 if x2<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "init state [ 0  3  2 -3  0]\n",
      "(20,) (20,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(50,) (30,)\n",
      "init state [ 3  2 -3  0  0]\n",
      "(80,) (30,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(107,) (27,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(120,) (13,)\n",
      "init state [ 1  0 -1  1  0]\n",
      "(134,) (14,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(168,) (34,)\n",
      "init state [2 0 1 0 0]\n",
      "(193,) (25,)\n",
      "init state [ 2  2  0 -2  0]\n",
      "(209,) (16,)\n",
      "init state [2 1 0 2 0]\n",
      "(214,) (5,)\n",
      "============ 54 ===========\n",
      "Run episode 54 with rewards 37, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.0184 if c>=1.0 & x2>=3.0\n",
      "   -0.1195 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4273 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4932 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0750 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2793 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.3940 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   -0.1851 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.4237 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.0214 if c<=0.0 & x1>=3.0\n",
      "   -0.0000 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1072 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3844 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.3975 if c<=0.0 & x1<=2.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0293 if x2<=0.0 & x3-x1>=2.0\n",
      "   -0.5962 if c<=0.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.1560 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.5559 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3821 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.6018 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.2641 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3134 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3260 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.2018 if x2>=1.0 & x3-x1>=2.0\n",
      "   -0.7757 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.2512 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.5645 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   -0.1762 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2>=2.0\n",
      "   -0.2322 if c<=0.0 & x1>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.5772 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.0016 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.5449 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1397 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.0133 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0759 if x2<=1.0\n",
      "   -0.3048 if x4-x2>=0.0\n",
      "   -0.4829 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3056 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4028 if x3-x1>=-2.0\n",
      "   +0.1052 if x1<=2.0 & x4-x2>=-1.0\n",
      "   -0.1640 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.2885 if c>=1.0 & x2>=2.0\n",
      "   -0.1367 if x1<=0.0 & x2<=0.0 & x4-x2>=1.0\n",
      "   +0.0723 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.9499 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.1832 if x3-x1<=-3.0 & x4-x2<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3053 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.6578 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1029 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.0305 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.7762 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.3756 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1846 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.4146 if x1<=1.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.4208 if c>=1.0 & x2<=1.0\n",
      "   -0.3422 if x2<=2.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.0445 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.5047 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.0000 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.2118 if x1>=1.0 & x2<=1.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.4495 if x2<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.6715 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "init state [ 1  1 -1  0  0]\n",
      "(39,) (39,)\n",
      "init state [ 2  2 -2  0  0]\n",
      "(66,) (27,)\n",
      "init state [1 2 1 0 0]\n",
      "(79,) (13,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(92,) (13,)\n",
      "init state [3 0 0 2 0]\n",
      "(99,) (7,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(104,) (5,)\n",
      "init state [ 1  2 -1 -2  0]\n",
      "(130,) (26,)\n",
      "init state [0 1 1 0 0]\n",
      "(141,) (11,)\n",
      "init state [ 1  2  2 -1  0]\n",
      "(165,) (24,)\n",
      "init state [ 2  3  1 -1  0]\n",
      "(168,) (3,)\n",
      "============ 55 ===========\n",
      "Run episode 55 with rewards 39, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.3036 if c>=1.0 & x2>=3.0\n",
      "   -0.0677 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2431 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4080 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.2129 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3841 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0896 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.6497 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0939 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.5860 if c<=0.0 & x1>=3.0\n",
      "   -0.1405 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2688 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.2369 if c<=0.0 & x1<=2.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0000 if x2<=0.0 & x3-x1>=2.0\n",
      "   -0.4360 if c<=0.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.5290 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.2970 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.7225 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.7119 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.9471 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.0041 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1545 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1792 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.0041 if x2>=1.0 & x3-x1>=2.0\n",
      "   -0.9157 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.5258 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.2510 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   +0.0288 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4693 if c<=0.0 & x1>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.2222 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2651 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0462 if x1>=1.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.4962 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1153 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.1211 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1468 if x2<=1.0\n",
      "   -0.5414 if x4-x2>=0.0\n",
      "   -0.2283 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2014 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0964 if x3-x1>=-2.0\n",
      "   -0.5990 if x1<=2.0 & x4-x2>=-1.0\n",
      "   -0.0618 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.2672 if c>=1.0 & x2>=2.0\n",
      "   -0.0527 if x1<=0.0 & x2<=0.0 & x4-x2>=1.0\n",
      "   +0.1469 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.6113 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.1473 if x3-x1<=-3.0 & x4-x2<=1.0\n",
      "   -0.2370 if c<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.5311 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.1344 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.4140 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.6760 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5264 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.3540 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.2899 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0229 if x1<=1.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.1595 if c>=1.0 & x2<=1.0\n",
      "   -0.1516 if x2<=2.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0271 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.1251 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.4760 if x1>=1.0 & x2<=1.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.3064 if x2<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.3349 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2753 if x3-x1<=0.0 & x3-x1>=-2.0\n",
      "init state [0 2 3 0 0]\n",
      "(13,) (13,)\n",
      "init state [ 2  3 -2 -2  0]\n",
      "(40,) (27,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(75,) (35,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(100,) (25,)\n",
      "init state [ 3  2  0 -2  0]\n",
      "(107,) (7,)\n",
      "init state [3 1 0 1 0]\n",
      "(113,) (6,)\n",
      "init state [2 1 1 0 0]\n",
      "(118,) (5,)\n",
      "init state [1 2 0 1 0]\n",
      "(123,) (5,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(138,) (15,)\n",
      "init state [1 2 1 1 0]\n",
      "(144,) (6,)\n",
      "============ 56 ===========\n",
      "Run episode 56 with rewards 36, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.4818 if c>=1.0 & x2>=3.0\n",
      "   +0.0970 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2612 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.8399 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1127 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0863 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1609 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.3776 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0327 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.0229 if c<=0.0 & x1>=3.0\n",
      "   -0.3010 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.4131 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   -0.0952 if c<=0.0 & x1<=2.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0360 if c<=0.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.2764 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.3186 if x1>=1.0 & x3-x1>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.5149 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.7401 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4695 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.8928 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.3276 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1845 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2307 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.8748 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.1268 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.1637 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   -0.1723 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0967 if c<=0.0 & x1>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.4470 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.3561 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0084 if x1>=1.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.2593 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.7569 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1908 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.1581 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2543 if x2<=1.0\n",
      "   -0.5773 if x4-x2>=0.0\n",
      "   -0.1365 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1003 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2698 if x3-x1>=-2.0\n",
      "   -0.7833 if x1<=2.0 & x4-x2>=-1.0\n",
      "   -0.1010 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.2110 if c>=1.0 & x2>=2.0\n",
      "   +0.0528 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.4133 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.0178 if x3-x1<=-3.0 & x4-x2<=1.0\n",
      "   +0.4437 if c<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "   -0.2747 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3644 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.0375 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1620 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.1918 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.6009 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0590 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0703 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.2425 if c>=1.0 & x2<=1.0\n",
      "   -0.0153 if x2<=2.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.1226 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.5130 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1247 if x1>=1.0 & x2<=1.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.1285 if x2<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0330 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.1124 if x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2680 if x2>=3.0 & x3-x1>=2.0\n",
      "init state [ 3  0 -3  1  0]\n",
      "(26,) (26,)\n",
      "init state [ 3  2 -3  0  0]\n",
      "(44,) (18,)\n",
      "init state [1 3 1 0 0]\n",
      "(46,) (2,)\n",
      "init state [ 3  1 -1  1  0]\n",
      "(51,) (5,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(60,) (9,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(86,) (26,)\n",
      "init state [ 2  2 -1 -2  0]\n",
      "(108,) (22,)\n",
      "init state [ 2  3 -1 -1  0]\n",
      "(171,) (63,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(193,) (22,)\n",
      "init state [ 2  2 -1 -1  0]\n",
      "(212,) (19,)\n",
      "============ 57 ===========\n",
      "Run episode 57 with rewards 23, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.4568 if c>=1.0 & x2>=3.0\n",
      "   +0.2426 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2964 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5503 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0156 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0473 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2396 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.7157 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.1115 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3287 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.4150 if c<=0.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.4367 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   -0.0638 if x1>=1.0 & x3-x1>=2.0\n",
      "   -0.2305 if x1<=0.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.7659 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.3566 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.3976 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -1.0960 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1676 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0900 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1345 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.5487 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.1207 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.4058 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   +0.1308 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c<=0.0 & x1>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2476 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.5118 if c<=0.0 & x1>=3.0 & x3-x1>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.5176 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3981 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.1549 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0087 if x2<=1.0\n",
      "   -0.5352 if x4-x2>=0.0\n",
      "   -0.2627 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1730 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1376 if x3-x1>=-2.0\n",
      "   -0.2548 if x1<=2.0 & x4-x2>=-1.0\n",
      "   -0.1901 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.5415 if c>=1.0 & x2>=2.0\n",
      "   +0.0639 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.5150 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.2453 if c<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "   +0.0158 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   +0.4750 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   -0.0899 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4148 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5386 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.2193 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5656 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0715 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.2642 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.3585 if c>=1.0 & x2<=1.0\n",
      "   -0.0716 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.5507 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=1.0 & x2<=1.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0000 if x2<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0240 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0723 if x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0378 if x2>=3.0 & x3-x1>=2.0\n",
      "   -0.2831 if c<=0.0 & x2<=0.0\n",
      "init state [ 2  2  1 -1  0]\n",
      "(6,) (6,)\n",
      "init state [ 3  1 -2  1  0]\n",
      "(22,) (16,)\n",
      "init state [ 0  3  2 -3  0]\n",
      "(43,) (21,)\n",
      "init state [ 3  2  0 -2  0]\n",
      "(54,) (11,)\n",
      "init state [0 0 1 2 0]\n",
      "(64,) (10,)\n",
      "init state [ 1  0 -1  1  0]\n",
      "(75,) (11,)\n",
      "init state [ 2  1 -2  2  0]\n",
      "(92,) (17,)\n",
      "init state [ 3  2  0 -2  0]\n",
      "(107,) (15,)\n",
      "init state [0 0 1 0 0]\n",
      "(115,) (8,)\n",
      "init state [ 2  3 -2  0  0]\n",
      "(129,) (14,)\n",
      "============ 58 ===========\n",
      "Run episode 58 with rewards 28, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.1786 if c>=1.0 & x2>=3.0\n",
      "   -0.1506 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.6305 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.6300 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0125 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3385 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2932 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.3190 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.2396 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.0947 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2203 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   -0.2283 if c<=0.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.0975 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.0000 if x1>=1.0 & x3-x1>=2.0\n",
      "   -0.4635 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.3088 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.6036 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.4290 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.2061 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4039 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1109 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0407 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.4780 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.4203 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.2377 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.1827 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   +0.2721 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.3307 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0792 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1537 if c<=0.0 & x1>=3.0 & x3-x1>=-2.0\n",
      "   +0.3161 if x2>=2.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   +1.0588 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.4944 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.2343 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.6589 if x4-x2>=0.0\n",
      "   -0.2710 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0124 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2537 if x3-x1>=-2.0\n",
      "   -0.2801 if x1<=2.0 & x4-x2>=-1.0\n",
      "   -0.0375 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.3675 if c>=1.0 & x2>=2.0\n",
      "   -0.0351 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.6071 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.3497 if c<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "   -0.0372 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   +0.0000 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.4083 if c<=0.0 & x1<=2.0 & x1>=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "----------------- 3 --------------\n",
      "   -0.0250 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3726 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4799 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.1480 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5820 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1359 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.2139 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.4819 if c>=1.0 & x2<=1.0\n",
      "   -0.0971 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.0624 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.2049 if x2<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.1738 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.1805 if x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0028 if x2>=3.0 & x3-x1>=2.0\n",
      "   +0.2331 if c<=0.0 & x2<=0.0\n",
      "   +0.3725 if x4-x2>=2.0\n",
      "init state [0 0 0 1 0]\n",
      "(33,) (33,)\n",
      "init state [0 0 2 3 0]\n",
      "(56,) (23,)\n",
      "init state [ 2  2 -2  1  0]\n",
      "(72,) (16,)\n",
      "init state [1 3 1 0 0]\n",
      "(79,) (7,)\n",
      "init state [ 1  1  1 -1  0]\n",
      "(93,) (14,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(103,) (10,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(121,) (18,)\n",
      "init state [ 1  3  1 -2  0]\n",
      "(142,) (21,)\n",
      "init state [ 1  3  0 -3  0]\n",
      "(152,) (10,)\n",
      "init state [2 2 1 0 0]\n",
      "(180,) (28,)\n",
      "============ 59 ===========\n",
      "Run episode 59 with rewards 14, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   +0.0685 if c>=1.0 & x2>=3.0\n",
      "   -0.0354 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.6142 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1273 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0515 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1480 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.5603 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.7896 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.6039 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.1099 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0362 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.0104 if c<=0.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.0464 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   -0.2387 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.4451 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "   +0.5559 if c<=0.0 & x1<=0.0 & x2<=1.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.7456 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.2898 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0302 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2815 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1330 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0889 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3802 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.3286 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.5562 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.1503 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   -0.0242 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2471 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2769 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0857 if c<=0.0 & x1>=3.0 & x3-x1>=-2.0\n",
      "   +0.4137 if x2>=2.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.5991 if x2>=2.0 & x3-x1<=-2.0 & x3-x1<=1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.7980 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3026 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.2199 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.7487 if x4-x2>=0.0\n",
      "   -0.3256 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1823 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0608 if x3-x1>=-2.0\n",
      "   -0.2332 if x1<=2.0 & x4-x2>=-1.0\n",
      "   -0.2167 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.5685 if c>=1.0 & x2>=2.0\n",
      "   -0.1210 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.4811 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.4996 if c<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "   +0.2151 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   +0.2108 if c<=0.0 & x1<=2.0 & x1>=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.8840 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.0440 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.0653 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0580 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.1958 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3878 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.4180 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0781 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.4353 if c>=1.0 & x2<=1.0\n",
      "   +0.3952 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.0744 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.2397 if x2<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0057 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0103 if x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0316 if c<=0.0 & x2<=0.0\n",
      "   -0.0046 if x4-x2>=2.0\n",
      "   -0.9345 if x1<=0.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "init state [ 1  1 -1 -1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(21,) (21,)\n",
      "init state [1 2 0 1 0]\n",
      "(27,) (6,)\n",
      "init state [ 2  2  0 -1  0]\n",
      "(41,) (14,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(63,) (22,)\n",
      "init state [ 2  0 -2  0  0]\n",
      "(139,) (76,)\n",
      "init state [ 0  3  2 -3  0]\n",
      "(168,) (29,)\n",
      "init state [0 2 3 0 0]\n",
      "(191,) (23,)\n",
      "init state [1 1 1 2 0]\n",
      "(214,) (23,)\n",
      "init state [ 2  0 -2  1  0]\n",
      "(253,) (39,)\n",
      "init state [ 3  0 -1  0  0]\n",
      "(262,) (9,)\n",
      "============ 60 ===========\n",
      "Run episode 60 with rewards 33, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.3605 if c>=1.0 & x2>=3.0\n",
      "   -0.0793 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.9017 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3678 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.2239 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5942 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.7469 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.2412 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1636 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.2433 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3728 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.2317 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   -0.1012 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1229 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "   -0.0583 if c<=0.0 & x1<=0.0 & x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2413 if x1<=0.0 & x2>=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.5325 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.1942 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3554 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0891 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.3635 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3310 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3042 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.3890 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.5043 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.1621 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   -0.4771 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.3103 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.1048 if c<=0.0 & x1>=3.0 & x3-x1>=-2.0\n",
      "   -0.0248 if x2>=2.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x2>=2.0 & x3-x1<=-2.0 & x3-x1<=1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.4138 if x2>=1.0 & x3-x1>=3.0\n",
      "----------------- 2 --------------\n",
      "   +0.8297 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3048 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.1607 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.9399 if x4-x2>=0.0\n",
      "   -0.6087 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0558 if c>=1.0 & x2>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1232 if x1<=2.0 & x4-x2>=-1.0\n",
      "   -0.1257 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.3473 if c>=1.0 & x2>=2.0\n",
      "   -0.2462 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.1448 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.2163 if c<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "   +0.1216 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   +0.2160 if c<=0.0 & x1<=2.0 & x1>=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.6061 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.7089 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.6302 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.1336 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0844 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.1201 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3132 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.4716 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.0413 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.2969 if c>=1.0 & x2<=1.0\n",
      "   -0.1147 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.2038 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1148 if x2<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0752 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1930 if x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2479 if c<=0.0 & x2<=0.0\n",
      "   -0.0452 if x1<=0.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.5770 if x1<=0.0 & x3-x1<=2.0 & x4-x2>=1.0\n",
      "init state [ 0  1  1 -1  0]\n",
      "(12,) (12,)\n",
      "init state [1 0 1 2 0]\n",
      "(28,) (16,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(48,) (20,)\n",
      "init state [2 1 1 1 0]\n",
      "(100,) (52,)\n",
      "init state [ 1  3  0 -2  0]\n",
      "(116,) (16,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(140,) (24,)\n",
      "init state [ 1  0 -1  0  0]\n",
      "(152,) (12,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(192,) (40,)\n",
      "init state [ 2  2 -2  0  0]\n",
      "(208,) (16,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(230,) (22,)\n",
      "============ 61 ===========\n",
      "Run episode 61 with rewards 20, accuracy 0.1\n",
      "----------------- 0 --------------\n",
      "   -0.3361 if c>=1.0 & x2>=3.0\n",
      "   -0.2983 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.6694 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1966 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.2148 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3689 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.3807 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.2824 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.1196 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.2491 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4647 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   -0.0953 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.1747 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0940 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "   +0.0000 if x1<=0.0 & x2>=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.4154 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.4713 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1607 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.1416 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0777 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.0934 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.4530 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2177 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.2918 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.3267 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.4088 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   +0.2199 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.4151 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0592 if c<=0.0 & x1>=3.0 & x3-x1>=-2.0\n",
      "   -0.1210 if x2>=2.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.2658 if x2>=1.0 & x3-x1>=3.0\n",
      "   +0.7396 if x3-x1>=0.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   +1.0214 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3740 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.0691 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.8500 if x4-x2>=0.0\n",
      "   -0.5835 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1982 if x1<=2.0 & x4-x2>=-1.0\n",
      "   -0.1116 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.5028 if c>=1.0 & x2>=2.0\n",
      "   -0.3855 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.5862 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.2180 if c<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "   -0.0278 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.1981 if c<=0.0 & x1<=2.0 & x1>=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.1603 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.3789 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1642 if c<=0.0 & x1>=2.0 & x2<=1.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4025 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4789 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.3501 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.2337 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5574 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1372 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.0758 if c>=1.0 & x2<=1.0\n",
      "   -0.2646 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.2727 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.5794 if x2<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0731 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0890 if x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.3777 if c<=0.0 & x2<=0.0\n",
      "   -0.3660 if x1<=0.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0162 if x1<=0.0 & x3-x1<=2.0 & x4-x2>=1.0\n",
      "   +0.6034 if x1<=2.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "init state [0 2 0 1 0]\n",
      "(12,) (12,)\n",
      "init state [ 2  2 -1 -2  0]\n",
      "(42,) (30,)\n",
      "init state [ 3  1  0 -1  0]\n",
      "(47,) (5,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(96,) (49,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(129,) (33,)\n",
      "init state [ 1  0 -1  0  0]\n",
      "(166,) (37,)\n",
      "init state [ 1  1 -1  1  0]\n",
      "(181,) (15,)\n",
      "init state [2 0 1 0 0]\n",
      "(194,) (13,)\n",
      "init state [0 0 2 0 0]\n",
      "(223,) (29,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(250,) (27,)\n",
      "============ 62 ===========\n",
      "Run episode 62 with rewards 15, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.5193 if c>=1.0 & x2>=3.0\n",
      "   +0.0791 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3797 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4670 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.2181 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0365 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2247 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   -0.0151 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1647 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.2368 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   -0.0769 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1336 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "   +0.0000 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.6095 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   +0.6538 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.3368 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0981 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.1850 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.0285 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1615 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0793 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.1829 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.1777 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.0754 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.4376 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x2>=2.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0447 if x2>=1.0 & x3-x1>=3.0\n",
      "   +0.1939 if x3-x1>=0.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.7449 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "----------------- 2 --------------\n",
      "   +1.3499 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3288 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.1694 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4885 if x4-x2>=0.0\n",
      "   -0.2420 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0455 if x1<=2.0 & x4-x2>=-1.0\n",
      "   -0.0558 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.5394 if c>=1.0 & x2>=2.0\n",
      "   -0.4424 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.4847 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.3912 if c<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "   +0.1587 if c<=0.0 & x1<=2.0 & x1>=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.0455 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.1782 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1683 if c<=0.0 & x1>=2.0 & x2<=1.0 & x4-x2<=-1.0\n",
      "   -0.4743 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.7143 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.1226 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2030 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.1139 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5814 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1000 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.8424 if c>=1.0 & x2<=1.0\n",
      "   -0.1240 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.2778 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.0000 if x2<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2470 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1308 if x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1732 if c<=0.0 & x2<=0.0\n",
      "   -0.0117 if x1<=0.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0481 if x1<=2.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   +0.2044 if x2>=2.0 & x3-x1<=1.0\n",
      "init state [1 0 1 3 0]\n",
      "(36,) (36,)\n",
      "init state [ 3  0 -2  1  0]\n",
      "(60,) (24,)\n",
      "init state [ 3  0 -2  2  0]\n",
      "(71,) (11,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(85,) (14,)\n",
      "init state [ 3  1 -2 -1  0]\n",
      "(108,) (23,)\n",
      "init state [1 0 0 2 0]\n",
      "(113,) (5,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(151,) (38,)\n",
      "init state [0 0 0 3 0]\n",
      "(174,) (23,)\n",
      "init state [ 1  3  1 -3  0]\n",
      "(195,) (21,)\n",
      "init state [ 3  2 -1  0  0]\n",
      "(200,) (5,)\n",
      "============ 63 ===========\n",
      "Run episode 63 with rewards 37, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.6045 if c>=1.0 & x2>=3.0\n",
      "   -0.2635 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2068 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2002 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1560 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1205 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2785 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.5359 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0987 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.1609 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.0681 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.0772 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1270 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "   -0.2259 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.3179 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.6401 if c<=0.0 & x2>=2.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.8640 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.3564 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.2806 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2212 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.0102 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1593 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0079 if x1<=1.0 & x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.2327 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.1924 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.2246 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   +0.1572 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2030 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0446 if x2>=1.0 & x3-x1>=3.0\n",
      "   +0.0562 if x3-x1>=0.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2122 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.4943 if x2<=2.0 & x4-x2<=1.0\n",
      "----------------- 2 --------------\n",
      "   +1.1534 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3790 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.0606 if c<=0.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.8774 if x4-x2>=0.0\n",
      "   -0.5028 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2497 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.4657 if c>=1.0 & x2>=2.0\n",
      "   -0.3921 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.3809 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.3160 if c<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "   -0.1463 if c<=0.0 & x1<=2.0 & x1>=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.2210 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.2286 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1810 if c<=0.0 & x1>=2.0 & x2<=1.0 & x4-x2<=-1.0\n",
      "   +0.3097 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1427 if c<=0.0 & x1<=1.0 & x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.2523 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4219 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0649 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.0044 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4071 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1069 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.3655 if c>=1.0 & x2<=1.0\n",
      "   -0.0854 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.0267 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.1293 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.3974 if x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0506 if c<=0.0 & x2<=0.0\n",
      "   -0.0250 if x1<=0.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0800 if x1<=2.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.2868 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.5066 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "init state [1 0 2 1 0]\n",
      "(8,) (8,)\n",
      "init state [0 1 0 1 0]\n",
      "(24,) (16,)\n",
      "init state [ 0  3  2 -2  0]\n",
      "(39,) (15,)\n",
      "init state [ 2  3  1 -3  0]\n",
      "(49,) (10,)\n",
      "init state [ 0  3  0 -1  0]\n",
      "(65,) (16,)\n",
      "init state [ 3  2 -2 -1  0]\n",
      "(97,) (32,)\n",
      "init state [ 2  2 -2  0  0]\n",
      "(122,) (25,)\n",
      "init state [3 0 0 2 0]\n",
      "(131,) (9,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(144,) (13,)\n",
      "init state [0 0 1 0 0]\n",
      "(157,) (13,)\n",
      "============ 64 ===========\n",
      "Run episode 64 with rewards 29, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.5940 if c>=1.0 & x2>=3.0\n",
      "   +0.0976 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1811 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5198 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1494 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0252 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.5768 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.7833 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.3234 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.0925 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.2615 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2499 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "   -0.0761 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.4741 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.0000 if c<=0.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.9896 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.5490 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.2698 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.2161 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0940 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.6656 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1294 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3044 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3261 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.0770 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.3007 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1>=3.0\n",
      "   +0.0000 if x3-x1>=0.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1178 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.4471 if x2<=2.0 & x4-x2<=1.0\n",
      "   +0.3937 if x2<=2.0 & x3-x1>=2.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.8773 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1500 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.6966 if x4-x2>=0.0\n",
      "   -0.4948 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2024 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.3781 if c>=1.0 & x2>=2.0\n",
      "   -0.2642 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.3583 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.2249 if c<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "   -0.1048 if c<=0.0 & x1<=2.0 & x1>=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.2471 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.4233 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.1190 if c<=0.0 & x1>=2.0 & x2<=1.0 & x4-x2<=-1.0\n",
      "   +0.0000 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2049 if c<=0.0 & x1<=1.0 & x4-x2<=-2.0\n",
      "   +0.4096 if x1>=2.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.2462 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.1071 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2151 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.4845 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0749 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.4394 if c>=1.0 & x2<=1.0\n",
      "   -0.2105 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.1187 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.0441 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.4735 if x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.2325 if c<=0.0 & x2<=0.0\n",
      "   -0.1323 if x1<=0.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0037 if x1<=2.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.1406 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.3829 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4288 if x4-x2>=2.0\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(11,) (11,)\n",
      "init state [ 3  1 -2  1  0]\n",
      "(56,) (45,)\n",
      "init state [ 3  2  0 -2  0]\n",
      "(65,) (9,)\n",
      "init state [ 2  3 -1 -2  0]\n",
      "(82,) (17,)\n",
      "init state [0 1 2 2 0]\n",
      "(98,) (16,)\n",
      "init state [ 1  2  1 -2  0]\n",
      "(113,) (15,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(130,) (17,)\n",
      "init state [ 3  1 -1 -1  0]\n",
      "(148,) (18,)\n",
      "init state [ 2  3 -2 -2  0]\n",
      "(179,) (31,)\n",
      "init state [0 1 1 2 0]\n",
      "(204,) (25,)\n",
      "============ 65 ===========\n",
      "Run episode 65 with rewards 17, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.4011 if c>=1.0 & x2>=3.0\n",
      "   +0.2328 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3790 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0844 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.3630 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0627 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.3263 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +1.1131 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.3879 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.0135 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.4606 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0366 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "   +0.0000 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.5312 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.0334 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4273 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.6780 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.4333 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0172 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0918 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.3730 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1990 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1449 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.1233 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.0081 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   -0.2869 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2821 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x3-x1>=0.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0738 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   -0.4858 if x2<=2.0 & x4-x2<=1.0\n",
      "   +0.1469 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.4925 if x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +1.1299 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2657 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.9728 if x4-x2>=0.0\n",
      "   -0.5266 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0623 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.5200 if c>=1.0 & x2>=2.0\n",
      "   -0.2396 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.5891 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.0912 if c<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "   -0.0401 if c<=0.0 & x1<=2.0 & x1>=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.3849 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.0461 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.7083 if c<=0.0 & x1>=2.0 & x2<=1.0 & x4-x2<=-1.0\n",
      "   -0.1463 if c<=0.0 & x1<=1.0 & x4-x2<=-2.0\n",
      "   +0.0516 if x1>=2.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.1930 if c<=0.0 & x1>=3.0 & x3-x1>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.5789 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.3953 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0264 if c<=0.0 & x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.7790 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0800 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.7123 if c>=1.0 & x2<=1.0\n",
      "   -0.0423 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.1357 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.5570 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2090 if x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0951 if c<=0.0 & x2<=0.0\n",
      "   -0.0451 if x1<=0.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0952 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.0828 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1017 if x4-x2>=2.0\n",
      "   -0.5432 if c<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "init state [ 3  0 -3  1  0]\n",
      "(29,) (29,)\n",
      "init state [0 2 2 0 0]\n",
      "(35,) (6,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(43,) (8,)\n",
      "init state [3 0 0 2 0]\n",
      "(49,) (6,)\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(61,) (12,)\n",
      "init state [0 1 2 0 0]\n",
      "(67,) (6,)\n",
      "init state [1 1 2 1 0]\n",
      "(111,) (44,)\n",
      "init state [2 1 1 0 0]\n",
      "(120,) (9,)\n",
      "init state [0 0 2 1 0]\n",
      "(136,) (16,)\n",
      "init state [0 0 1 1 0]\n",
      "(146,) (10,)\n",
      "============ 66 ===========\n",
      "Run episode 66 with rewards 32, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.4028 if c>=1.0 & x2>=3.0\n",
      "   +0.0944 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1226 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0419 if x1>=2.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0796 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0662 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4119 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +1.0169 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.3166 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.3754 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.1075 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2262 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "   +0.4107 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.0812 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2731 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   -0.3088 if x2>=1.0 & x3-x1>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.6350 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.4995 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.3687 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0552 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1970 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.5773 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3134 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.1440 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   +0.0379 if x1<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2<=2.0\n",
      "   -0.4855 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0906 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.3431 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   -0.2206 if x2<=2.0 & x4-x2<=1.0\n",
      "   +0.4819 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.4968 if x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.5914 if x2>=1.0 & x3-x1<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.8652 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0711 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.9528 if x4-x2>=0.0\n",
      "   -0.3279 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1778 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.1215 if c>=1.0 & x2>=2.0\n",
      "   -0.2601 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.0622 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.1320 if c<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "   +0.2655 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.0516 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x2<=1.0 & x4-x2<=-1.0\n",
      "   +0.1320 if c<=0.0 & x1<=1.0 & x4-x2<=-2.0\n",
      "   -0.0683 if x1>=2.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.3841 if c<=0.0 & x1>=3.0 & x3-x1>=0.0\n",
      "   +0.2640 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.4784 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.2466 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.9628 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0955 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.3424 if c>=1.0 & x2<=1.0\n",
      "   -0.3940 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.2045 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.2490 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0134 if x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0323 if c<=0.0 & x2<=0.0\n",
      "   +0.2148 if x1<=0.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0467 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.1024 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1923 if x4-x2>=2.0\n",
      "   -0.7470 if c<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4346 if x2>=1.0 & x3-x1>=3.0 & x4-x2>=1.0\n",
      "init state [1 3 1 0 0]\n",
      "(10,) (10,)\n",
      "init state [ 0  3  2 -2  0]\n",
      "(37,) (27,)\n",
      "init state [ 2  1 -1  1  0]\n",
      "(48,) (11,)\n",
      "init state [1 1 0 2 0]\n",
      "(71,) (23,)\n",
      "init state [ 1  3  2 -1  0]\n",
      "(77,) (6,)\n",
      "init state [ 2  2 -1 -1  0]\n",
      "(91,) (14,)\n",
      "init state [0 0 3 2 0]\n",
      "(104,) (13,)\n",
      "init state [ 3  1 -2  2  0]\n",
      "(124,) (20,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(142,) (18,)\n",
      "init state [0 0 3 1 0]\n",
      "(149,) (7,)\n",
      "============ 67 ===========\n",
      "Run episode 67 with rewards 35, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.2826 if c>=1.0 & x2>=3.0\n",
      "   +0.0062 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3067 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1729 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3719 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4235 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +1.2856 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.2870 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.3788 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.3694 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1660 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "   +0.2058 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.0670 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4653 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1>=3.0\n",
      "   +0.3736 if x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.2120 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0543 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.1566 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4549 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1248 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.2802 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2509 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.0229 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.5513 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1107 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.2016 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.1827 if x2<=2.0 & x4-x2<=1.0\n",
      "   +0.7924 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.2019 if x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.4014 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.9806 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.3546 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0898 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.8746 if x4-x2>=0.0\n",
      "   -0.4593 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0173 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-2.0\n",
      "   -0.0841 if c>=1.0 & x2>=2.0\n",
      "   -0.0697 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.3397 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.0519 if c<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "   -0.4334 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.1831 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1553 if c<=0.0 & x1<=1.0 & x4-x2<=-2.0\n",
      "   -0.1647 if x1>=2.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.5211 if c<=0.0 & x1>=3.0 & x3-x1>=0.0\n",
      "   +0.6262 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1405 if c<=0.0 & x2>=2.0 & x3-x1<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.7998 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.1334 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4994 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1545 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0087 if c>=1.0 & x2<=1.0\n",
      "   -0.5701 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.0266 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.3066 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.2274 if c<=0.0 & x2<=0.0\n",
      "   -0.2048 if x1<=0.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0416 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.0861 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3834 if x4-x2>=2.0\n",
      "   -0.4863 if c<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0000 if x2>=1.0 & x3-x1>=3.0 & x4-x2>=1.0\n",
      "   +0.4535 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "init state [ 2  3  1 -2  0]\n",
      "(34,) (34,)\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(170,) (136,)\n",
      "init state [0 1 0 1 0]\n",
      "(178,) (8,)\n",
      "init state [2 2 0 1 0]\n",
      "(180,) (2,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(187,) (7,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(202,) (15,)\n",
      "init state [ 3  0 -2  0  0]\n",
      "(252,) (50,)\n",
      "init state [0 0 1 1 0]\n",
      "(274,) (22,)\n",
      "init state [ 1  3  1 -2  0]\n",
      "(296,) (22,)\n",
      "init state [ 0  3  1 -1  0]\n",
      "(303,) (7,)\n",
      "============ 68 ===========\n",
      "Run episode 68 with rewards 35, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.2732 if c>=1.0 & x2>=3.0\n",
      "   -0.1181 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2279 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2070 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0254 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.6020 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.0637 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.6683 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.0569 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0959 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "   -0.2449 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5205 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4007 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   -0.1473 if x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.3433 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.2621 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.5089 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0444 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.6780 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.3214 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1253 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.6463 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.0000 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.3353 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0374 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   -0.2054 if x2<=2.0 & x4-x2<=1.0\n",
      "   +0.2356 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.0025 if x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0014 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.3527 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2647 if x1<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.6958 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2137 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.3893 if x4-x2>=0.0\n",
      "   -0.1468 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.5351 if c>=1.0 & x2>=2.0\n",
      "   -0.1260 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.1730 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.0271 if c<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "   -0.1663 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.1839 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.2926 if c<=0.0 & x1<=1.0 & x4-x2<=-2.0\n",
      "   -0.3202 if x1>=2.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   +0.0529 if c<=0.0 & x1>=3.0 & x3-x1>=0.0\n",
      "   +0.0539 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.3272 if c<=0.0 & x2>=2.0 & x3-x1<=1.0\n",
      "   -0.1990 if x2>=3.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.6469 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.7896 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3800 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1981 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.2214 if c>=1.0 & x2<=1.0\n",
      "   -0.0348 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.2817 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.1522 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.4850 if c<=0.0 & x2<=0.0\n",
      "   -0.2134 if x1<=0.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2679 if x2>=2.0 & x3-x1<=1.0\n",
      "   -0.0751 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if x4-x2>=2.0\n",
      "   -0.2430 if c<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2392 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5351 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "init state [ 1  2 -1  1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(131,) (131,)\n",
      "init state [ 2  3  1 -3  0]\n",
      "(150,) (19,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(232,) (82,)\n",
      "init state [ 1  0 -1  3  0]\n",
      "(243,) (11,)\n",
      "init state [ 2  3  0 -1  0]\n",
      "(246,) (3,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(249,) (3,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(255,) (6,)\n",
      "init state [ 3  2 -2 -2  0]\n",
      "(293,) (38,)\n",
      "init state [0 0 2 3 0]\n",
      "(305,) (12,)\n",
      "init state [0 1 3 1 0]\n",
      "(310,) (5,)\n",
      "============ 69 ===========\n",
      "Run episode 69 with rewards 37, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.6961 if c>=1.0 & x2>=3.0\n",
      "   -0.8160 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +1.1671 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.7023 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1329 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2911 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +2.3830 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1971 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.3582 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0398 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "   -0.0330 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.7178 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -1.6565 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.7162 if x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   -0.9483 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +4.3784 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.0331 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.5569 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0218 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -1.2643 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1308 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0733 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.4735 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3967 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0359 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.2701 if x2<=2.0 & x4-x2<=1.0\n",
      "   +0.2873 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.4698 if x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.7101 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.5941 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   +0.3100 if x3-x1>=3.0\n",
      "----------------- 2 --------------\n",
      "   +1.5130 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2066 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.1503 if x4-x2>=0.0\n",
      "   -0.7803 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1259 if c>=1.0 & x2>=2.0\n",
      "   -0.7203 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.5132 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.1903 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.7466 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.2850 if c<=0.0 & x1<=1.0 & x4-x2<=-2.0\n",
      "   +0.1188 if x1>=2.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   +0.5268 if c<=0.0 & x1>=3.0 & x3-x1>=0.0\n",
      "   +0.3035 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3087 if c<=0.0 & x2>=2.0 & x3-x1<=1.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1720 if x3-x1<=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.3272 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.7210 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3918 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0460 if x1<=2.0 & x1>=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.2580 if c>=1.0 & x2<=1.0\n",
      "   -0.1180 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.0816 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.4874 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0776 if c<=0.0 & x2<=0.0\n",
      "   -0.2456 if x1<=0.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.6023 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.0605 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4177 if c<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1764 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1544 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.2476 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "init state [ 3  1 -3  2  0]\n",
      "(19,) (19,)\n",
      "init state [0 1 3 1 0]\n",
      "(30,) (11,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(46,) (16,)\n",
      "init state [0 0 1 1 0]\n",
      "(57,) (11,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(81,) (24,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(99,) (18,)\n",
      "init state [ 3  0 -1  1  0]\n",
      "(108,) (9,)\n",
      "init state [2 0 0 1 0]\n",
      "(128,) (20,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(137,) (9,)\n",
      "init state [0 0 1 0 0]\n",
      "(153,) (16,)\n",
      "============ 70 ===========\n",
      "Run episode 70 with rewards 26, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.2748 if c>=1.0 & x2>=3.0\n",
      "   -0.4085 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0292 if c<=0.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1667 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3763 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4964 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.4707 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.4096 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.3201 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1177 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "   +0.5944 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.3689 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.1429 if x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   -0.0309 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.8654 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2777 if x2>=2.0 & x3-x1>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.3162 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.1220 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0016 if x2>=2.0 & x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.7532 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.3247 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0832 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3582 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3260 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0724 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.0437 if x2<=2.0 & x4-x2<=1.0\n",
      "   +0.0055 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.2015 if x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2989 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.3925 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1439 if x3-x1>=3.0\n",
      "   +0.3868 if x1<=2.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.6196 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3757 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.4771 if x4-x2>=0.0\n",
      "   -0.3169 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.6029 if c>=1.0 & x2>=2.0\n",
      "   -0.1409 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.2519 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.2104 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.4107 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.1126 if c<=0.0 & x1<=1.0 & x4-x2<=-2.0\n",
      "   -0.1163 if x1>=2.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.2462 if c<=0.0 & x1>=3.0 & x3-x1>=0.0\n",
      "   +0.1284 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0612 if c<=0.0 & x2>=2.0 & x3-x1<=1.0\n",
      "   -0.1103 if x3-x1<=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.1840 if x4-x2>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.5309 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4492 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3650 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1261 if c>=1.0 & x2<=1.0\n",
      "   +0.0874 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.3063 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.0738 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1309 if c<=0.0 & x2<=0.0\n",
      "   -0.1111 if x1<=0.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.9068 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.2016 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2147 if c<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3729 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.0287 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.5912 if x1<=2.0 & x4-x2<=0.0\n",
      "init state [ 3  2 -3 -2  0]\n",
      "(35,) (35,)\n",
      "init state [ 1  2  1 -1  0]\n",
      "(42,) (7,)\n",
      "init state [ 2  3  0 -1  0]\n",
      "(45,) (3,)\n",
      "init state [ 3  1 -2  1  0]\n",
      "(64,) (19,)\n",
      "init state [ 2  2 -2 -1  0]\n",
      "(85,) (21,)\n",
      "init state [ 1  0 -1  0  0]\n",
      "(93,) (8,)\n",
      "init state [ 3  2 -2 -2  0]\n",
      "(144,) (51,)\n",
      "init state [0 1 0 1 0]\n",
      "(159,) (15,)\n",
      "init state [0 2 2 1 0]\n",
      "(163,) (4,)\n",
      "init state [ 2  3 -2  0  0]\n",
      "(181,) (18,)\n",
      "============ 71 ===========\n",
      "Run episode 71 with rewards 24, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.4604 if c>=1.0 & x2>=3.0\n",
      "   -0.5266 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2143 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2091 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.7366 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.5030 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.1045 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.0865 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0496 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "   +0.6526 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2558 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.1189 if x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.2179 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.3209 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0000 if x2>=2.0 & x3-x1>=3.0\n",
      "   -0.3461 if x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   +0.3828 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.2937 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.5994 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.0932 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0143 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.4270 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.2567 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1283 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.1509 if x2<=2.0 & x4-x2<=1.0\n",
      "   +0.2041 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.2185 if x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0465 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.0940 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   +0.4835 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5676 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.8232 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.4070 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.7199 if x4-x2>=0.0\n",
      "   -0.4188 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3522 if c>=1.0 & x2>=2.0\n",
      "   -0.2681 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.2222 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.4321 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.3189 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.1548 if c<=0.0 & x1<=1.0 & x4-x2<=-2.0\n",
      "   -0.0280 if x1>=2.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.0000 if c<=0.0 & x1>=3.0 & x3-x1>=0.0\n",
      "   +0.2682 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0337 if x3-x1<=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.0000 if x4-x2>=3.0\n",
      "   -0.0271 if x3-x1<=-2.0 & x4-x2<=-3.0\n",
      "----------------- 3 --------------\n",
      "   +0.4142 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.7602 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.6293 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1727 if c>=1.0 & x2<=1.0\n",
      "   -0.1215 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.0386 if x2>=1.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.3027 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1992 if c<=0.0 & x2<=0.0\n",
      "   -0.0637 if x1<=0.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.5072 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.1752 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2451 if c<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0518 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.4243 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.2111 if x1<=2.0 & x4-x2<=0.0\n",
      "   -0.1572 if x1>=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(51,) (51,)\n",
      "init state [ 0  3  1 -1  0]\n",
      "(69,) (18,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(94,) (25,)\n",
      "init state [1 0 1 2 0]\n",
      "(100,) (6,)\n",
      "init state [ 2  0 -1  0  0]\n",
      "(107,) (7,)\n",
      "init state [ 2  1 -2  2  0]\n",
      "(114,) (7,)\n",
      "init state [1 1 1 1 0]\n",
      "(132,) (18,)\n",
      "init state [1 0 1 3 0]\n",
      "(151,) (19,)\n",
      "init state [0 3 1 0 0]\n",
      "(163,) (12,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(182,) (19,)\n",
      "============ 72 ===========\n",
      "Run episode 72 with rewards 23, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.4689 if c>=1.0 & x2>=3.0\n",
      "   +0.0754 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1225 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0045 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.5947 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.3628 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.1253 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.2021 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.4520 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "   +0.4164 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2635 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   -0.1591 if x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.4462 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.5000 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.4171 if x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.0158 if x3-x1>=3.0\n",
      "----------------- 1 --------------\n",
      "   -0.0074 if c>=1.0 & x1>=1.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0580 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.6005 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.0350 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0955 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3404 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.2136 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1021 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.0443 if x2<=2.0 & x4-x2<=1.0\n",
      "   +0.2405 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.0900 if x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1935 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.0300 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.7563 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4638 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.8201 if c>=1.0 & x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.5659 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1816 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.7682 if x4-x2>=0.0\n",
      "   -0.2795 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1987 if c>=1.0 & x2>=2.0\n",
      "   -0.3059 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.0296 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.4113 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.2140 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0656 if c<=0.0 & x1<=1.0 & x4-x2<=-2.0\n",
      "   -0.0000 if x1>=2.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.0000 if c<=0.0 & x1>=3.0 & x3-x1>=0.0\n",
      "   +0.2474 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1153 if x3-x1<=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.0493 if x3-x1<=-2.0 & x4-x2<=-3.0\n",
      "   -0.3341 if x4-x2<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.2897 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.6404 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2301 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0936 if c>=1.0 & x2<=1.0\n",
      "   -0.1721 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.0681 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0734 if c<=0.0 & x2<=0.0\n",
      "   -0.0265 if x1<=0.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.4749 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.2788 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.5295 if c<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1824 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.5459 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1492 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2594 if x1>=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.6786 if c>=1.0 & x1<=2.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "init state [1 1 1 0 0]\n",
      "(6,) (6,)\n",
      "init state [1 1 2 0 0]\n",
      "(120,) (114,)\n",
      "init state [ 1  1  1 -1  0]\n",
      "(138,) (18,)\n",
      "init state [ 1  2  2 -2  0]\n",
      "(202,) (64,)\n",
      "init state [ 3  1 -2  2  0]\n",
      "(209,) (7,)\n",
      "init state [2 2 1 0 0]\n",
      "(216,) (7,)\n",
      "init state [ 2  2 -2  1  0]\n",
      "(224,) (8,)\n",
      "init state [1 2 0 1 0]\n",
      "(231,) (7,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(253,) (22,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(265,) (12,)\n",
      "============ 73 ===========\n",
      "Run episode 73 with rewards 30, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.2922 if c>=1.0 & x2>=3.0\n",
      "   -0.0732 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1516 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4927 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +1.3301 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.6358 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.3164 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0016 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=1.0\n",
      "   +0.7886 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4624 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.7841 if x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.8121 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.3388 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.4802 if x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.1832 if x3-x1>=3.0\n",
      "   -0.3074 if c<=0.0 & x1<=2.0 & x3-x1<=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.2324 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.5306 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.3183 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.2957 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1213 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.0650 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.2371 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.1423 if x2<=2.0 & x4-x2<=1.0\n",
      "   +0.1580 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.0129 if x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3000 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.6019 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.5603 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.0500 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2929 if c>=1.0 & x2>=1.0\n",
      "   +0.3396 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +2.7132 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2151 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -2.0034 if x4-x2>=0.0\n",
      "   -0.8677 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1744 if c>=1.0 & x2>=2.0\n",
      "   +0.3334 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +2.3053 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.8141 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.3598 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.9779 if c<=0.0 & x1<=1.0 & x4-x2<=-2.0\n",
      "   +2.1276 if x1>=2.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   +1.4252 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3898 if x3-x1<=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x3-x1<=-2.0 & x4-x2<=-3.0\n",
      "   +1.0662 if x4-x2<=1.0\n",
      "   -1.4127 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.3479 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3789 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4755 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.2027 if c>=1.0 & x2<=1.0\n",
      "   -0.1300 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.1338 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0048 if c<=0.0 & x2<=0.0\n",
      "   +0.0676 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.7483 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.6099 if c<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1009 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.1112 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.2892 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.0770 if x1>=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.2043 if c>=1.0 & x1<=2.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.4237 if c<=0.0 & x3-x1<=-2.0 & x4-x2>=1.0\n",
      "init state [ 0  3  1 -2  0]\n",
      "(20,) (20,)\n",
      "init state [0 2 1 0 0]\n",
      "(25,) (5,)\n",
      "init state [ 3  0 -1  3  0]\n",
      "(52,) (27,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(74,) (22,)\n",
      "init state [ 0  2  1 -1  0]\n",
      "(81,) (7,)\n",
      "init state [0 1 2 0 0]\n",
      "(98,) (17,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(104,) (6,)\n",
      "init state [0 1 3 1 0]\n",
      "(147,) (43,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(161,) (14,)\n",
      "init state [0 0 2 3 0]\n",
      "(179,) (18,)\n",
      "============ 74 ===========\n",
      "Run episode 74 with rewards 24, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.1689 if c>=1.0 & x2>=3.0\n",
      "   -0.0558 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0970 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3278 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.4182 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1827 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.3372 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5056 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.5624 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   -0.0356 if x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.0890 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.7691 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3816 if x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.3730 if x3-x1>=3.0\n",
      "   +0.1902 if c<=0.0 & x1<=2.0 & x3-x1<=0.0\n",
      "   -0.2842 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.0306 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.6409 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.2743 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.6599 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3133 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.2830 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.1376 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.0979 if x2<=2.0 & x4-x2<=1.0\n",
      "   -0.2285 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.2438 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.6703 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4372 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4478 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.4616 if c>=1.0 & x2>=1.0\n",
      "   -0.0729 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.2022 if x1>=3.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.3441 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2117 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.8329 if x4-x2>=0.0\n",
      "   -0.6931 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3694 if c>=1.0 & x2>=2.0\n",
      "   +0.3779 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.9701 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.3369 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.3672 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.0315 if c<=0.0 & x1<=1.0 & x4-x2<=-2.0\n",
      "   -0.0000 if x1>=2.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   +0.3271 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3561 if x3-x1<=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.3268 if x4-x2<=1.0\n",
      "   +0.4683 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.6233 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.3271 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.6507 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3630 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0582 if c>=1.0 & x2<=1.0\n",
      "   +0.0472 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.6875 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.2386 if x2>=2.0 & x3-x1<=1.0\n",
      "   -0.2784 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.6998 if c<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4253 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.0689 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.5424 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.4224 if x1>=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.1318 if c>=1.0 & x1<=2.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.0211 if c<=0.0 & x3-x1<=-2.0 & x4-x2>=1.0\n",
      "   -0.0453 if c>=1.0 & x4-x2>=-1.0\n",
      "init state [ 1  2  0 -1  0]\n",
      "(12,) (12,)\n",
      "init state [0 2 1 0 0]\n",
      "(36,) (24,)\n",
      "init state [1 2 0 1 0]\n",
      "(45,) (9,)\n",
      "init state [1 2 2 0 0]\n",
      "(71,) (26,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(76,) (5,)\n",
      "init state [0 1 2 2 0]\n",
      "(85,) (9,)\n",
      "init state [ 3  1 -2  2  0]\n",
      "(93,) (8,)\n",
      "init state [0 1 1 1 0]\n",
      "(101,) (8,)\n",
      "init state [3 0 0 2 0]\n",
      "(112,) (11,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(115,) (3,)\n",
      "============ 75 ===========\n",
      "Run episode 75 with rewards 39, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.1883 if c>=1.0 & x2>=3.0\n",
      "   -0.3799 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0727 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3905 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.5688 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.2981 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.4925 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2760 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0625 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.2729 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.5320 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0148 if x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.3286 if x3-x1>=3.0\n",
      "   +0.7004 if c<=0.0 & x1<=2.0 & x3-x1<=0.0\n",
      "   -0.2125 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.4340 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.6851 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.3106 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3967 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.6071 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.1403 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1342 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.1680 if x2<=2.0 & x4-x2<=1.0\n",
      "   -0.1890 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.2640 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.6889 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0915 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2295 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.3476 if c>=1.0 & x2>=1.0\n",
      "   -0.3787 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1006 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.0979 if x2<=2.0 & x3-x1<=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.6572 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0286 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.3288 if x4-x2>=0.0\n",
      "   +0.0842 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1323 if c>=1.0 & x2>=2.0\n",
      "   -0.0948 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.4538 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.0000 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x4-x2<=-2.0\n",
      "   +0.1989 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3300 if x3-x1<=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.3270 if x4-x2<=1.0\n",
      "   +0.0357 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.5248 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.3245 if x1>=1.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4165 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5777 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3369 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.2732 if c>=1.0 & x2<=1.0\n",
      "   +0.3117 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.2449 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0689 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.0998 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4195 if c<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.5473 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.2771 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.8519 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.1387 if x1>=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.0667 if c>=1.0 & x1<=2.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.3531 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.5245 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "init state [ 2  2 -1 -2  0]\n",
      "(17,) (17,)\n",
      "init state [ 1  1 -1  0  0]\n",
      "(28,) (11,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(47,) (19,)\n",
      "init state [ 2  3 -2 -2  0]\n",
      "(59,) (12,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(66,) (7,)\n",
      "init state [ 2  3 -2 -2  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(95,) (29,)\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(115,) (20,)\n",
      "init state [0 0 2 3 0]\n",
      "(144,) (29,)\n",
      "init state [ 1  3 -1 -2  0]\n",
      "(176,) (32,)\n",
      "init state [1 0 2 0 0]\n",
      "(183,) (7,)\n",
      "============ 76 ===========\n",
      "Run episode 76 with rewards 35, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.2183 if c>=1.0 & x2>=3.0\n",
      "   -0.0384 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2474 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5153 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.5341 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.3236 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.0398 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3372 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0426 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.0631 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.4301 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   +0.9098 if c<=0.0 & x1<=2.0 & x3-x1<=0.0\n",
      "   +0.0000 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.0000 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   -0.1559 if c<=0.0 & x3-x1>=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.4280 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.0739 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3213 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.5113 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.0954 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0507 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.5788 if x2<=2.0 & x4-x2<=1.0\n",
      "   +0.1359 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.5363 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.3583 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0947 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.5369 if c>=1.0 & x2>=1.0\n",
      "   +0.0052 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.0000 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.0167 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.8408 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.5982 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0792 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.4041 if x4-x2>=0.0\n",
      "   -0.1044 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1675 if c>=1.0 & x2>=2.0\n",
      "   -0.1046 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.6311 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.1105 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.4488 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.2895 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2139 if x3-x1<=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.1046 if x4-x2<=1.0\n",
      "   -0.2124 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.2032 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.0318 if x1>=1.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.2898 if x3-x1<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.5286 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.0190 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0326 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.5101 if c>=1.0 & x2<=1.0\n",
      "   -0.0579 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.0249 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0272 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.0862 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2633 if c<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.5336 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.2857 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.4068 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3679 if x1>=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.7991 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.2938 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "   -0.2250 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "init state [0 0 1 1 0]\n",
      "(15,) (15,)\n",
      "init state [0 1 1 1 0]\n",
      "(24,) (9,)\n",
      "init state [0 1 3 1 0]\n",
      "(31,) (7,)\n",
      "init state [ 1  0 -1  3  0]\n",
      "(43,) (12,)\n",
      "init state [ 3  2 -3 -2  0]\n",
      "(85,) (42,)\n",
      "init state [0 0 3 0 0]\n",
      "(110,) (25,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(122,) (12,)\n",
      "init state [ 2  0 -2  0  0]\n",
      "(139,) (17,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(166,) (27,)\n",
      "init state [ 2  0 -2  0  0]\n",
      "(191,) (25,)\n",
      "============ 77 ===========\n",
      "Run episode 77 with rewards 17, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.4966 if c>=1.0 & x2>=3.0\n",
      "   -0.2927 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1612 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2659 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.2145 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0388 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.3517 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0557 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1352 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.4830 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.4971 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0197 if x3-x1>=3.0\n",
      "   +0.4993 if c<=0.0 & x1<=2.0 & x3-x1<=0.0\n",
      "   -0.0411 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   -0.2227 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.6274 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.6376 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1517 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1389 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3456 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.0918 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1094 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.3751 if x2<=2.0 & x4-x2<=1.0\n",
      "   +0.4254 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.2448 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.0519 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2749 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.5830 if c>=1.0 & x2>=1.0\n",
      "   -0.4204 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1643 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.3238 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.6262 if c>=1.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0 & x4-x2<=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.5884 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2998 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.3103 if x4-x2>=0.0\n",
      "   +0.0740 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4700 if c>=1.0 & x2>=2.0\n",
      "   -0.0202 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.6217 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.0348 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.1456 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.2185 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1274 if x3-x1<=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.0946 if x4-x2<=1.0\n",
      "   +0.2786 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.0456 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.3855 if x3-x1<=0.0\n",
      "   +0.1756 if x4-x2<=-3.0\n",
      "----------------- 3 --------------\n",
      "   +0.2821 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.0355 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.2124 if c>=1.0 & x2<=1.0\n",
      "   -0.2276 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.1624 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.2111 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.2428 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0890 if c<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6704 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.2402 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.3429 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3024 if x1>=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.9174 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.3424 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.8824 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "init state [1 1 1 1 0]\n",
      "(12,) (12,)\n",
      "init state [ 2  0 -2  1  0]\n",
      "(45,) (33,)\n",
      "init state [0 1 0 1 0]\n",
      "(52,) (7,)\n",
      "init state [ 3  2 -1 -1  0]\n",
      "(68,) (16,)\n",
      "init state [ 3  0 -1  1  0]\n",
      "(74,) (6,)\n",
      "init state [ 2  2 -2  1  0]\n",
      "(96,) (22,)\n",
      "init state [ 1  1  1 -1  0]\n",
      "(111,) (15,)\n",
      "init state [1 0 1 0 0]\n",
      "(123,) (12,)\n",
      "init state [ 1  0 -1  2  0]\n",
      "(136,) (13,)\n",
      "init state [3 0 0 1 0]\n",
      "(139,) (3,)\n",
      "============ 78 ===========\n",
      "Run episode 78 with rewards 39, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.3709 if c>=1.0 & x2>=3.0\n",
      "   +0.0125 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0919 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1425 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.1672 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.2147 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   -0.2791 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0344 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.1820 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   -0.3674 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.4334 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.4207 if c<=0.0 & x1<=2.0 & x3-x1<=0.0\n",
      "   +0.0000 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   +0.2439 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.4665 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   -0.4974 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.1310 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.0297 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.2985 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.5485 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.2860 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.3126 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.0480 if x2<=2.0 & x4-x2<=1.0\n",
      "   +0.0191 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.3773 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.3659 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.5130 if c>=1.0 & x2>=1.0\n",
      "   +0.2493 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.4360 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.6573 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0706 if c>=1.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0 & x4-x2<=-2.0\n",
      "   -0.6659 if x1>=3.0 & x4-x2<=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.4950 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3460 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.3538 if x4-x2>=0.0\n",
      "   -0.2540 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4060 if c>=1.0 & x2>=2.0\n",
      "   +0.4180 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.1587 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.0541 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.2676 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0014 if x3-x1<=2.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.0871 if x4-x2<=1.0\n",
      "   -0.4124 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.1102 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.2337 if x3-x1<=0.0\n",
      "   -0.0303 if x4-x2<=-3.0\n",
      "   -0.6690 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.1406 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3104 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.5575 if c>=1.0 & x2<=1.0\n",
      "   -0.0327 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.1246 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0326 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.2664 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0208 if c<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2944 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.2163 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.3473 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3830 if x1>=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.8783 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.3490 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.7119 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.1348 if x1>=2.0 & x3-x1>=-2.0\n",
      "init state [ 3  1 -2  2  0]\n",
      "(10,) (10,)\n",
      "init state [1 0 1 1 0]\n",
      "(22,) (12,)\n",
      "init state [0 0 1 1 0]\n",
      "(32,) (10,)\n",
      "init state [ 3  2 -2 -1  0]\n",
      "(55,) (23,)\n",
      "init state [0 0 1 2 0]\n",
      "(77,) (22,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(88,) (11,)\n",
      "init state [1 1 2 1 0]\n",
      "(92,) (4,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(96,) (4,)\n",
      "init state [ 2  3  0 -3  0]\n",
      "(110,) (14,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(123,) (13,)\n",
      "============ 79 ===========\n",
      "Run episode 79 with rewards 29, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.2512 if c>=1.0 & x2>=3.0\n",
      "   +0.0259 if c<=0.0 & x1<=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0902 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0968 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.2915 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.2751 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.1157 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1788 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.3404 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.0605 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +1.0698 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.4371 if c<=0.0 & x1<=2.0 & x3-x1<=0.0\n",
      "   -0.2804 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.0874 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   -0.3470 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.6424 if x1>=3.0 & x3-x1<=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.0461 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.3303 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.6375 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.5902 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.2047 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.4736 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   -0.3046 if x2<=2.0 & x4-x2<=1.0\n",
      "   +0.1743 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.1031 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.4605 if c>=1.0 & x2>=1.0\n",
      "   -0.2067 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.3794 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.7130 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1380 if c>=1.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0 & x4-x2<=-2.0\n",
      "   -0.3173 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4154 if x3-x1>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.6576 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.4212 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.2544 if x4-x2>=0.0\n",
      "   +0.0215 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4022 if c>=1.0 & x2>=2.0\n",
      "   +0.1593 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.2256 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.0957 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.0014 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1553 if x4-x2<=1.0\n",
      "   -0.2439 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.3166 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.3528 if x3-x1<=0.0\n",
      "   +0.3107 if x4-x2<=-3.0\n",
      "   -0.3332 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   -0.4567 if x2>=1.0 & x3-x1<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.2176 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.6340 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1927 if c>=1.0 & x2<=1.0\n",
      "   -0.1476 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.0993 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.2236 if x2>=2.0 & x3-x1<=1.0\n",
      "   -0.0259 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.6605 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.0158 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.4381 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.0056 if x1>=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.7021 if c>=1.0 & x4-x2>=-1.0\n",
      "   -0.0142 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.1872 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0096 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.8351 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "init state [ 2  2 -1 -1  0]\n",
      "(20,) (20,)\n",
      "init state [ 1  3 -1 -3  0]\n",
      "(47,) (27,)\n",
      "init state [ 1  2  0 -1  0]\n",
      "(59,) (12,)\n",
      "init state [ 0  3  1 -1  0]\n",
      "(80,) (21,)\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(91,) (11,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(100,) (9,)\n",
      "init state [ 3  1 -1 -1  0]\n",
      "(115,) (15,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(130,) (15,)\n",
      "init state [ 2  0 -2  0  0]\n",
      "(144,) (14,)\n",
      "init state [ 2  1 -1  1  0]\n",
      "(166,) (22,)\n",
      "============ 80 ===========\n",
      "Run episode 80 with rewards 20, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.2514 if c>=1.0 & x2>=3.0\n",
      "   -0.0943 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4841 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   -0.1038 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0527 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3177 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1168 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.0987 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.8686 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.1015 if c<=0.0 & x1<=2.0 & x3-x1<=0.0\n",
      "   +0.4233 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.1200 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   -0.4154 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.4226 if x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.4799 if c<=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.2284 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0003 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.5144 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3957 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.3203 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   -0.1498 if x2<=2.0 & x4-x2<=1.0\n",
      "   +0.4932 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.5661 if c>=1.0 & x2>=1.0\n",
      "   +0.0000 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1326 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.4112 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2039 if c>=1.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0 & x4-x2<=-2.0\n",
      "   +0.0055 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.0000 if x3-x1>=2.0\n",
      "   +0.5542 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.8169 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1323 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.1973 if x4-x2>=0.0\n",
      "   -0.5560 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3207 if c>=1.0 & x2>=2.0\n",
      "   +0.4431 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.1229 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.1420 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1600 if x4-x2<=1.0\n",
      "   -0.1492 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.2020 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.0255 if x3-x1<=0.0\n",
      "   +0.1299 if x4-x2<=-3.0\n",
      "   -0.3163 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.0902 if x2>=1.0 & x3-x1<=0.0\n",
      "   -0.0817 if x1>=3.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.3620 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +1.0917 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.4094 if c>=1.0 & x2<=1.0\n",
      "   +0.0000 if x2<=2.0 & x3-x1>=2.0\n",
      "   -0.0025 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0688 if x2>=2.0 & x3-x1<=1.0\n",
      "   -0.0137 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5388 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.0025 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.2285 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.4660 if c>=1.0 & x4-x2>=-1.0\n",
      "   -0.4899 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.2418 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.2732 if x1>=2.0 & x3-x1>=-2.0\n",
      "   -0.0091 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4799 if x1<=2.0 & x4-x2<=-3.0\n",
      "init state [ 2  0 -2  2  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(17,) (17,)\n",
      "init state [ 2  2 -2  1  0]\n",
      "(30,) (13,)\n",
      "init state [ 3  2  0 -2  0]\n",
      "(36,) (6,)\n",
      "init state [0 2 0 1 0]\n",
      "(50,) (14,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(66,) (16,)\n",
      "init state [0 1 0 1 0]\n",
      "(79,) (13,)\n",
      "init state [2 0 0 1 0]\n",
      "(91,) (12,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(106,) (15,)\n",
      "init state [ 1  2  2 -1  0]\n",
      "(113,) (7,)\n",
      "init state [ 2  3 -1 -1  0]\n",
      "(127,) (14,)\n",
      "============ 81 ===========\n",
      "Run episode 81 with rewards 28, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.0726 if c>=1.0 & x2>=3.0\n",
      "   -0.3876 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4640 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.2027 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1719 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.7614 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2592 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   -0.3443 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.8801 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.1078 if c<=0.0 & x1<=2.0 & x3-x1<=0.0\n",
      "   +0.2201 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.2315 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   -0.4882 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2682 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.0499 if c<=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0267 if x1<=2.0 & x1>=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.0469 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.4431 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.5370 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.7077 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.2578 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.0380 if x2<=2.0 & x4-x2<=1.0\n",
      "   -0.2830 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.6969 if c>=1.0 & x2>=1.0\n",
      "   +0.2590 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1438 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.2723 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1827 if c>=1.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0 & x4-x2<=-2.0\n",
      "   -0.3317 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3476 if x3-x1>=2.0\n",
      "   +0.1384 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4585 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.7427 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0949 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.7127 if x4-x2>=0.0\n",
      "   -0.4161 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2192 if c>=1.0 & x2>=2.0\n",
      "   +0.3808 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.1173 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.0850 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.2977 if x4-x2<=1.0\n",
      "   +0.0467 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.1795 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.0728 if x4-x2<=-3.0\n",
      "   +0.2686 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.2016 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.0297 if x1>=3.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3113 if c<=0.0 & x1<=1.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.5982 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.9819 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.2690 if c>=1.0 & x2<=1.0\n",
      "   +0.0535 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0386 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.3449 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4109 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.2293 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.3295 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.1565 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.0260 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.5479 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.3441 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.0000 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0732 if x1<=2.0 & x4-x2<=-3.0\n",
      "   +0.3114 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "init state [ 2  0 -1  1  0]\n",
      "(11,) (11,)\n",
      "init state [ 0  3  0 -1  0]\n",
      "(26,) (15,)\n",
      "init state [ 1  2 -1  1  0]\n",
      "(35,) (9,)\n",
      "init state [2 1 1 1 0]\n",
      "(38,) (3,)\n",
      "init state [2 1 0 1 0]\n",
      "(48,) (10,)\n",
      "init state [ 2  2 -2 -1  0]\n",
      "(65,) (17,)\n",
      "init state [0 1 3 0 0]\n",
      "(76,) (11,)\n",
      "init state [ 3  0 -1  3  0]\n",
      "(112,) (36,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(135,) (23,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(148,) (13,)\n",
      "============ 82 ===========\n",
      "Run episode 82 with rewards 29, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.0731 if c>=1.0 & x2>=3.0\n",
      "   -0.2636 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2564 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.2064 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0364 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.4283 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2499 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   -0.0074 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.6085 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0029 if c<=0.0 & x1<=2.0 & x3-x1<=0.0\n",
      "   -0.1641 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.0746 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   -0.2127 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0419 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.1959 if c<=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.5791 if x3-x1<=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.0793 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.7095 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.6140 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.6884 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1526 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   -0.2378 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.6181 if c>=1.0 & x2>=1.0\n",
      "   +0.2885 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1975 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.3570 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c>=1.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0 & x4-x2<=-2.0\n",
      "   -0.5418 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3080 if x3-x1>=2.0\n",
      "   +0.2835 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4190 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.6851 if x2<=1.0 & x2>=1.0 & x3-x1<=2.0 & x3-x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.3565 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0216 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.2245 if x4-x2>=0.0\n",
      "   -0.0360 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4383 if c>=1.0 & x2>=2.0\n",
      "   +0.5112 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.0000 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.1684 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0670 if x4-x2<=1.0\n",
      "   -0.0052 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.1141 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.0000 if x4-x2<=-3.0\n",
      "   -0.3585 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.0982 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.3973 if c<=0.0 & x1<=1.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.3874 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.3538 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5379 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.2501 if c>=1.0 & x2<=1.0\n",
      "   +0.2569 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.1450 if x2>=2.0 & x3-x1<=1.0\n",
      "   -0.0382 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4496 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.3240 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.9300 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2349 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.2089 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.3249 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2933 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.0000 if x1<=2.0 & x4-x2<=-3.0\n",
      "   +0.4674 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.4468 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=2.0\n",
      "init state [ 2  3  0 -3  0]\n",
      "(21,) (21,)\n",
      "init state [0 0 1 2 0]\n",
      "(30,) (9,)\n",
      "init state [0 0 3 0 0]\n",
      "(38,) (8,)\n",
      "init state [2 0 1 1 0]\n",
      "(51,) (13,)\n",
      "init state [ 1  2 -1  0  0]\n",
      "(61,) (10,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(76,) (15,)\n",
      "init state [ 3  0 -1  3  0]\n",
      "(85,) (9,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(98,) (13,)\n",
      "init state [ 1  1  1 -1  0]\n",
      "(106,) (8,)\n",
      "init state [ 2  3 -2 -2  0]\n",
      "(132,) (26,)\n",
      "============ 83 ===========\n",
      "Run episode 83 with rewards 16, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   +0.0683 if c>=1.0 & x2>=3.0\n",
      "   -0.2348 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4952 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.5061 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0332 if x1<=2.0 & x1>=1.0 & x4-x2<=0.0\n",
      "   +0.7579 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4470 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   -0.1865 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.3060 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0996 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.0513 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   -0.1445 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0576 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.1914 if c<=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2281 if x3-x1<=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   -0.1598 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   -0.3845 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0527 if x2>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3232 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.5545 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.1596 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   -0.2514 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.9636 if c>=1.0 & x2>=1.0\n",
      "   +0.6163 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.3203 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.6166 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3177 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5774 if x3-x1>=2.0\n",
      "   +0.0819 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.6128 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.2129 if x2<=1.0 & x2>=1.0 & x3-x1<=2.0 & x3-x1>=1.0\n",
      "   -0.1369 if x1>=3.0 & x4-x2>=3.0\n",
      "----------------- 2 --------------\n",
      "   +0.3532 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2596 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.4223 if x4-x2>=0.0\n",
      "   +0.0205 if x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.5421 if c>=1.0 & x2>=2.0\n",
      "   +0.8529 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.1942 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.2417 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.4423 if x4-x2<=1.0\n",
      "   -0.3173 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.1300 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.1034 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.1942 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.5053 if c<=0.0 & x1<=1.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.3792 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.2160 if x4-x2>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.6243 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5974 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.3405 if c>=1.0 & x2<=1.0\n",
      "   +0.2363 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.2014 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.2858 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.6044 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.0172 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.6790 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.1895 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.0018 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.1641 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2907 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.1678 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.0000 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=2.0\n",
      "   -0.6598 if x1<=2.0 & x2<=0.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "init state [1 2 0 1 0]\n",
      "(9,) (9,)\n",
      "init state [0 1 3 0 0]\n",
      "(36,) (27,)\n",
      "init state [ 2  3 -2 -1  0]\n",
      "(51,) (15,)\n",
      "init state [ 1  2 -1  0  0]\n",
      "(57,) (6,)\n",
      "init state [ 3  0 -1  2  0]\n",
      "(69,) (12,)\n",
      "init state [1 0 1 1 0]\n",
      "(80,) (11,)\n",
      "init state [0 3 2 0 0]\n",
      "(84,) (4,)\n",
      "init state [1 0 1 2 0]\n",
      "(91,) (7,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(97,) (6,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(107,) (10,)\n",
      "============ 84 ===========\n",
      "Run episode 84 with rewards 32, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.0329 if c>=1.0 & x2>=3.0\n",
      "   +0.4097 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1659 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.8571 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.1086 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1103 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.2246 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.5651 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0688 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.2282 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   +0.1458 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0519 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.1193 if c<=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2282 if x3-x1<=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   -0.0551 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   -0.5035 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.3235 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -1.0593 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.4553 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1587 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.2199 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.6586 if c>=1.0 & x2>=1.0\n",
      "   +0.2922 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.3794 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.9280 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0497 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.2127 if x3-x1>=2.0\n",
      "   +0.4100 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.9262 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0881 if x2<=1.0 & x2>=1.0 & x3-x1<=2.0 & x3-x1>=1.0\n",
      "   +0.0000 if x1>=3.0 & x4-x2>=3.0\n",
      "   +0.4574 if x1<=2.0 & x2>=3.0 & x3-x1<=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.5294 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1385 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.3431 if x4-x2>=0.0\n",
      "   -0.4054 if c>=1.0 & x2>=2.0\n",
      "   +0.3650 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.0478 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.1218 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.2048 if x4-x2<=1.0\n",
      "   -0.0453 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.2752 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.1488 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.2333 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.2353 if c<=0.0 & x1<=1.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0644 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   -0.3880 if x1<=2.0 & x4-x2>=2.0\n",
      "----------------- 3 --------------\n",
      "   -0.2074 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5408 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1060 if c>=1.0 & x2<=1.0\n",
      "   -0.1061 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2735 if x2>=2.0 & x3-x1<=1.0\n",
      "   -0.1040 if x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3671 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.3925 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1386 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.4153 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.4569 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.1591 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2306 if x1>=2.0 & x3-x1>=-2.0\n",
      "   -0.2473 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.3731 if x1<=2.0 & x2<=0.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.9463 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "init state [ 3  1 -3 -1  0]\n",
      "(29,) (29,)\n",
      "init state [3 1 0 1 0]\n",
      "(31,) (2,)\n",
      "init state [ 1  3  0 -3  0]\n",
      "(49,) (18,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(62,) (13,)\n",
      "init state [ 3  1 -1  0  0]\n",
      "(71,) (9,)\n",
      "init state [ 0  2  1 -1  0]\n",
      "(85,) (14,)\n",
      "init state [ 2  3 -2 -2  0]\n",
      "(101,) (16,)\n",
      "init state [ 2  3  1 -2  0]\n",
      "(114,) (13,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(126,) (12,)\n",
      "init state [ 3  2 -1  1  0]\n",
      "(132,) (6,)\n",
      "============ 85 ===========\n",
      "Run episode 85 with rewards 36, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.1618 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2271 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.3432 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0945 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1665 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.0955 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.6998 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3033 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.1057 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   -0.4919 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0674 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.0582 if c<=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0907 if x3-x1<=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   -0.3297 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   -0.4116 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.7103 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.2531 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.5837 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3199 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.2170 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.3622 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.6176 if c>=1.0 & x2>=1.0\n",
      "   +0.4444 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1981 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.2903 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2582 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.2077 if x3-x1>=2.0\n",
      "   +0.3966 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1163 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0344 if x2<=1.0 & x2>=1.0 & x3-x1<=2.0 & x3-x1>=1.0\n",
      "   +0.1085 if x1<=2.0 & x2>=3.0 & x3-x1<=-2.0\n",
      "   -0.3107 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.5902 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0238 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.3203 if x4-x2>=0.0\n",
      "   -0.4835 if c>=1.0 & x2>=2.0\n",
      "   +0.4387 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.2033 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.0070 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.0144 if x4-x2<=1.0\n",
      "   -0.0594 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.3707 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.0911 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   -0.1373 if x2>=1.0 & x3-x1<=0.0\n",
      "   -0.1211 if c<=0.0 & x1<=1.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0305 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1549 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.3791 if c<=0.0 & x1<=2.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2>=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.0604 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5506 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0086 if c>=1.0 & x2<=1.0\n",
      "   +0.0243 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.3572 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.1337 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.1526 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.3756 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.5368 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.2275 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.7660 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.3622 if x1>=2.0 & x3-x1>=-2.0\n",
      "   -0.1128 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.1212 if x1<=2.0 & x2<=0.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.3712 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5205 if x1<=0.0 & x4-x2>=-1.0\n",
      "init state [ 3  0 -2  0  0]\n",
      "(19,) (19,)\n",
      "init state [ 1  1 -1  1  0]\n",
      "(27,) (8,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(33,) (6,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(44,) (11,)\n",
      "init state [ 2  1 -2  1  0]\n",
      "(56,) (12,)\n",
      "init state [ 2  1  0 -1  0]\n",
      "(63,) (7,)\n",
      "init state [1 1 0 1 0]\n",
      "(76,) (13,)\n",
      "init state [0 0 1 0 0]\n",
      "(86,) (10,)\n",
      "init state [ 3  2 -3  1  0]\n",
      "(113,) (27,)\n",
      "init state [ 2  3 -2  0  0]\n",
      "(121,) (8,)\n",
      "============ 86 ===========\n",
      "Run episode 86 with rewards 34, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.0181 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0024 if c>=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.3005 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.2622 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0890 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.6015 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.7332 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3297 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.1678 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   -0.3805 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0024 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.2568 if x3-x1<=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.0271 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   -0.4235 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.2722 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.2370 if c<=0.0 & x4-x2<=-1.0\n",
      "----------------- 1 --------------\n",
      "   -0.1414 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.5747 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.2773 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0918 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   -0.0118 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.9049 if c>=1.0 & x2>=1.0\n",
      "   +0.0000 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.7250 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.3666 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2528 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.0000 if x3-x1>=2.0\n",
      "   +0.0475 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2490 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.2148 if x1<=2.0 & x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.3122 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.3179 if x4-x2<=-3.0\n",
      "----------------- 2 --------------\n",
      "   +0.7440 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1962 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.5145 if x4-x2>=0.0\n",
      "   -0.0943 if c>=1.0 & x2>=2.0\n",
      "   +0.4334 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.1290 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.1372 if x4-x2<=1.0\n",
      "   -0.2658 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.0520 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.0424 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   -0.0856 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0694 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.0456 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.1368 if c<=0.0 & x1<=2.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2438 if c>=1.0 & x2>=1.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.2843 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5659 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1847 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.1297 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.2208 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.0048 if x1<=1.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.5777 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3017 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.2416 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.8540 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0197 if x1>=2.0 & x3-x1>=-2.0\n",
      "   -0.1909 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.1739 if x1<=2.0 & x2<=0.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.4010 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0710 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.2789 if x4-x2>=3.0\n",
      "init state [ 2  2  1 -1  0]\n",
      "(12,) (12,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(64,) (52,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(87,) (23,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(170,) (83,)\n",
      "init state [2 0 1 2 0]\n",
      "(192,) (22,)\n",
      "init state [0 0 3 1 0]\n",
      "(204,) (12,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(215,) (11,)\n",
      "init state [ 3  1 -3  2  0]\n",
      "(227,) (12,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(232,) (5,)\n",
      "init state [1 1 2 1 0]\n",
      "(242,) (10,)\n",
      "============ 87 ===========\n",
      "Run episode 87 with rewards 32, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.1187 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1218 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.8917 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4767 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.0140 if c<=0.0 & x3-x1<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.7559 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2395 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.4165 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   -0.1466 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2983 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.3920 if x3-x1<=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   -0.0522 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   -0.2950 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1084 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.1912 if c<=0.0 & x4-x2<=-1.0\n",
      "   +0.7954 if x1>=1.0 & x3-x1>=2.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.1725 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.7009 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.9740 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0165 if c<=0.0 & x1>=3.0 & x2<=2.0\n",
      "   +0.2370 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.5491 if c>=1.0 & x2>=1.0\n",
      "   -0.1155 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.3715 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.6677 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0664 if x1>=3.0 & x4-x2<=0.0\n",
      "   -0.3843 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.8570 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.3328 if x1<=2.0 & x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.2806 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.2729 if x4-x2<=-3.0\n",
      "   -0.6794 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.6599 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1232 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.5341 if x4-x2>=0.0\n",
      "   -0.3230 if c>=1.0 & x2>=2.0\n",
      "   +0.3378 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.1694 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.5505 if x4-x2<=1.0\n",
      "   +0.0078 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.3330 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.3249 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   -0.5346 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.2227 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1372 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.0734 if c<=0.0 & x1<=2.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1565 if c>=1.0 & x2>=1.0 & x4-x2>=0.0\n",
      "   -0.6785 if x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.4153 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4407 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.4711 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.2841 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.4108 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.7539 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2576 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.5735 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.3311 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.2391 if x1>=2.0 & x3-x1>=-2.0\n",
      "   -0.2315 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.0227 if x1<=2.0 & x2<=0.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.3861 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.1621 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.1001 if x4-x2>=3.0\n",
      "   -0.6572 if x2<=2.0 & x3-x1<=-1.0\n",
      "init state [ 2  1  0 -1  0]\n",
      "(8,) (8,)\n",
      "init state [2 0 1 0 0]\n",
      "(39,) (31,)\n",
      "init state [2 2 1 0 0]\n",
      "(49,) (10,)\n",
      "init state [1 0 2 1 0]\n",
      "(61,) (12,)\n",
      "init state [ 2  3  0 -3  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(82,) (21,)\n",
      "init state [ 3  2  0 -2  0]\n",
      "(91,) (9,)\n",
      "init state [ 3  2 -3  0  0]\n",
      "(107,) (16,)\n",
      "init state [ 1  3  0 -3  0]\n",
      "(126,) (19,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(149,) (23,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(174,) (25,)\n",
      "============ 88 ===========\n",
      "Run episode 88 with rewards 17, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.0450 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4791 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.3710 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0387 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.2870 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0260 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.0000 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   +0.1114 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1135 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.0000 if x3-x1<=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.0269 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   -0.4666 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.1374 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.0597 if c<=0.0 & x4-x2<=-1.0\n",
      "   +0.0000 if x1>=1.0 & x3-x1>=2.0 & x4-x2>=2.0\n",
      "   +0.3614 if x1<=2.0 & x2<=2.0 & x3-x1<=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.0237 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.2822 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.4996 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.1675 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.4925 if c>=1.0 & x2>=1.0\n",
      "   +0.0949 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.0322 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.4795 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1856 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.2488 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3658 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1402 if x1<=2.0 & x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.0553 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   -0.0262 if x4-x2<=-3.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.8895 if c<=0.0 & x1<=1.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   +1.0419 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.4047 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.5023 if x4-x2>=0.0\n",
      "   -0.3773 if c>=1.0 & x2>=2.0\n",
      "   +0.6737 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.1265 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.2129 if x4-x2<=1.0\n",
      "   -0.1654 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.0907 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   -0.2410 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.1284 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.0000 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0225 if c>=1.0 & x2>=1.0 & x4-x2>=0.0\n",
      "   -0.1811 if x2<=0.0\n",
      "   -0.0503 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.5076 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.7453 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0473 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0352 if x2>=2.0 & x3-x1<=1.0\n",
      "   -0.0162 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.5426 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3432 if c>=1.0 & x4-x2>=-1.0\n",
      "   -0.1888 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.4430 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1034 if x1>=2.0 & x3-x1>=-2.0\n",
      "   -0.0938 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.2431 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0878 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   -0.3711 if x2<=2.0 & x3-x1<=-1.0\n",
      "   -0.7616 if c<=0.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "init state [ 1  3 -1 -3  0]\n",
      "(19,) (19,)\n",
      "init state [1 2 0 1 0]\n",
      "(41,) (22,)\n",
      "init state [ 3  1 -1  2  0]\n",
      "(80,) (39,)\n",
      "init state [ 1  0 -1  2  0]\n",
      "(124,) (44,)\n",
      "init state [1 2 0 1 0]\n",
      "(205,) (81,)\n",
      "init state [ 2  0 -1  1  0]\n",
      "(239,) (34,)\n",
      "init state [1 0 0 1 0]\n",
      "(256,) (17,)\n",
      "init state [ 1  2 -1  0  0]\n",
      "(264,) (8,)\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(291,) (27,)\n",
      "init state [ 1  2 -1  1  0]\n",
      "(327,) (36,)\n",
      "============ 89 ===========\n",
      "Run episode 89 with rewards 6, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   +0.0367 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5393 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.1979 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.1520 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.6788 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.1490 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.7019 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   -0.7664 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0832 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.1521 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   -0.6003 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1131 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.2739 if c<=0.0 & x4-x2<=-1.0\n",
      "   +0.0000 if x1>=1.0 & x3-x1>=2.0 & x4-x2>=2.0\n",
      "   -0.0027 if x1<=2.0 & x2<=2.0 & x3-x1<=-2.0\n",
      "   -0.1648 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.1224 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0139 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.1659 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0453 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.6432 if c>=1.0 & x2>=1.0\n",
      "   +0.2236 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0295 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.1678 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2335 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.0446 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1458 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0241 if x1<=2.0 & x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.3313 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.1847 if x4-x2<=-3.0\n",
      "   +0.1333 if c<=0.0 & x1<=1.0 & x4-x2>=0.0\n",
      "   -0.4417 if x3-x1<=-1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.5583 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1329 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.8610 if x4-x2>=0.0\n",
      "   -0.1635 if c>=1.0 & x2>=2.0\n",
      "   +0.1591 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.0351 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.1405 if x4-x2<=1.0\n",
      "   -0.3441 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.0878 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.1381 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.2831 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.2004 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.0132 if c>=1.0 & x2>=1.0 & x4-x2>=0.0\n",
      "   -0.1686 if x2<=0.0\n",
      "   -0.1075 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.4948 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.0243 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3899 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.3490 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1923 if x2>=2.0 & x3-x1<=1.0\n",
      "   -0.0551 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.4223 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.1349 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.4803 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.8239 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2722 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.0424 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.0141 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.1897 if x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0130 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.6527 if c<=0.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "   +0.3891 if x2>=2.0 & x3-x1<=-3.0 & x4-x2>=1.0\n",
      "init state [1 0 0 1 0]\n",
      "(9,) (9,)\n",
      "init state [ 3  0 -2  3  0]\n",
      "(18,) (9,)\n",
      "init state [1 1 1 2 0]\n",
      "(22,) (4,)\n",
      "init state [ 3  2 -1 -1  0]\n",
      "(42,) (20,)\n",
      "init state [ 1  3 -1 -2  0]\n",
      "(53,) (11,)\n",
      "init state [0 1 3 1 0]\n",
      "(85,) (32,)\n",
      "init state [1 2 1 0 0]\n",
      "(88,) (3,)\n",
      "init state [0 0 2 3 0]\n",
      "(101,) (13,)\n",
      "init state [0 0 1 1 0]\n",
      "(111,) (10,)\n",
      "init state [1 2 1 1 0]\n",
      "(116,) (5,)\n",
      "============ 90 ===========\n",
      "Run episode 90 with rewards 37, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.0855 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.6446 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0393 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0904 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.5384 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2209 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.0000 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   -0.1118 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0934 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.1091 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   -0.2731 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0484 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.0818 if c<=0.0 & x4-x2<=-1.0\n",
      "   -0.0000 if x1<=2.0 & x2<=2.0 & x3-x1<=-2.0\n",
      "   -0.3196 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.5758 if c<=0.0 & x1<=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   -0.0872 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.5939 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0691 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.4216 if c>=1.0 & x2>=1.0\n",
      "   +0.0688 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.1464 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.5428 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3250 if x1>=3.0 & x4-x2<=0.0\n",
      "   -0.1042 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4742 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1511 if x1<=2.0 & x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.3856 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x4-x2<=-3.0\n",
      "   +0.3529 if c<=0.0 & x1<=1.0 & x4-x2>=0.0\n",
      "   -0.0639 if x3-x1<=-1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.8262 if x1<=2.0 & x2<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.7744 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1914 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.8780 if x4-x2>=0.0\n",
      "   -0.4031 if c>=1.0 & x2>=2.0\n",
      "   +0.0181 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.0000 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.1597 if x4-x2<=1.0\n",
      "   -0.1652 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.1836 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   -0.0106 if x2>=1.0 & x3-x1<=0.0\n",
      "   -0.0695 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1672 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.2001 if x2<=0.0\n",
      "   -0.3015 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.1380 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.1561 if c<=0.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3227 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3655 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1276 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2403 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.0346 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.4522 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.5194 if c>=1.0 & x4-x2>=-1.0\n",
      "   -0.0700 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.6038 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0289 if x1>=2.0 & x3-x1>=-2.0\n",
      "   -0.0638 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.5607 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.1925 if x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0808 if c<=0.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0000 if x2>=2.0 & x3-x1<=-3.0 & x4-x2>=1.0\n",
      "   +0.9060 if x1>=1.0 & x2<=1.0\n",
      "init state [ 0  1  2 -1  0]\n",
      "(11,) (11,)\n",
      "init state [ 1  2 -1  0  0]\n",
      "(36,) (25,)\n",
      "init state [ 2  0 -1  2  0]\n",
      "(45,) (9,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(55,) (10,)\n",
      "init state [ 1  3  2 -1  0]\n",
      "(61,) (6,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(72,) (11,)\n",
      "init state [ 0  2  1 -1  0]\n",
      "(80,) (8,)\n",
      "init state [2 2 1 0 0]\n",
      "(83,) (3,)\n",
      "init state [ 2  1 -2  2  0]\n",
      "(90,) (7,)\n",
      "init state [ 1  3 -1 -1  0]\n",
      "(104,) (14,)\n",
      "============ 91 ===========\n",
      "Run episode 91 with rewards 28, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   +0.3886 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4473 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0277 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.5989 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.8131 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.1003 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.0539 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   +0.0000 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0794 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.2320 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   -0.1446 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.4453 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.2950 if c<=0.0 & x4-x2<=-1.0\n",
      "   +0.0911 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.3629 if c<=0.0 & x1<=0.0\n",
      "   -0.3461 if x1>=3.0 & x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   -0.1644 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.5357 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0603 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.7566 if c>=1.0 & x2>=1.0\n",
      "   +0.0000 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.5100 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.7327 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4108 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3847 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.6068 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0923 if x1<=2.0 & x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.2768 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   -0.0806 if c<=0.0 & x1<=1.0 & x4-x2>=0.0\n",
      "   -0.3209 if x3-x1<=-1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.2618 if x1<=2.0 & x2<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.2027 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.8372 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2438 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.4487 if x4-x2>=0.0\n",
      "   -0.4575 if c>=1.0 & x2>=2.0\n",
      "   +0.3728 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.2940 if x4-x2<=1.0\n",
      "   +0.1653 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.1377 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   -0.3685 if x2>=1.0 & x3-x1<=0.0\n",
      "   -0.2731 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1047 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.2389 if x2<=0.0\n",
      "   -0.3579 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.1689 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0390 if c<=0.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.3759 if c<=0.0 & x2>=2.0 & x3-x1>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3090 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4255 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1122 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2023 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.3456 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.2256 if x1<=2.0 & x4-x2<=0.0\n",
      "   -0.0721 if c>=1.0 & x4-x2>=-1.0\n",
      "   -0.3280 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.0000 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0569 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.2169 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.8505 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.1032 if x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.4740 if c<=0.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "   +0.5012 if x1>=1.0 & x2<=1.0\n",
      "   +0.2666 if x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "init state [1 0 0 2 0]\n",
      "(9,) (9,)\n",
      "init state [0 2 2 0 0]\n",
      "(13,) (4,)\n",
      "init state [ 0  3  0 -1  0]\n",
      "(24,) (11,)\n",
      "init state [ 1  3 -1 -1  0]\n",
      "(41,) (17,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(66,) (25,)\n",
      "init state [3 1 0 1 0]\n",
      "(69,) (3,)\n",
      "init state [2 0 0 2 0]\n",
      "(84,) (15,)\n",
      "init state [0 1 1 0 0]\n",
      "(103,) (19,)\n",
      "init state [1 2 2 0 0]\n",
      "(106,) (3,)\n",
      "init state [ 2  2 -1 -1  0]\n",
      "(124,) (18,)\n",
      "============ 92 ===========\n",
      "Run episode 92 with rewards 24, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   +0.3183 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1186 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.1350 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.3682 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.7726 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.2180 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.0488 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   +0.1736 if x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.1350 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   -0.2893 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.1035 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.1961 if c<=0.0 & x4-x2<=-1.0\n",
      "   -0.1131 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2342 if c<=0.0 & x1<=0.0\n",
      "   +0.1902 if x1>=3.0 & x2>=3.0\n",
      "   -0.1118 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.3098 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.5338 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1975 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.8844 if c>=1.0 & x2>=1.0\n",
      "   -0.2168 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.6229 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0651 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3715 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3944 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.2389 if x1<=2.0 & x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.0881 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.0416 if c<=0.0 & x1<=1.0 & x4-x2>=0.0\n",
      "   +0.0651 if x3-x1<=-1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.2428 if x1<=2.0 & x2<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.2878 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.2241 if x1<=0.0 & x3-x1>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.2873 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2258 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.6045 if x4-x2>=0.0\n",
      "   -0.4465 if c>=1.0 & x2>=2.0\n",
      "   +0.2324 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.2425 if x4-x2<=1.0\n",
      "   -0.1871 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.1432 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.0253 if x2>=1.0 & x3-x1<=0.0\n",
      "   +0.3778 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.0672 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.0972 if x2<=0.0\n",
      "   -0.3114 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3243 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.2389 if c<=0.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   +0.6405 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=1.0 & x4-x2>=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.1032 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.2444 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0391 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2815 if x2>=2.0 & x3-x1<=1.0\n",
      "   -0.1772 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.5043 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.1854 if c>=1.0 & x4-x2>=-1.0\n",
      "   -0.0045 if x2<=1.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.1971 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.2167 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.7836 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.3537 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.3198 if c<=0.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "   +0.2399 if x1>=1.0 & x2<=1.0\n",
      "   +0.2635 if x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.6230 if x1<=0.0 & x2>=3.0\n",
      "init state [0 0 0 3 0]\n",
      "(20,) (20,)\n",
      "init state [ 1  2 -1 -2  0]\n",
      "(206,) (186,)\n",
      "init state [2 0 0 3 0]\n",
      "(214,) (8,)\n",
      "init state [0 1 2 1 0]\n",
      "(227,) (13,)\n",
      "init state [ 1  3  1 -3  0]\n",
      "(324,) (97,)\n",
      "init state [ 3  1 -2  0  0]\n",
      "(343,) (19,)\n",
      "init state [ 1  2  0 -1  0]\n",
      "(364,) (21,)\n",
      "init state [0 0 0 2 0]\n",
      "(371,) (7,)\n",
      "init state [ 3  2 -3  1  0]\n",
      "(386,) (15,)\n",
      "init state [1 0 1 1 0]\n",
      "(435,) (49,)\n",
      "============ 93 ===========\n",
      "Run episode 93 with rewards -7, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   +0.6677 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4243 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.3962 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.6403 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.3424 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.4346 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.0998 if x1>=3.0 & x3-x1<=-2.0\n",
      "   -1.2427 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   -0.0109 if x1>=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.3385 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -1.4740 if c<=0.0 & x4-x2<=-1.0\n",
      "   +0.9753 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.8700 if c<=0.0 & x1<=0.0\n",
      "   +0.2941 if x1>=3.0 & x2>=3.0\n",
      "   +0.5323 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -1.5422 if c<=0.0 & x1>=1.0 & x2>=1.0 & x4-x2<=-3.0\n",
      "----------------- 1 --------------\n",
      "   +0.3688 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1140 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0022 if x2>=1.0 & x3-x1<=0.0\n",
      "   +1.3075 if c>=1.0 & x2>=1.0\n",
      "   -0.6957 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.0465 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2458 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.1832 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1464 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1800 if x1<=2.0 & x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.3092 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   -0.7396 if x3-x1<=-1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.3351 if x1<=2.0 & x2<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +1.6397 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +1.2396 if x1<=0.0 & x3-x1>=2.0\n",
      "   -0.4508 if x3-x1>=0.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.6693 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3242 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -2.4130 if x4-x2>=0.0\n",
      "   -0.6248 if c>=1.0 & x2>=2.0\n",
      "   +1.9345 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +1.0976 if x4-x2<=1.0\n",
      "   -0.3890 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +1.2069 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.6746 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.0680 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.0043 if x2<=0.0\n",
      "   -0.7274 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.4740 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +1.1433 if c<=0.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   -1.8578 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   +4.2414 if c<=0.0 & x4-x2<=-3.0\n",
      "----------------- 3 --------------\n",
      "   +0.1338 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5062 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0502 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2504 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.4933 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -1.4368 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.1536 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.4293 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.0196 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.8921 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.6404 if x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.9066 if c<=0.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "   +0.0521 if x1>=1.0 & x2<=1.0\n",
      "   +1.1068 if x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.7614 if x1<=0.0 & x2>=3.0\n",
      "   +0.4908 if x1>=2.0 & x4-x2>=2.0\n",
      "init state [0 1 1 2 0]\n",
      "(11,) (11,)\n",
      "init state [0 1 0 1 0]\n",
      "(46,) (35,)\n",
      "init state [2 2 1 0 0]\n",
      "(61,) (15,)\n",
      "init state [ 1  3  0 -3  0]\n",
      "(79,) (18,)\n",
      "init state [ 3  1 -2  1  0]\n",
      "(91,) (12,)\n",
      "init state [0 0 0 2 0]\n",
      "(115,) (24,)\n",
      "init state [1 1 1 2 0]\n",
      "(128,) (13,)\n",
      "init state [ 3  0 -2  1  0]\n",
      "(183,) (55,)\n",
      "init state [ 1  3  1 -2  0]\n",
      "(192,) (9,)\n",
      "init state [ 1  3  0 -2  0]\n",
      "(202,) (10,)\n",
      "============ 94 ===========\n",
      "Run episode 94 with rewards 32, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   +0.0594 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3350 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.2635 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.2755 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.9159 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.3039 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.0699 if x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.1529 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   -0.1835 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.0363 if c<=0.0 & x4-x2<=-1.0\n",
      "   -0.2416 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0546 if c<=0.0 & x1<=0.0\n",
      "   -0.1291 if x1>=3.0 & x2>=3.0\n",
      "   +0.2277 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.0000 if c<=0.0 & x1>=1.0 & x2>=1.0 & x4-x2<=-3.0\n",
      "   -0.4896 if x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.2597 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0197 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.7882 if c>=1.0 & x2>=1.0\n",
      "   -0.4931 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.2662 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1392 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.1496 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2885 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0040 if x1<=2.0 & x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.5258 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.2101 if x3-x1<=-1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.3360 if x1<=2.0 & x2<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.4771 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0000 if x1<=0.0 & x3-x1>=2.0\n",
      "   +0.5191 if x3-x1>=0.0 & x4-x2>=2.0\n",
      "   +0.8644 if x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.9109 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1109 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.8034 if x4-x2>=0.0\n",
      "   -0.2244 if c>=1.0 & x2>=2.0\n",
      "   +0.9302 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.4751 if x4-x2<=1.0\n",
      "   -0.0863 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.0853 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.5703 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1297 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.1327 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3132 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.4370 if c<=0.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   -0.6131 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   +0.0467 if c<=0.0 & x4-x2<=-3.0\n",
      "   +0.0596 if x3-x1>=1.0 & x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.2258 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5326 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0559 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0909 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.4655 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.7681 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.5558 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.1756 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.4405 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0966 if x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.4156 if c<=0.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "   +0.3698 if x1>=1.0 & x2<=1.0\n",
      "   -0.0808 if x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0222 if x1<=0.0 & x2>=3.0\n",
      "   +0.5569 if x1>=2.0 & x4-x2>=2.0\n",
      "   +0.5901 if x1<=2.0 & x2>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "init state [0 2 2 0 0]\n",
      "(20,) (20,)\n",
      "init state [1 0 1 3 0]\n",
      "(38,) (18,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(53,) (15,)\n",
      "init state [0 2 0 1 0]\n",
      "(60,) (7,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(79,) (19,)\n",
      "init state [ 3  1 -1  0  0]\n",
      "(103,) (24,)\n",
      "init state [1 1 2 0 0]\n",
      "(112,) (9,)\n",
      "init state [1 1 2 1 0]\n",
      "(116,) (4,)\n",
      "init state [0 0 1 1 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(131,) (15,)\n",
      "init state [ 2  0 -2  0  0]\n",
      "(176,) (45,)\n",
      "============ 95 ===========\n",
      "Run episode 95 with rewards -3, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.2787 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3030 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1500 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1305 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.8666 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0126 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.1300 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.1367 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   +0.0500 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4286 if c<=0.0 & x4-x2<=-1.0\n",
      "   +0.1617 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.4322 if c<=0.0 & x1<=0.0\n",
      "   -0.0755 if x1>=3.0 & x2>=3.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.2277 if x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.5001 if x1>=2.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.0240 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1697 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.4518 if c>=1.0 & x2>=1.0\n",
      "   -0.6159 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.1013 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1503 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.1913 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2967 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0018 if x1<=2.0 & x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.2635 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.4232 if x3-x1<=-1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.2657 if x1<=2.0 & x2<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.1345 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1808 if x3-x1>=0.0 & x4-x2>=2.0\n",
      "   -0.3243 if x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.7997 if x1>=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.2382 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2876 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.6755 if x4-x2>=0.0\n",
      "   -0.3789 if c>=1.0 & x2>=2.0\n",
      "   +0.5398 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.3347 if x4-x2<=1.0\n",
      "   -0.5030 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.1592 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.0647 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.0794 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.0017 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3004 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0718 if c<=0.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   -0.1593 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2<=-2.0\n",
      "   +0.6524 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.5841 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5168 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1887 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0415 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.0642 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.6794 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.7135 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.1966 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.5490 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.3221 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.1648 if c<=0.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "   +0.1735 if x1>=1.0 & x2<=1.0\n",
      "   -0.1683 if x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.2005 if x1>=2.0 & x4-x2>=2.0\n",
      "   +0.3337 if x1<=2.0 & x2>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4675 if c<=0.0 & x3-x1>=2.0\n",
      "init state [3 0 0 1 0]\n",
      "(5,) (5,)\n",
      "init state [1 1 2 1 0]\n",
      "(11,) (6,)\n",
      "init state [0 0 3 1 0]\n",
      "(19,) (8,)\n",
      "init state [1 1 2 1 0]\n",
      "(23,) (4,)\n",
      "init state [1 1 1 2 0]\n",
      "(32,) (9,)\n",
      "init state [ 2  0 -1  0  0]\n",
      "(42,) (10,)\n",
      "init state [ 0  3  1 -3  0]\n",
      "(61,) (19,)\n",
      "init state [2 1 1 1 0]\n",
      "(66,) (5,)\n",
      "init state [ 1  3  1 -1  0]\n",
      "(70,) (4,)\n",
      "init state [0 0 2 2 0]\n",
      "(82,) (12,)\n",
      "============ 96 ===========\n",
      "Run episode 96 with rewards 30, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   +0.0000 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0385 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.1703 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4952 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.4538 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0730 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.0577 if x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.0751 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   -0.0550 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.1290 if c<=0.0 & x4-x2<=-1.0\n",
      "   -0.1102 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.3108 if c<=0.0 & x1<=0.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0\n",
      "   +0.0381 if x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.1925 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.5918 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.1436 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1284 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.4444 if c>=1.0 & x2>=1.0\n",
      "   +0.3208 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.5918 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3139 if x1>=3.0 & x4-x2<=0.0\n",
      "   -0.0934 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.6194 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.3369 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   -0.0686 if x3-x1<=-1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=-1.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.2003 if x1<=2.0 & x2<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.3439 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1293 if x3-x1>=0.0 & x4-x2>=2.0\n",
      "   +0.0969 if x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.3957 if x1>=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   -0.5583 if x1>=3.0 & x2<=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.4647 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1157 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.8608 if x4-x2>=0.0\n",
      "   -0.2168 if c>=1.0 & x2>=2.0\n",
      "   +0.6682 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.1607 if x4-x2<=1.0\n",
      "   -0.7469 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.2208 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.2340 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.2123 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.3316 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.0580 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0457 if c<=0.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   +0.0655 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.2208 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.3626 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.4918 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5107 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0654 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2781 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.4765 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.6420 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.4428 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.5346 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0769 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.3439 if c<=0.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "   +0.2922 if x1>=1.0 & x2<=1.0\n",
      "   -0.3776 if x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.2745 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.0080 if x1<=2.0 & x2>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4197 if c<=0.0 & x3-x1>=2.0\n",
      "   -0.8193 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n",
      "init state [ 1  2  1 -2  0]\n",
      "(23,) (23,)\n",
      "init state [0 0 2 0 0]\n",
      "(47,) (24,)\n",
      "init state [0 2 2 0 0]\n",
      "(51,) (4,)\n",
      "init state [3 1 0 1 0]\n",
      "(53,) (2,)\n",
      "init state [ 3  0 -1  1  0]\n",
      "(60,) (7,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(71,) (11,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(77,) (6,)\n",
      "init state [ 3  2 -1  0  0]\n",
      "(81,) (4,)\n",
      "init state [ 3  1 -1 -1  0]\n",
      "(112,) (31,)\n",
      "init state [ 1  3  0 -2  0]\n",
      "(122,) (10,)\n",
      "============ 97 ===========\n",
      "Run episode 97 with rewards 32, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.1014 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.6695 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0144 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.5135 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.2344 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0900 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.0000 if x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.1487 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   -0.1589 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.1358 if c<=0.0 & x4-x2<=-1.0\n",
      "   +0.1715 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1301 if c<=0.0 & x1<=0.0\n",
      "   -0.0177 if x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0235 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.2196 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.1275 if c<=0.0 & x1>=1.0 & x2>=1.0 & x2>=3.0 & x3-x1<=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.1138 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0042 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.9543 if c>=1.0 & x2>=1.0\n",
      "   -0.1722 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.6257 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0146 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3230 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.7189 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.3259 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.1205 if x1<=2.0 & x2<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.0794 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0000 if x3-x1>=0.0 & x4-x2>=2.0\n",
      "   -0.1362 if x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.1930 if x1>=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   -0.2514 if x1>=3.0 & x2<=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.5321 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.6846 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3971 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.2765 if x4-x2>=0.0\n",
      "   -0.2458 if c>=1.0 & x2>=2.0\n",
      "   +0.5968 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.1980 if x4-x2<=1.0\n",
      "   -0.0134 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.1941 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.0330 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.0000 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.4347 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   +0.0663 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3472 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.0211 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.2283 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.2613 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.2399 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4238 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1919 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0675 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.4216 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3153 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.5980 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.4626 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.2214 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0382 if c<=0.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "   +0.2679 if x1>=1.0 & x2<=1.0\n",
      "   -0.2292 if x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.1227 if c<=0.0 & x3-x1>=2.0\n",
      "   -0.4894 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n",
      "   +0.2225 if x4-x2<=-1.0\n",
      "init state [0 1 2 1 0]\n",
      "(9,) (9,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(14,) (5,)\n",
      "init state [2 1 1 0 0]\n",
      "(29,) (15,)\n",
      "init state [ 2  1 -1  2  0]\n",
      "(38,) (9,)\n",
      "init state [ 1  0 -1  1  0]\n",
      "(61,) (23,)\n",
      "init state [ 2  0 -2  1  0]\n",
      "(93,) (32,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(105,) (12,)\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(127,) (22,)\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(225,) (98,)\n",
      "init state [ 2  1  0 -1  0]\n",
      "(238,) (13,)\n",
      "============ 98 ===========\n",
      "Run episode 98 with rewards 29, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   +0.0633 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0344 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.4954 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.5704 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.8627 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0834 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.0295 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   -0.4322 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.2217 if c<=0.0 & x4-x2<=-1.0\n",
      "   +0.2966 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2294 if c<=0.0 & x1<=0.0\n",
      "   +0.1205 if x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.1735 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.6427 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.3071 if c<=0.0 & x1>=1.0 & x2>=1.0 & x2>=3.0 & x3-x1<=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.0853 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.1185 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3517 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.9647 if c>=1.0 & x2>=1.0\n",
      "   -0.4597 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.3472 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2750 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.2912 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.5062 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.6098 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   -0.4013 if x1<=2.0 & x2<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.1059 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0553 if x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.3068 if x1>=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   +0.0000 if x1>=3.0 & x2<=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1405 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   -0.4103 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.2920 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2563 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.1572 if x4-x2>=0.0\n",
      "   -0.5010 if c>=1.0 & x2>=2.0\n",
      "   +0.7806 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.1004 if x4-x2<=1.0\n",
      "   -0.1522 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.1059 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.2499 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3616 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.2044 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0183 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.0714 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0548 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1922 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.3500 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3214 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3957 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.4740 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.2827 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.4708 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.0653 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.7072 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.6430 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5077 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.2635 if c<=0.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "   +0.3619 if x1>=1.0 & x2<=1.0\n",
      "   -0.2383 if x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3541 if c<=0.0 & x3-x1>=2.0\n",
      "   +0.0284 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n",
      "   +0.4317 if x4-x2<=-1.0\n",
      "   +0.4988 if x3-x1<=1.0 & x4-x2>=2.0\n",
      "init state [0 0 0 3 0]\n",
      "(23,) (23,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(39,) (16,)\n",
      "init state [ 1  2 -1 -1  0]\n",
      "(51,) (12,)\n",
      "init state [ 2  0 -1  2  0]\n",
      "(57,) (6,)\n",
      "init state [ 3  0 -1  0  0]\n",
      "(70,) (13,)\n",
      "init state [ 0  3  1 -3  0]\n",
      "(84,) (14,)\n",
      "init state [1 2 0 1 0]\n",
      "(104,) (20,)\n",
      "init state [ 0  3  1 -3  0]\n",
      "(145,) (41,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(170,) (25,)\n",
      "init state [ 0  2  2 -2  0]\n",
      "(183,) (13,)\n",
      "============ 99 ===========\n",
      "Run episode 99 with rewards 29, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.0418 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5075 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0790 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1714 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.7871 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0673 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.4517 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.0143 if c<=0.0 & x4-x2<=-1.0\n",
      "   +0.2934 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.4089 if c<=0.0 & x1<=0.0\n",
      "   +0.3055 if x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0584 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1284 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.0612 if c<=0.0 & x1>=1.0 & x2>=1.0 & x2>=3.0 & x3-x1<=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.1745 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   -0.4794 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.4680 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1641 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +1.2801 if c>=1.0 & x2>=1.0\n",
      "   -0.5491 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.2462 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0168 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3704 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1133 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.6073 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.1401 if x1<=2.0 & x2<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.1691 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0000 if x1>=2.0 & x2<=1.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0413 if x1>=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   -0.1556 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.1139 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.7735 if x1<=2.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.5962 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1691 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.0925 if x4-x2>=0.0\n",
      "   -0.4702 if c>=1.0 & x2>=2.0\n",
      "   +0.6253 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.3270 if x4-x2<=1.0\n",
      "   -0.4355 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.2797 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   -0.1997 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.5447 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.2394 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.3635 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.4565 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.1771 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.7183 if x1>=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.0549 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.2979 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0446 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.1828 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.6007 if x1<=2.0 & x4-x2<=0.0\n",
      "   -0.0054 if c>=1.0 & x4-x2>=-1.0\n",
      "   +0.7286 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.7238 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0880 if x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.4005 if c<=0.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "   +0.2371 if x1>=1.0 & x2<=1.0\n",
      "   -0.2737 if x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3055 if c<=0.0 & x3-x1>=2.0\n",
      "   +0.2437 if x4-x2<=-1.0\n",
      "   -0.0832 if x3-x1<=1.0 & x4-x2>=2.0\n",
      "   +0.5415 if x1>=3.0 & x4-x2>=0.0\n",
      "init state [ 1  1 -1  1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(12,) (12,)\n",
      "init state [0 2 2 1 0]\n",
      "(31,) (19,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(37,) (6,)\n",
      "init state [1 1 0 2 0]\n",
      "(47,) (10,)\n",
      "init state [ 3  2 -3  1  0]\n",
      "(55,) (8,)\n",
      "init state [2 0 1 2 0]\n",
      "(67,) (12,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(76,) (9,)\n",
      "init state [ 2  3 -2 -1  0]\n",
      "(104,) (28,)\n",
      "init state [ 1  3  2 -3  0]\n",
      "(118,) (14,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(131,) (13,)\n",
      "============ 100 ===========\n",
      "Run episode 100 with rewards 29, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   +0.2137 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.6112 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.2373 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.6009 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.8375 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3600 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.2645 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.5023 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2305 if c<=0.0 & x1<=0.0\n",
      "   +0.0864 if x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.0945 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.0000 if c<=0.0 & x1>=1.0 & x2>=1.0 & x2>=3.0 & x3-x1<=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.1090 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   -0.4791 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.2440 if x3-x1<=-3.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.4181 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3840 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +1.0697 if c>=1.0 & x2>=1.0\n",
      "   -0.3673 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.2524 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2689 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.0739 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.5619 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.6319 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   -0.0776 if x1<=2.0 & x2<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.2166 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0763 if x1>=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   +0.0298 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.2113 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.7785 if x1<=2.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.4620 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.5513 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1986 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.5108 if x4-x2>=0.0\n",
      "   -0.4094 if c>=1.0 & x2>=2.0\n",
      "   +0.5442 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.4512 if x4-x2<=1.0\n",
      "   -0.0301 if c<=0.0 & x1>=2.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.5142 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   -0.2856 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3815 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.2520 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0514 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.3094 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.4243 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.0551 if x1>=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.5766 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3063 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3389 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1132 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.2419 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.4776 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2303 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.4217 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2559 if x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.5202 if c<=0.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "   +0.2229 if x1>=1.0 & x2<=1.0\n",
      "   +0.0502 if x1<=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1433 if c<=0.0 & x3-x1>=2.0\n",
      "   +0.2546 if x4-x2<=-1.0\n",
      "   +0.3055 if x3-x1<=1.0 & x4-x2>=2.0\n",
      "   +0.3003 if x1>=3.0 & x4-x2>=0.0\n",
      "   +0.9046 if x2>=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "init state [ 1  3 -1  0  0]\n",
      "(5,) (5,)\n",
      "init state [ 1  3  1 -1  0]\n",
      "(12,) (7,)\n",
      "init state [ 0  3  0 -1  0]\n",
      "(19,) (7,)\n",
      "init state [ 0  3  2 -2  0]\n",
      "(29,) (10,)\n",
      "init state [ 1  0 -1  3  0]\n",
      "(51,) (22,)\n",
      "init state [ 1  1 -1  0  0]\n",
      "(64,) (13,)\n",
      "init state [ 0  1  0 -1  0]\n",
      "(83,) (19,)\n",
      "init state [ 3  2 -1  1  0]\n",
      "(86,) (3,)\n",
      "init state [1 0 1 1 0]\n",
      "(105,) (19,)\n",
      "init state [1 0 2 1 0]\n",
      "(144,) (39,)\n",
      "============ 101 ===========\n",
      "Run episode 101 with rewards 3, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   +0.2564 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2976 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.2498 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0641 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.8274 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2671 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.2401 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.4837 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2468 if c<=0.0 & x1<=0.0\n",
      "   +0.0800 if x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.1797 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0404 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.2196 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   -0.0469 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x3-x1<=-3.0 & x4-x2>=1.0\n",
      "   -0.3612 if x3-x1<=-1.0 & x4-x2<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.0800 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1570 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.8335 if c>=1.0 & x2>=1.0\n",
      "   -0.0688 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.1677 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1730 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.1773 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.6295 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.4329 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   -0.2124 if x1<=2.0 & x2<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.3556 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0204 if x1>=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   +0.0000 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.1445 if x1<=2.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0227 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.3328 if x2<=2.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.4663 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2087 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.5364 if x4-x2>=0.0\n",
      "   -0.2110 if c>=1.0 & x2>=2.0\n",
      "   +0.2754 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.0523 if x4-x2<=1.0\n",
      "   +0.2212 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   -0.1091 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3884 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3371 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.1139 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1712 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1078 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1>=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.4294 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.0882 if c<=0.0 & x1<=0.0 & x2<=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.6762 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5179 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0897 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.2046 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.4160 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.4867 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.7014 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.1660 if x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.4265 if c<=0.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "   +0.0640 if x1>=1.0 & x2<=1.0\n",
      "   -0.0150 if c<=0.0 & x3-x1>=2.0\n",
      "   -0.1205 if x4-x2<=-1.0\n",
      "   +0.1734 if x3-x1<=1.0 & x4-x2>=2.0\n",
      "   +0.3072 if x1>=3.0 & x4-x2>=0.0\n",
      "   +0.3840 if x2>=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.3462 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "init state [ 3  2  0 -2  0]\n",
      "(35,) (35,)\n",
      "init state [1 2 0 1 0]\n",
      "(44,) (9,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(54,) (10,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(81,) (27,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(111,) (30,)\n",
      "init state [ 0  3  1 -1  0]\n",
      "(133,) (22,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(162,) (29,)\n",
      "init state [1 3 1 0 0]\n",
      "(165,) (3,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(168,) (3,)\n",
      "init state [0 1 2 2 0]\n",
      "(182,) (14,)\n",
      "============ 102 ===========\n",
      "Run episode 102 with rewards 28, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.0682 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0026 if c<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0307 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0508 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.4631 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0852 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.1736 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.3514 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.5724 if c<=0.0 & x1<=0.0\n",
      "   -0.1879 if x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.6355 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.2436 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.0210 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   -0.0513 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.0836 if x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.2392 if x3-x1>=3.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   -0.0080 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1419 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.9641 if c>=1.0 & x2>=1.0\n",
      "   +0.0248 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.1146 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2197 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3826 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0498 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.3670 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.0548 if x1<=2.0 & x2<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   +0.1205 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0910 if x1>=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   -0.1419 if x1<=2.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1288 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.2079 if x2<=2.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.2583 if x2<=0.0 & x3-x1<=2.0 & x3-x1>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.6527 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2168 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.2493 if x4-x2>=0.0\n",
      "   -0.2983 if c>=1.0 & x2>=2.0\n",
      "   +0.2514 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.0083 if x4-x2<=1.0\n",
      "   -0.3345 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.1071 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1387 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.1816 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2371 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0928 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1566 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.4401 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.1234 if c<=0.0 & x1<=0.0 & x2<=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.5134 if x2>=3.0 & x3-x1>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.8149 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5593 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.5803 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.3236 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.1612 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2215 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.2140 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.1731 if x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0288 if c<=0.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "   +0.1761 if x1>=1.0 & x2<=1.0\n",
      "   -0.1972 if x4-x2<=-1.0\n",
      "   +0.7353 if x3-x1<=1.0 & x4-x2>=2.0\n",
      "   +0.0812 if x1>=3.0 & x4-x2>=0.0\n",
      "   +0.4492 if x2>=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.3173 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   -0.1119 if c>=1.0 & x4-x2>=1.0\n",
      "init state [ 2  1 -1 -1  0]\n",
      "(24,) (24,)\n",
      "init state [ 3  1 -2  1  0]\n",
      "(41,) (17,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(53,) (12,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(67,) (14,)\n",
      "init state [ 1  0 -1  3  0]\n",
      "(81,) (14,)\n",
      "init state [0 2 0 1 0]\n",
      "(94,) (13,)\n",
      "init state [ 3  0 -1  1  0]\n",
      "(115,) (21,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(132,) (17,)\n",
      "init state [ 1  3  0 -3  0]\n",
      "(153,) (21,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(171,) (18,)\n",
      "============ 103 ===========\n",
      "Run episode 103 with rewards 24, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.0979 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2972 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.2921 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.7149 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.1047 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.0792 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.1337 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.6015 if c<=0.0 & x1<=0.0\n",
      "   +0.0017 if x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0520 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.2855 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.0905 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   -0.0631 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0025 if x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.0280 if x3-x1>=3.0\n",
      "   -0.7467 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.3407 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.9076 if c>=1.0 & x2>=1.0\n",
      "   -0.4684 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.9197 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1457 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4127 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3318 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.2002 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.0095 if x1<=2.0 & x2<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.2545 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.4891 if x1>=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   +0.0000 if x1<=2.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1445 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.2510 if x2<=2.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.1576 if x2<=0.0 & x3-x1<=2.0 & x3-x1>=-2.0\n",
      "   +0.2649 if x1<=0.0 & x4-x2>=3.0\n",
      "----------------- 2 --------------\n",
      "   +0.4871 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2490 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.3208 if x4-x2>=0.0\n",
      "   -0.1867 if c>=1.0 & x2>=2.0\n",
      "   +0.5244 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.1850 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.0607 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1839 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   +0.0480 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2333 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.2596 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.0058 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.4392 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.4452 if c<=0.0 & x1<=0.0 & x2<=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.2058 if x2>=3.0 & x3-x1>=1.0\n",
      "   +0.4759 if x1>=1.0 & x2<=0.0 & x3-x1<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.5845 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.6731 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0468 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.4048 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.2347 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.1675 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.2635 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0375 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.3278 if x1>=1.0 & x2<=1.0\n",
      "   -0.0119 if x4-x2<=-1.0\n",
      "   +0.5723 if x3-x1<=1.0 & x4-x2>=2.0\n",
      "   -0.1568 if x1>=3.0 & x4-x2>=0.0\n",
      "   +0.3389 if x2>=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0300 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.1726 if c>=1.0 & x4-x2>=1.0\n",
      "   -0.2489 if x4-x2>=3.0\n",
      "init state [ 1  2 -1  0  0]\n",
      "(8,) (8,)\n",
      "init state [ 2  2 -2  0  0]\n",
      "(46,) (38,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(49,) (3,)\n",
      "init state [ 1  3  2 -1  0]\n",
      "(54,) (5,)\n",
      "init state [ 1  3  0 -3  0]\n",
      "(70,) (16,)\n",
      "init state [ 1  3 -1 -2  0]\n",
      "(128,) (58,)\n",
      "init state [ 1  1 -1  2  0]\n",
      "(147,) (19,)\n",
      "init state [ 1  3  2 -3  0]\n",
      "(157,) (10,)\n",
      "init state [ 0  2  2 -1  0]\n",
      "(168,) (11,)\n",
      "init state [2 0 1 2 0]\n",
      "(186,) (18,)\n",
      "============ 104 ===========\n",
      "Run episode 104 with rewards 24, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.0125 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0774 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1051 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +1.0973 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0923 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.4204 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.8140 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0059 if c<=0.0 & x1<=0.0\n",
      "   +0.0203 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0123 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.2132 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   -0.7106 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.4078 if x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.0000 if x3-x1>=3.0\n",
      "   +0.7048 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.8201 if x3-x1>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.2750 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.7750 if c>=1.0 & x2>=1.0\n",
      "   -0.1111 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.5037 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2105 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5724 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3429 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.5284 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   -0.0104 if x1<=2.0 & x2<=1.0 & x2<=2.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.2811 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1681 if x1>=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   -0.0538 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.0297 if x2<=2.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   -0.0432 if x2<=0.0 & x3-x1<=2.0 & x3-x1>=-2.0\n",
      "   +0.3602 if x1<=0.0 & x4-x2>=3.0\n",
      "   +0.5311 if x2<=1.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.4715 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3061 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.3830 if x4-x2>=0.0\n",
      "   -0.3809 if c>=1.0 & x2>=2.0\n",
      "   +0.8041 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.2304 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.4137 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1769 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.2276 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.1350 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.3590 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.5641 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x2<=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.3541 if x2>=3.0 & x3-x1>=1.0\n",
      "   +0.2871 if x1>=1.0 & x2<=0.0 & x3-x1<=1.0\n",
      "   -0.8664 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.6568 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.6914 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0370 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.2656 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.5460 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.1976 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.0897 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0423 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.2949 if x1>=1.0 & x2<=1.0\n",
      "   +0.2171 if x3-x1<=1.0 & x4-x2>=2.0\n",
      "   -0.0754 if x1>=3.0 & x4-x2>=0.0\n",
      "   +0.0232 if x2>=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.4874 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.1080 if c>=1.0 & x4-x2>=1.0\n",
      "   -0.1062 if x4-x2>=3.0\n",
      "   +0.6785 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "init state [1 0 1 2 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(9,) (9,)\n",
      "init state [1 2 2 0 0]\n",
      "(25,) (16,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(40,) (15,)\n",
      "init state [ 1  1 -1  0  0]\n",
      "(52,) (12,)\n",
      "init state [0 2 3 0 0]\n",
      "(67,) (15,)\n",
      "init state [ 2  2  0 -2  0]\n",
      "(82,) (15,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(92,) (10,)\n",
      "init state [ 0  2  3 -1  0]\n",
      "(105,) (13,)\n",
      "init state [ 2  3 -1 -2  0]\n",
      "(118,) (13,)\n",
      "init state [ 1  0 -1  0  0]\n",
      "(133,) (15,)\n",
      "============ 105 ===========\n",
      "Run episode 105 with rewards 27, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   +0.3900 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5840 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0405 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.5093 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3684 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.2274 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.3583 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.3232 if c<=0.0 & x1<=0.0\n",
      "   -0.0740 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0479 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.0228 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   -0.0191 if x2>=1.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0699 if x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.0321 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2653 if x3-x1>=1.0\n",
      "   -0.5905 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.1326 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.2741 if c>=1.0 & x2>=1.0\n",
      "   +0.0138 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.0533 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3315 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.0616 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4938 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1029 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.2028 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0864 if x1>=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   +0.4128 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.1394 if x2<=2.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   -0.3728 if x2<=0.0 & x3-x1<=2.0 & x3-x1>=-2.0\n",
      "   +0.0000 if x1<=0.0 & x4-x2>=3.0\n",
      "   -0.2038 if x2<=1.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.3683 if c>=1.0 & x3-x1<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.5226 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2013 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.7264 if x4-x2>=0.0\n",
      "   -0.1766 if c>=1.0 & x2>=2.0\n",
      "   +0.2116 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.0640 if x1<=2.0 & x2>=1.0 & x3-x1<=1.0\n",
      "   +0.5067 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.0701 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3159 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.4328 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.3279 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.1543 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.1370 if x2>=3.0 & x3-x1>=1.0\n",
      "   +0.1148 if x1>=1.0 & x2<=0.0 & x3-x1<=1.0\n",
      "   -0.1110 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.6846 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.7233 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.6725 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1364 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.4388 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.5311 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3866 if x1>=2.0 & x3-x1>=-2.0\n",
      "   -0.3046 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0111 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.4609 if x1>=1.0 & x2<=1.0\n",
      "   +0.1603 if x3-x1<=1.0 & x4-x2>=2.0\n",
      "   +0.1117 if x1>=3.0 & x4-x2>=0.0\n",
      "   -0.3590 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.1110 if c>=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +0.7854 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.3038 if x2>=1.0 & x3-x1>=1.0\n",
      "init state [ 2  2 -2 -1  0]\n",
      "(18,) (18,)\n",
      "init state [ 1  3  1 -1  0]\n",
      "(34,) (16,)\n",
      "init state [0 1 2 0 0]\n",
      "(40,) (6,)\n",
      "init state [ 2  2 -1 -2  0]\n",
      "(57,) (17,)\n",
      "init state [ 2  2 -1  1  0]\n",
      "(67,) (10,)\n",
      "init state [ 0  3  0 -1  0]\n",
      "(76,) (9,)\n",
      "init state [0 0 3 1 0]\n",
      "(85,) (9,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(94,) (9,)\n",
      "init state [ 3  0 -1  2  0]\n",
      "(99,) (5,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(115,) (16,)\n",
      "============ 106 ===========\n",
      "Run episode 106 with rewards 26, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.0265 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2636 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0168 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.7326 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3221 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.1637 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.1943 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0738 if c<=0.0 & x1<=0.0\n",
      "   -0.1189 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.0798 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   +0.0814 if x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.3807 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3642 if x3-x1>=1.0\n",
      "   -0.0584 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3225 if c<=0.0 & x1>=3.0 & x2<=1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.4297 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.1642 if c>=1.0 & x2>=1.0\n",
      "   -0.0050 if x2<=2.0 & x3-x1<=-1.0\n",
      "   +0.8209 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.7985 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.6030 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.7345 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0289 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   -0.0502 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.4123 if x1>=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   +0.2416 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.0825 if x2<=2.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.2171 if x2<=0.0 & x3-x1<=2.0 & x3-x1>=-2.0\n",
      "   -0.1265 if x2<=1.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.1564 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.1931 if c<=0.0 & x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.8376 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2705 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.6604 if x4-x2>=0.0\n",
      "   +0.0275 if c>=1.0 & x2>=2.0\n",
      "   +0.0525 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.1944 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.0299 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   +0.1493 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.1383 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1920 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.0288 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.1977 if x2>=3.0 & x3-x1>=1.0\n",
      "   +0.1728 if x1>=1.0 & x2<=0.0 & x3-x1<=1.0\n",
      "   -0.0336 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1156 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2634 if x2>=3.0 & x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.7537 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5755 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0063 if x1<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2019 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.7446 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2292 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.3594 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.2152 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.3575 if x1>=1.0 & x2<=1.0\n",
      "   +0.0090 if x3-x1<=1.0 & x4-x2>=2.0\n",
      "   -0.0421 if x1>=3.0 & x4-x2>=0.0\n",
      "   -0.1337 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.2682 if c>=1.0 & x4-x2>=1.0\n",
      "   +0.8204 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.4393 if x2>=1.0 & x3-x1>=1.0\n",
      "   +0.5101 if c<=0.0 & x1>=3.0 & x2<=1.0\n",
      "init state [1 3 1 0 0]\n",
      "(3,) (3,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(17,) (14,)\n",
      "init state [0 0 2 0 0]\n",
      "(25,) (8,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(32,) (7,)\n",
      "init state [3 0 0 1 0]\n",
      "(35,) (3,)\n",
      "init state [ 3  1 -2  0  0]\n",
      "(49,) (14,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(78,) (29,)\n",
      "init state [ 3  2 -3 -2  0]\n",
      "(91,) (13,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(97,) (6,)\n",
      "init state [0 0 0 1 0]\n",
      "(113,) (16,)\n",
      "============ 107 ===========\n",
      "Run episode 107 with rewards 26, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   +0.0859 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.6647 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.3618 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.5927 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0688 if c<=0.0 & x3-x1>=-2.0\n",
      "   -0.0045 if c<=0.0 & x1<=2.0 & x2<=1.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.2150 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2693 if c<=0.0 & x1<=0.0\n",
      "   -0.2995 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.3383 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   +0.0080 if x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.2243 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4594 if x3-x1>=1.0\n",
      "   -0.0720 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0884 if c<=0.0 & x1>=3.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2477 if x1<=0.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.3725 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.3870 if c>=1.0 & x2>=1.0\n",
      "   +0.3593 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2732 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.2149 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.7436 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1654 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.1198 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0373 if x1>=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   -0.0494 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.1090 if x2<=2.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.2512 if x2<=0.0 & x3-x1<=2.0 & x3-x1>=-2.0\n",
      "   -0.1777 if x2<=1.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.3987 if c>=1.0 & x3-x1<=0.0\n",
      "   +0.2305 if c<=0.0 & x2<=0.0\n",
      "   +0.2234 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.9474 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2816 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.5692 if x4-x2>=0.0\n",
      "   +0.4754 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.4516 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1670 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3943 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.5923 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.2970 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.1392 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.0255 if x2>=3.0 & x3-x1>=1.0\n",
      "   +0.0976 if x1>=1.0 & x2<=0.0 & x3-x1<=1.0\n",
      "   +0.0384 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2301 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2282 if x2>=3.0 & x4-x2<=-2.0\n",
      "   -0.1033 if x3-x1<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.6385 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4912 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0911 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.8309 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.5249 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.3630 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.3533 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.5089 if x1>=1.0 & x2<=1.0\n",
      "   +0.0000 if x3-x1<=1.0 & x4-x2>=2.0\n",
      "   +0.4415 if x1>=3.0 & x4-x2>=0.0\n",
      "   -0.0702 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.1767 if c>=1.0 & x4-x2>=1.0\n",
      "   +0.2813 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.1112 if x2>=1.0 & x3-x1>=1.0\n",
      "   +0.2980 if c<=0.0 & x1>=3.0 & x2<=1.0\n",
      "   -0.0904 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "init state [ 3  2 -1 -1  0]\n",
      "(7,) (7,)\n",
      "init state [ 0  1  3 -1  0]\n",
      "(30,) (23,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(35,) (5,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(46,) (11,)\n",
      "init state [ 0  2  0 -1  0]\n",
      "(59,) (13,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(68,) (9,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(88,) (20,)\n",
      "init state [ 3  2  0 -2  0]\n",
      "(106,) (18,)\n",
      "init state [ 2  0 -1  2  0]\n",
      "(112,) (6,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(127,) (15,)\n",
      "============ 108 ===========\n",
      "Run episode 108 with rewards 27, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.0047 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1976 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0690 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.8222 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2118 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.4904 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2806 if c<=0.0 & x1<=0.0\n",
      "   -0.3289 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1911 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   +0.1740 if x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.3444 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4239 if x3-x1>=1.0\n",
      "   -0.2652 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c<=0.0 & x1>=3.0 & x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0433 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.4711 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.3329 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.5931 if c>=1.0 & x2>=1.0\n",
      "   +0.2084 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1312 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.2224 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4452 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0695 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.5046 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0572 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   -0.0487 if x2<=2.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.2211 if x2<=0.0 & x3-x1<=2.0 & x3-x1>=-2.0\n",
      "   -0.0730 if x2<=1.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.3860 if c>=1.0 & x3-x1<=0.0\n",
      "   +0.2494 if c<=0.0 & x2<=0.0\n",
      "   -0.0653 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.7320 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.5441 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2964 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.3424 if x4-x2>=0.0\n",
      "   +0.3364 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.1511 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3141 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.1262 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0159 if c<=0.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.1490 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.6280 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.1369 if x1>=1.0 & x2<=0.0 & x3-x1<=1.0\n",
      "   -0.2240 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4184 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3836 if x2>=3.0 & x4-x2<=-2.0\n",
      "   -0.2866 if x3-x1<=1.0\n",
      "   -0.1774 if c<=0.0 & x1>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.3366 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.7528 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0843 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.7164 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.4500 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.9151 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.1871 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.3053 if x1>=1.0 & x2<=1.0\n",
      "   +0.1059 if x1>=3.0 & x4-x2>=0.0\n",
      "   -0.1132 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.1038 if c>=1.0 & x4-x2>=1.0\n",
      "   +0.6264 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.2761 if x2>=1.0 & x3-x1>=1.0\n",
      "   -0.0766 if c<=0.0 & x1>=3.0 & x2<=1.0\n",
      "   +0.3368 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.6431 if c<=0.0 & x4-x2>=1.0\n",
      "init state [ 3  1 -1  1  0]\n",
      "(10,) (10,)\n",
      "init state [ 2  3  1 -1  0]\n",
      "(16,) (6,)\n",
      "init state [0 1 3 1 0]\n",
      "(23,) (7,)\n",
      "init state [ 2  2 -2 -1  0]\n",
      "(36,) (13,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(56,) (20,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(84,) (28,)\n",
      "init state [0 0 0 3 0]\n",
      "(101,) (17,)\n",
      "init state [ 1  1 -1  1  0]\n",
      "(109,) (8,)\n",
      "init state [ 1  2  2 -1  0]\n",
      "(127,) (18,)\n",
      "init state [ 1  3  1 -1  0]\n",
      "(135,) (8,)\n",
      "============ 109 ===========\n",
      "Run episode 109 with rewards 34, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   +0.2028 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3130 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.2047 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.5612 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0723 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.4779 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.3114 if c<=0.0 & x1<=0.0\n",
      "   -0.4282 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.2769 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   -0.0125 if x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.5160 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3257 if x3-x1>=1.0\n",
      "   +0.3183 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0275 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0716 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.1226 if x3-x1<=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.5460 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.5115 if c>=1.0 & x2>=1.0\n",
      "   +0.5742 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0852 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.2480 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.8048 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.2725 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   -0.0147 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1096 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.0861 if x2<=0.0 & x3-x1<=2.0 & x3-x1>=-2.0\n",
      "   +0.0000 if x2<=1.0 & x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.3357 if c>=1.0 & x3-x1<=0.0\n",
      "   +0.1270 if c<=0.0 & x2<=0.0\n",
      "   -0.0682 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.3412 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.5131 if x1<=0.0 & x3-x1<=2.0 & x3-x1>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.7785 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0747 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.6249 if x4-x2>=0.0\n",
      "   +0.1110 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.1654 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.0753 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.1012 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.1114 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.2105 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.0075 if x1>=1.0 & x2<=0.0 & x3-x1<=1.0\n",
      "   -0.3684 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1157 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2374 if x2>=3.0 & x4-x2<=-2.0\n",
      "   -0.0134 if x3-x1<=1.0\n",
      "   +0.0507 if c<=0.0 & x1>=3.0\n",
      "   +0.0235 if x4-x2<=-3.0\n",
      "----------------- 3 --------------\n",
      "   +0.3461 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5478 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0268 if x1<=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.6125 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.1444 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.9199 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.1007 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.2352 if x1>=1.0 & x2<=1.0\n",
      "   +0.2093 if x1>=3.0 & x4-x2>=0.0\n",
      "   -0.1142 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.1744 if c>=1.0 & x4-x2>=1.0\n",
      "   +0.7585 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.2582 if x2>=1.0 & x3-x1>=1.0\n",
      "   +0.1306 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.5311 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.1554 if c<=0.0 & x4-x2>=2.0\n",
      "init state [0 2 1 0 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(4,) (4,)\n",
      "init state [ 2  1 -1  2  0]\n",
      "(9,) (5,)\n",
      "init state [ 0  3  0 -1  0]\n",
      "(17,) (8,)\n",
      "init state [ 0  3  3 -2  0]\n",
      "(29,) (12,)\n",
      "init state [3 1 0 1 0]\n",
      "(35,) (6,)\n",
      "init state [1 1 0 2 0]\n",
      "(39,) (4,)\n",
      "init state [0 1 1 1 0]\n",
      "(44,) (5,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(64,) (20,)\n",
      "init state [0 0 2 1 0]\n",
      "(75,) (11,)\n",
      "init state [ 0  3  0 -1  0]\n",
      "(90,) (15,)\n",
      "============ 110 ===========\n",
      "Run episode 110 with rewards 27, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   +0.3543 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2549 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.1693 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.6538 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2279 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.1643 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2791 if c<=0.0 & x1<=0.0\n",
      "   -0.2953 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0874 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   +0.4342 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2091 if x3-x1>=1.0\n",
      "   -0.0953 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0764 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.3463 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.0819 if x3-x1<=-2.0\n",
      "   +0.4240 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.4379 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.4977 if c>=1.0 & x2>=1.0\n",
      "   +0.5993 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2017 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4125 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.8503 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0464 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.1623 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0356 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.3393 if x2<=0.0 & x3-x1<=2.0 & x3-x1>=-2.0\n",
      "   +0.5804 if c>=1.0 & x3-x1<=0.0\n",
      "   +0.2115 if c<=0.0 & x2<=0.0\n",
      "   -0.2338 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.3137 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.1387 if x1<=0.0 & x3-x1<=2.0 & x3-x1>=2.0\n",
      "   -0.2072 if x2<=1.0 & x3-x1>=2.0 & x3-x1>=3.0\n",
      "----------------- 2 --------------\n",
      "   +0.4274 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0123 if c>=1.0 & x1>=1.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.5838 if x4-x2>=0.0\n",
      "   +0.0224 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.1672 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.2145 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.0624 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.2448 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.0859 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.1180 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2045 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0466 if x2>=3.0 & x4-x2<=-2.0\n",
      "   -0.1079 if x3-x1<=1.0\n",
      "   +0.0371 if c<=0.0 & x1>=3.0\n",
      "   +0.0807 if x4-x2<=-3.0\n",
      "   +0.3222 if x2<=2.0 & x3-x1>=3.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.2044 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5784 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.3382 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2542 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.8405 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.5450 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.3686 if x1>=1.0 & x2<=1.0\n",
      "   +0.2070 if x1>=3.0 & x4-x2>=0.0\n",
      "   +0.3104 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   -0.0189 if c>=1.0 & x4-x2>=1.0\n",
      "   +0.5877 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0598 if x2>=1.0 & x3-x1>=1.0\n",
      "   +0.1998 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.6066 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.2087 if c<=0.0 & x4-x2>=2.0\n",
      "   -0.2894 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "init state [2 1 1 0 0]\n",
      "(24,) (24,)\n",
      "init state [ 1  0 -1  2  0]\n",
      "(35,) (11,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(64,) (29,)\n",
      "init state [0 1 3 1 0]\n",
      "(69,) (5,)\n",
      "init state [ 2  3  0 -1  0]\n",
      "(96,) (27,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(133,) (37,)\n",
      "init state [0 1 3 1 0]\n",
      "(142,) (9,)\n",
      "init state [ 1  3  2 -3  0]\n",
      "(173,) (31,)\n",
      "init state [ 2  1 -1  2  0]\n",
      "(179,) (6,)\n",
      "init state [1 0 2 1 0]\n",
      "(197,) (18,)\n",
      "============ 111 ===========\n",
      "Run episode 111 with rewards 24, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   +0.4473 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4962 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0518 if c<=0.0 & x1<=2.0 & x3-x1>=-1.0\n",
      "   +0.5814 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3471 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.7598 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2907 if c<=0.0 & x1<=0.0\n",
      "   -0.1665 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0615 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   +0.2563 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3333 if x3-x1>=1.0\n",
      "   -0.0524 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2546 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.2012 if x3-x1<=-2.0\n",
      "   +0.4154 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.5234 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.3870 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.6629 if c>=1.0 & x2>=1.0\n",
      "   +0.2117 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3026 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4716 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.6679 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.4556 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.4811 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1633 if x2<=0.0 & x3-x1<=2.0 & x3-x1>=-2.0\n",
      "   +0.2660 if c>=1.0 & x3-x1<=0.0\n",
      "   +0.1688 if c<=0.0 & x2<=0.0\n",
      "   +0.1351 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.2895 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1<=0.0 & x3-x1<=2.0 & x3-x1>=2.0\n",
      "   +0.1319 if x2<=1.0 & x3-x1>=2.0 & x3-x1>=3.0\n",
      "   -0.2095 if x2<=0.0 & x3-x1<=2.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.1965 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1552 if x4-x2>=0.0\n",
      "   +0.3733 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.1321 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.2647 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.2247 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0104 if x1<=1.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.3749 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.0644 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0489 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0444 if x2>=3.0 & x4-x2<=-2.0\n",
      "   -0.5551 if x3-x1<=1.0\n",
      "   -0.1436 if c<=0.0 & x1>=3.0\n",
      "   +0.1074 if x4-x2<=-3.0\n",
      "   -0.0665 if x2<=2.0 & x3-x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.2297 if x3-x1<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.5912 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.6525 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.5653 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3714 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.4782 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0307 if x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.2186 if x1>=1.0 & x2<=1.0\n",
      "   +0.4204 if x1>=3.0 & x4-x2>=0.0\n",
      "   +0.2780 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.3634 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.4032 if x2>=1.0 & x3-x1>=1.0\n",
      "   +0.5442 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.3634 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.4666 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.2226 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1466 if x1<=2.0\n",
      "init state [ 2  3 -2  0  0]\n",
      "(10,) (10,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(33,) (23,)\n",
      "init state [ 0  3  0 -3  0]\n",
      "(53,) (20,)\n",
      "init state [2 1 1 1 0]\n",
      "(56,) (3,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(76,) (20,)\n",
      "init state [2 0 0 3 0]\n",
      "(82,) (6,)\n",
      "init state [0 1 1 0 0]\n",
      "(89,) (7,)\n",
      "init state [1 1 1 2 0]\n",
      "(114,) (25,)\n",
      "init state [ 0  2  1 -1  0]\n",
      "(154,) (40,)\n",
      "init state [ 1  3  2 -3  0]\n",
      "(181,) (27,)\n",
      "============ 112 ===========\n",
      "Run episode 112 with rewards 15, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   +0.0150 if x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0558 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.3185 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2838 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.6593 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0282 if c<=0.0 & x1<=0.0\n",
      "   -0.4387 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0460 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   +0.4307 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3349 if x3-x1>=1.0\n",
      "   +0.0344 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2421 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.2135 if x3-x1<=-2.0\n",
      "   +0.3867 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.2680 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   +0.3970 if x1<=2.0 & x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.3659 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.5908 if c>=1.0 & x2>=1.0\n",
      "   +0.4398 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.4592 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3628 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.6085 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1836 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.0846 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1595 if x2<=0.0 & x3-x1<=2.0 & x3-x1>=-2.0\n",
      "   +0.3665 if c>=1.0 & x3-x1<=0.0\n",
      "   +0.1816 if c<=0.0 & x2<=0.0\n",
      "   +0.0903 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.1180 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0346 if x2<=1.0 & x3-x1>=2.0 & x3-x1>=3.0\n",
      "   -0.0738 if x2<=0.0 & x3-x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0603 if x4-x2<=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.7250 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3529 if x4-x2>=0.0\n",
      "   +0.6019 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.0582 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.5899 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.2175 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.1392 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.2013 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2574 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2056 if x2>=3.0 & x4-x2<=-2.0\n",
      "   -0.3161 if x3-x1<=1.0\n",
      "   -0.2407 if c<=0.0 & x1>=3.0\n",
      "   -0.2401 if x4-x2<=-3.0\n",
      "   +0.0119 if x2<=2.0 & x3-x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.3364 if x3-x1<=-1.0\n",
      "   -0.1789 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.5782 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5180 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.6270 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.6078 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.5702 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5713 if x1>=1.0 & x2<=1.0\n",
      "   +0.7898 if x1>=3.0 & x4-x2>=0.0\n",
      "   +0.1613 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.3541 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0446 if x2>=1.0 & x3-x1>=1.0\n",
      "   +0.1796 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.4140 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.2926 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.1754 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.3414 if x1<=2.0\n",
      "   +0.5054 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-1.0\n",
      "init state [0 0 3 1 0]\n",
      "(8,) (8,)\n",
      "init state [ 2  3 -2  0  0]\n",
      "(16,) (8,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(63,) (47,)\n",
      "init state [ 3  0 -1  1  0]\n",
      "(70,) (7,)\n",
      "init state [0 0 1 1 0]\n",
      "(77,) (7,)\n",
      "init state [ 3  2 -3 -2  0]\n",
      "(108,) (31,)\n",
      "init state [0 1 1 2 0]\n",
      "(121,) (13,)\n",
      "init state [ 3  2 -3  0  0]\n",
      "(139,) (18,)\n",
      "init state [0 0 0 1 0]\n",
      "(149,) (10,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(157,) (8,)\n",
      "============ 113 ===========\n",
      "Run episode 113 with rewards 34, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   +0.5181 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.4895 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.1386 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.5330 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1703 if c<=0.0 & x1<=0.0\n",
      "   +0.1983 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0771 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   -0.0835 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3144 if x3-x1>=1.0\n",
      "   -0.0374 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6299 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.2912 if x3-x1<=-2.0\n",
      "   +0.1829 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.6465 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.3274 if x1<=2.0 & x2>=3.0\n",
      "   -0.1204 if c<=0.0 & x1>=2.0 & x4-x2<=-3.0\n",
      "----------------- 1 --------------\n",
      "   +0.1761 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.5352 if c>=1.0 & x2>=1.0\n",
      "   +0.4896 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3238 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.0428 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.5369 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.4827 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.1668 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0282 if x2<=0.0 & x3-x1<=2.0 & x3-x1>=-2.0\n",
      "   +0.5566 if c>=1.0 & x3-x1<=0.0\n",
      "   +0.2290 if c<=0.0 & x2<=0.0\n",
      "   -0.1866 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.3886 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0300 if x2<=0.0 & x3-x1<=2.0 & x4-x2>=1.0\n",
      "   +0.3620 if x4-x2<=0.0\n",
      "   -0.1732 if x3-x1<=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.6558 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.7796 if x4-x2>=0.0\n",
      "   +0.7981 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.5215 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.6067 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.4281 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2140 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.3922 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1980 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2426 if x2>=3.0 & x4-x2<=-2.0\n",
      "   -0.1534 if x3-x1<=1.0\n",
      "   -0.1702 if c<=0.0 & x1>=3.0\n",
      "   +0.2426 if x4-x2<=-3.0\n",
      "   +0.1064 if x3-x1<=-1.0\n",
      "   +0.3485 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2689 if x2<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4893 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5896 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.4026 if x1<=2.0 & x4-x2<=0.0\n",
      "   -0.0141 if x1>=2.0 & x3-x1>=-2.0\n",
      "   +0.1456 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.6640 if x1>=1.0 & x2<=1.0\n",
      "   +0.1473 if x1>=3.0 & x4-x2>=0.0\n",
      "   +0.6619 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.2459 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.3127 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.2459 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.1787 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.1556 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.3223 if x1<=2.0\n",
      "   -0.0252 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-1.0\n",
      "   +0.3152 if x4-x2<=1.0\n",
      "init state [3 0 0 1 0]\n",
      "(4,) (4,)\n",
      "init state [ 2  2  1 -1  0]\n",
      "(11,) (7,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(24,) (13,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(46,) (22,)\n",
      "init state [1 1 1 2 0]\n",
      "(52,) (6,)\n",
      "init state [ 1  2  0 -1  0]\n",
      "(66,) (14,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(80,) (14,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(101,) (21,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(109,) (8,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(130,) (21,)\n",
      "============ 114 ===========\n",
      "Run episode 114 with rewards 21, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   +0.4945 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.2195 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0304 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.2288 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2236 if c<=0.0 & x1<=0.0\n",
      "   +0.2421 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.1224 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   +0.0516 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.0980 if x3-x1>=1.0\n",
      "   +0.2527 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.0882 if x3-x1<=-2.0\n",
      "   +0.2278 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.3020 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.2414 if x1<=2.0 & x2>=3.0\n",
      "   -0.0013 if c<=0.0 & x1>=2.0 & x4-x2<=-3.0\n",
      "   -0.1354 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.4583 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.2149 if c>=1.0 & x2>=1.0\n",
      "   +0.3710 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0307 if x1>=3.0 & x4-x2<=0.0\n",
      "   +0.0574 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4767 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1482 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.1546 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.5418 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.2245 if c<=0.0 & x2<=0.0\n",
      "   -0.2667 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.2546 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0423 if x2<=0.0 & x3-x1<=2.0 & x4-x2>=1.0\n",
      "   +0.2736 if x4-x2<=0.0\n",
      "   +0.0538 if x3-x1<=2.0\n",
      "   -0.3270 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.7658 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.9543 if x4-x2>=0.0\n",
      "   +0.9092 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.3373 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1926 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3019 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.1101 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.2824 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2392 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2975 if x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.1805 if x3-x1<=1.0\n",
      "   -0.0223 if c<=0.0 & x1>=3.0\n",
      "   +0.1361 if x4-x2<=-3.0\n",
      "   +0.0398 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2235 if x2<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0886 if c<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.6672 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4517 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.4151 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.1925 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.3632 if x1>=1.0 & x2<=1.0\n",
      "   +0.3455 if x1>=3.0 & x4-x2>=0.0\n",
      "   +0.3478 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.3883 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0731 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.3235 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.0132 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.2272 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.2465 if x1<=2.0\n",
      "   -0.1569 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-1.0\n",
      "   +0.4871 if x4-x2<=1.0\n",
      "   +0.6246 if x1<=2.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "init state [ 2  1 -2  1  0]\n",
      "(11,) (11,)\n",
      "init state [1 2 1 1 0]\n",
      "(14,) (3,)\n",
      "init state [ 2  3 -2 -1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(23,) (9,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(36,) (13,)\n",
      "init state [ 1  3  1 -3  0]\n",
      "(44,) (8,)\n",
      "init state [ 2  3  1 -2  0]\n",
      "(54,) (10,)\n",
      "init state [ 2  2 -2  1  0]\n",
      "(82,) (28,)\n",
      "init state [ 1  0 -1  0  0]\n",
      "(97,) (15,)\n",
      "init state [ 1  0 -1  3  0]\n",
      "(111,) (14,)\n",
      "init state [1 3 1 0 0]\n",
      "(113,) (2,)\n",
      "============ 115 ===========\n",
      "Run episode 115 with rewards 40, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   +0.2949 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.7868 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0316 if c<=0.0 & x3-x1>=-2.0\n",
      "   +0.3151 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0663 if c<=0.0 & x1<=0.0\n",
      "   +0.1537 if x1>=2.0 & x4-x2>=0.0\n",
      "   -0.3343 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   -0.4438 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2527 if x3-x1>=1.0\n",
      "   -0.2972 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.1009 if x3-x1<=-2.0\n",
      "   -0.1026 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.4980 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   +0.0801 if x1<=2.0 & x2>=3.0\n",
      "   -0.0388 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2466 if x1<=1.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.5162 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.4182 if c>=1.0 & x2>=1.0\n",
      "   +0.4470 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2588 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2566 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.3033 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.4019 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.4781 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.0325 if c<=0.0 & x2<=0.0\n",
      "   -0.0415 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.8307 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0165 if x2<=0.0 & x3-x1<=2.0 & x4-x2>=1.0\n",
      "   +0.4219 if x4-x2<=0.0\n",
      "   -0.0784 if x3-x1<=2.0\n",
      "   +0.0000 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.4980 if x2<=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.7145 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.8531 if x4-x2>=0.0\n",
      "   +0.8547 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.3082 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.5240 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.2400 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0456 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.7568 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0651 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2412 if x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.2058 if x3-x1<=1.0\n",
      "   +0.1297 if x4-x2<=-3.0\n",
      "   -0.0731 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0270 if x2<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.0636 if c<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=0.0\n",
      "   -0.2460 if x2<=2.0 & x3-x1>=1.0 & x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.6300 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.6463 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.5937 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.9225 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5205 if x1>=1.0 & x2<=1.0\n",
      "   -0.1398 if x1>=3.0 & x4-x2>=0.0\n",
      "   -0.0689 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.4235 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.1363 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.4812 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.3407 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0380 if x1<=2.0\n",
      "   -0.1635 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-1.0\n",
      "   -0.0078 if x4-x2<=1.0\n",
      "   +0.4760 if x1<=2.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.6500 if x1<=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "init state [1 0 2 1 0]\n",
      "(8,) (8,)\n",
      "init state [0 1 1 2 0]\n",
      "(16,) (8,)\n",
      "init state [ 0  3  3 -2  0]\n",
      "(35,) (19,)\n",
      "init state [1 0 0 3 0]\n",
      "(40,) (5,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(60,) (20,)\n",
      "init state [ 1  2  2 -2  0]\n",
      "(73,) (13,)\n",
      "init state [ 2  1 -1  1  0]\n",
      "(78,) (5,)\n",
      "init state [0 1 1 1 0]\n",
      "(86,) (8,)\n",
      "init state [ 2  3 -1 -1  0]\n",
      "(94,) (8,)\n",
      "init state [ 2  0 -2  0  0]\n",
      "(115,) (21,)\n",
      "============ 116 ===========\n",
      "Run episode 116 with rewards 21, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   +0.3703 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.5152 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3645 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.3110 if c<=0.0 & x1<=0.0\n",
      "   +0.2837 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.2585 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   -0.2914 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2691 if x3-x1>=1.0\n",
      "   +0.6779 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.0038 if x3-x1<=-2.0\n",
      "   -0.2244 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.3677 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.4931 if x1<=2.0 & x2>=3.0\n",
      "   +0.0593 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0159 if x1<=1.0 & x4-x2>=2.0\n",
      "   -0.3800 if c>=1.0 & x1>=1.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.6429 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.4243 if c>=1.0 & x2>=1.0\n",
      "   +0.1377 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2437 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3310 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0411 if c>=1.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=-2.0\n",
      "   +0.3482 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3761 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.3541 if c<=0.0 & x2<=0.0\n",
      "   -0.3265 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.5277 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.1364 if x2<=0.0 & x3-x1<=2.0 & x4-x2>=1.0\n",
      "   +0.3932 if x4-x2<=0.0\n",
      "   +0.1568 if x3-x1<=2.0\n",
      "   +0.0744 if x2<=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2488 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x3-x1<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.6487 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.7153 if x4-x2>=0.0\n",
      "   +0.1826 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.1922 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1747 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   +0.0672 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2712 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.4281 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5935 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1203 if x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.1496 if x3-x1<=1.0\n",
      "   +0.0848 if x4-x2<=-3.0\n",
      "   -0.1246 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0634 if c<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=0.0\n",
      "   +0.1209 if x2<=2.0 & x3-x1>=1.0 & x4-x2<=-2.0\n",
      "   -0.5181 if c>=1.0 & x3-x1>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.1937 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.7721 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.5138 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2424 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.4182 if x1>=1.0 & x2<=1.0\n",
      "   -0.0279 if x1>=3.0 & x4-x2>=0.0\n",
      "   +0.4824 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.2621 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0374 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.3453 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.0620 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1089 if x1<=2.0\n",
      "   -0.2470 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-1.0\n",
      "   +0.4976 if x1<=2.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.2233 if x1<=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   +0.2376 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "init state [1 2 1 1 0]\n",
      "(3,) (3,)\n",
      "init state [ 2  0 -1  1  0]\n",
      "(9,) (6,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(41,) (32,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(54,) (13,)\n",
      "init state [ 1  1 -1  1  0]\n",
      "(72,) (18,)\n",
      "init state [1 3 1 0 0]\n",
      "(74,) (2,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(95,) (21,)\n",
      "init state [1 0 1 3 0]\n",
      "(100,) (5,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(170,) (70,)\n",
      "init state [1 1 2 1 0]\n",
      "(185,) (15,)\n",
      "============ 117 ===========\n",
      "Run episode 117 with rewards 27, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   +0.4730 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.6067 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0316 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1886 if c<=0.0 & x1<=0.0\n",
      "   +0.0084 if x1>=2.0 & x4-x2>=0.0\n",
      "   +0.5131 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   -0.0101 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.1611 if x3-x1>=1.0\n",
      "   +0.7470 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.3246 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.4933 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.2100 if x1<=2.0 & x2>=3.0\n",
      "   +0.3502 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1927 if x1<=1.0 & x4-x2>=2.0\n",
      "   -0.1230 if c>=1.0 & x1>=1.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.5628 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.6678 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.1726 if c>=1.0 & x2>=1.0\n",
      "   +0.3678 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2372 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3678 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1056 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.2895 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.6140 if c<=0.0 & x2<=0.0\n",
      "   +0.0520 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.4833 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0044 if x2<=0.0 & x3-x1<=2.0 & x4-x2>=1.0\n",
      "   +0.7639 if x4-x2<=0.0\n",
      "   +0.0112 if x3-x1<=2.0\n",
      "   +0.3495 if x2<=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0741 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x3-x1<=0.0\n",
      "   -0.1489 if x2<=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.0338 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0856 if x4-x2>=0.0\n",
      "   +0.0959 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.1356 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.4079 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3001 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.1382 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.1284 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1256 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0153 if x2>=3.0 & x4-x2<=-2.0\n",
      "   -0.1717 if x3-x1<=1.0\n",
      "   +0.0000 if x4-x2<=-3.0\n",
      "   -0.1213 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x2<=2.0 & x3-x1>=1.0 & x4-x2<=-2.0\n",
      "   -0.2361 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.4628 if x3-x1>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4757 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.9702 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.3117 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.1836 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0402 if x1>=1.0 & x2<=1.0\n",
      "   +0.7851 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.4987 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.2892 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.6983 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.3805 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2748 if x1<=2.0\n",
      "   -0.0966 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-1.0\n",
      "   +0.1684 if x1<=2.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.0026 if x1<=1.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.4622 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.4590 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "init state [ 2  1 -1  0  0]\n",
      "(10,) (10,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(24,) (14,)\n",
      "init state [1 1 2 1 0]\n",
      "(37,) (13,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(53,) (16,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(121,) (68,)\n",
      "init state [ 1  1 -1  1  0]\n",
      "(129,) (8,)\n",
      "init state [ 2  1 -1  1  0]\n",
      "(137,) (8,)\n",
      "init state [ 3  2 -1 -1  0]\n",
      "(150,) (13,)\n",
      "init state [ 1  2  2 -2  0]\n",
      "(170,) (20,)\n",
      "init state [1 2 2 0 0]\n",
      "(173,) (3,)\n",
      "============ 118 ===========\n",
      "Run episode 118 with rewards 39, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   +0.4561 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.7500 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0461 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0292 if c<=0.0 & x1<=0.0\n",
      "   +0.2201 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   +0.2293 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.1895 if x3-x1>=1.0\n",
      "   +0.6293 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.2077 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.2930 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.3449 if x1<=2.0 & x2>=3.0\n",
      "   +0.5154 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0658 if x1<=1.0 & x4-x2>=2.0\n",
      "   -0.1688 if c>=1.0 & x1>=1.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.3871 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   +0.1400 if x1<=0.0 & x2<=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.1870 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +1.0353 if c>=1.0 & x2>=1.0\n",
      "   +0.5296 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.7368 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0654 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0605 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   -0.3613 if c>=1.0 & x3-x1<=0.0\n",
      "   +0.0926 if c<=0.0 & x2<=0.0\n",
      "   +0.1172 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.7142 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.3260 if x4-x2<=0.0\n",
      "   +0.1574 if x3-x1<=2.0\n",
      "   +0.0795 if x2<=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0508 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x3-x1<=0.0\n",
      "   -0.3459 if x2<=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.4544 if x3-x1>=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.7003 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.4928 if x4-x2>=0.0\n",
      "   +0.7383 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.0932 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1226 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3871 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3184 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.0681 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4966 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0251 if x2>=3.0 & x4-x2<=-2.0\n",
      "   -0.0972 if x3-x1<=1.0\n",
      "   +0.1379 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0608 if x2<=2.0 & x3-x1>=1.0 & x4-x2<=-2.0\n",
      "   -0.5028 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.6385 if x3-x1>=1.0\n",
      "   -0.4107 if x3-x1>=3.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +1.7110 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   -0.1852 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1192 if x1<=2.0 & x4-x2<=0.0\n",
      "   +1.9056 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.4751 if x1>=1.0 & x2<=1.0\n",
      "   -0.3377 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   -0.0875 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.7235 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   -0.0875 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.1505 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.2067 if x1<=2.0\n",
      "   +0.0763 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-1.0\n",
      "   -0.2883 if x1<=2.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.4192 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0413 if x2>=1.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.3604 if x4-x2>=2.0\n",
      "init state [0 2 2 1 0]\n",
      "(19,) (19,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(38,) (19,)\n",
      "init state [ 1  2 -1 -2  0]\n",
      "(64,) (26,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(78,) (14,)\n",
      "init state [0 1 3 0 0]\n",
      "(91,) (13,)\n",
      "init state [ 3  0 -2  0  0]\n",
      "(107,) (16,)\n",
      "init state [ 3  0 -1  3  0]\n",
      "(118,) (11,)\n",
      "init state [1 0 2 2 0]\n",
      "(128,) (10,)\n",
      "init state [ 0  3  2 -3  0]\n",
      "(146,) (18,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(177,) (31,)\n",
      "============ 119 ===========\n",
      "Run episode 119 with rewards 11, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   +0.0916 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.4776 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2428 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.1452 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   +0.1809 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.0201 if x3-x1>=1.0\n",
      "   +0.4069 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.2315 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.0340 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   +0.1722 if x1<=2.0 & x2>=3.0\n",
      "   +0.3893 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2005 if x1<=1.0 & x4-x2>=2.0\n",
      "   -0.2945 if c>=1.0 & x1>=1.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.0419 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.0916 if x1<=0.0 & x2<=0.0\n",
      "   -0.6325 if x2>=3.0 & x4-x2<=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.2075 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.6372 if c>=1.0 & x2>=1.0\n",
      "   +0.3976 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.5325 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2332 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1470 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.4071 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.0251 if c<=0.0 & x2<=0.0\n",
      "   -0.0608 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.6838 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.3227 if x4-x2<=0.0\n",
      "   +0.0920 if x3-x1<=2.0\n",
      "   +1.0359 if x2<=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3177 if x2<=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.4360 if x3-x1>=-1.0\n",
      "   +0.2051 if x1<=0.0 & x3-x1>=3.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.7332 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.8671 if x4-x2>=0.0\n",
      "   +0.4333 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.5717 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1899 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.2001 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.1473 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.3616 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1625 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0656 if x3-x1<=1.0\n",
      "   +0.1012 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1300 if x2<=2.0 & x3-x1>=1.0 & x4-x2<=-2.0\n",
      "   -0.1919 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.5267 if x3-x1>=1.0\n",
      "   -0.2223 if x3-x1>=3.0 & x4-x2>=-1.0\n",
      "   +0.4039 if c<=0.0 & x1>=3.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.4099 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4719 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1562 if x1<=2.0 & x4-x2<=0.0\n",
      "   +1.2438 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.3591 if x1>=1.0 & x2<=1.0\n",
      "   -0.1095 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.3916 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.5318 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.4150 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.1915 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.2615 if x1<=2.0\n",
      "   -0.0242 if x2>=3.0 & x3-x1<=0.0 & x3-x1>=-1.0\n",
      "   -0.0278 if x1<=2.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.3839 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1690 if x4-x2>=2.0\n",
      "   +0.3938 if x2<=1.0 & x3-x1>=3.0 & x4-x2<=0.0\n",
      "init state [ 3  2 -3 -2  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(34,) (34,)\n",
      "init state [1 2 0 1 0]\n",
      "(38,) (4,)\n",
      "init state [ 3  0 -1  2  0]\n",
      "(43,) (5,)\n",
      "init state [1 1 1 1 0]\n",
      "(52,) (9,)\n",
      "init state [ 3  0 -1  2  0]\n",
      "(61,) (9,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(68,) (7,)\n",
      "init state [ 1  1  1 -1  0]\n",
      "(78,) (10,)\n",
      "init state [ 2  1  0 -1  0]\n",
      "(95,) (17,)\n",
      "init state [1 0 2 1 0]\n",
      "(114,) (19,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(123,) (9,)\n",
      "============ 120 ===========\n",
      "Run episode 120 with rewards 33, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   +0.5785 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.5773 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2932 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0965 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   +0.0613 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.0151 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.5661 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.0980 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.2754 if x1<=2.0 & x2>=3.0\n",
      "   +0.2811 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1<=1.0 & x4-x2>=2.0\n",
      "   -0.1313 if c>=1.0 & x1>=1.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.3342 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   +0.0205 if x1<=0.0 & x2<=0.0\n",
      "   -0.1973 if x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.3471 if c>=1.0 & x3-x1<=-2.0 & x3-x1<=-3.0\n",
      "----------------- 1 --------------\n",
      "   -0.1263 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.4037 if c>=1.0 & x2>=1.0\n",
      "   +0.6926 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2940 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.5037 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.3887 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.2806 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.0427 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.4053 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0207 if x4-x2<=0.0\n",
      "   -0.1070 if x3-x1<=2.0\n",
      "   +0.0611 if x2<=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0176 if x2<=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.1846 if x3-x1>=-1.0\n",
      "   +0.0000 if x1<=0.0 & x3-x1>=3.0 & x4-x2>=1.0\n",
      "   +0.7707 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.6991 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.6850 if x4-x2>=0.0\n",
      "   +0.4080 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.5730 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1711 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.4595 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3669 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.1164 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2127 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4714 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0156 if x2<=2.0 & x3-x1>=1.0 & x4-x2<=-2.0\n",
      "   +0.0340 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.4121 if x3-x1>=1.0\n",
      "   -0.0703 if x3-x1>=3.0 & x4-x2>=-1.0\n",
      "   +0.0098 if c<=0.0 & x1>=3.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.2883 if x1>=1.0 & x2>=2.0 & x3-x1>=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.5930 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5567 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.2229 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.4584 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.4837 if x1>=1.0 & x2<=1.0\n",
      "   -0.0128 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.3328 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.6160 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.4815 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.3745 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.3585 if x1<=2.0\n",
      "   +0.0182 if x1<=2.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.3826 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1590 if x4-x2>=2.0\n",
      "   +0.0000 if x2<=1.0 & x3-x1>=3.0 & x4-x2<=0.0\n",
      "   -0.6763 if c<=0.0 & x2<=1.0 & x3-x1>=1.0\n",
      "init state [ 3  2 -2 -1  0]\n",
      "(13,) (13,)\n",
      "init state [ 2  1 -1  1  0]\n",
      "(29,) (16,)\n",
      "init state [1 0 0 1 0]\n",
      "(50,) (21,)\n",
      "init state [1 0 1 3 0]\n",
      "(61,) (11,)\n",
      "init state [1 0 0 3 0]\n",
      "(75,) (14,)\n",
      "init state [ 2  0 -1  0  0]\n",
      "(93,) (18,)\n",
      "init state [ 2  2  0 -1  0]\n",
      "(97,) (4,)\n",
      "init state [1 1 0 1 0]\n",
      "(101,) (4,)\n",
      "init state [0 0 2 3 0]\n",
      "(111,) (10,)\n",
      "init state [ 3  1 -1  1  0]\n",
      "(125,) (14,)\n",
      "============ 121 ===========\n",
      "Run episode 121 with rewards 28, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   +0.3117 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.5030 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2349 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1552 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   +0.1350 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2843 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.0490 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.2274 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   +0.0418 if x1<=2.0 & x2>=3.0\n",
      "   -0.1021 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2112 if c>=1.0 & x1>=1.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.0640 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.0935 if x1<=0.0 & x2<=0.0\n",
      "   +0.1005 if x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0000 if c>=1.0 & x3-x1<=-2.0 & x3-x1<=-3.0\n",
      "   -0.5406 if x3-x1<=0.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.1068 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.5249 if c>=1.0 & x2>=1.0\n",
      "   +0.8804 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1932 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4987 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.3233 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.4529 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.1823 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.7825 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0611 if x4-x2<=0.0\n",
      "   -0.0484 if x3-x1<=2.0\n",
      "   +0.0283 if x2<=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2961 if x2<=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2669 if x3-x1>=-1.0\n",
      "   +0.8056 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   +0.1204 if x2<=0.0 & x3-x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.3575 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0663 if x4-x2>=0.0\n",
      "   +0.4766 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.0716 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3191 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3572 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.1113 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.0257 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3835 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1756 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x2<=2.0 & x3-x1>=1.0 & x4-x2<=-2.0\n",
      "   -0.1352 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.1350 if x3-x1>=1.0\n",
      "   +0.0000 if x3-x1>=3.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=1.0 & x2>=2.0 & x3-x1>=2.0\n",
      "   +0.6859 if c<=0.0 & x2<=2.0 & x2>=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.4976 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5267 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.2287 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.4663 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.6586 if x1>=1.0 & x2<=1.0\n",
      "   +0.3002 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.4823 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.3975 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.2265 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.3401 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.2939 if x1<=2.0\n",
      "   +0.0489 if x1<=2.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.2092 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1463 if x4-x2>=2.0\n",
      "   -0.2989 if c<=0.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.5202 if x4-x2<=2.0\n",
      "init state [ 0  3  1 -3  0]\n",
      "(26,) (26,)\n",
      "init state [2 0 0 2 0]\n",
      "(32,) (6,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(41,) (9,)\n",
      "init state [ 0  3  0 -1  0]\n",
      "(77,) (36,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(104,) (27,)\n",
      "init state [ 0  2  1 -2  0]\n",
      "(118,) (14,)\n",
      "init state [ 3  0 -1  0  0]\n",
      "(131,) (13,)\n",
      "init state [0 0 2 2 0]\n",
      "(141,) (10,)\n",
      "init state [ 3  1  0 -1  0]\n",
      "(156,) (15,)\n",
      "init state [2 1 0 1 0]\n",
      "(159,) (3,)\n",
      "============ 122 ===========\n",
      "Run episode 122 with rewards 39, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.1961 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.7584 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.4646 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.1568 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   +0.6286 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.4615 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.1278 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.5231 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0015 if x1<=2.0 & x2>=3.0\n",
      "   -0.0784 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3316 if c>=1.0 & x1>=1.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.7461 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.0220 if x1<=0.0 & x2<=0.0\n",
      "   +0.2126 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0461 if x3-x1<=0.0 & x4-x2>=2.0\n",
      "   -0.0552 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.1633 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.2970 if c>=1.0 & x2>=1.0\n",
      "   +0.3127 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2149 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4584 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1316 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1881 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.0373 if x2>=1.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.6642 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.1542 if x4-x2<=0.0\n",
      "   +0.0679 if x3-x1<=2.0\n",
      "   +0.0907 if x2<=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2172 if x3-x1>=-1.0\n",
      "   +0.6299 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   +0.3677 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.7275 if x1>=1.0 & x2>=3.0 & x3-x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.6482 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0323 if x4-x2>=0.0\n",
      "   +0.2934 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.4723 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3358 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3831 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3652 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.5329 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2888 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0507 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1223 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.3139 if x3-x1>=1.0\n",
      "   +0.0000 if x3-x1>=3.0 & x4-x2>=-1.0\n",
      "   -0.0873 if x1>=1.0 & x2>=2.0 & x3-x1>=2.0\n",
      "   +0.6025 if c<=0.0 & x2<=2.0 & x2>=2.0\n",
      "   -0.4911 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.5176 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.8432 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.4407 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.5010 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5430 if x1>=1.0 & x2<=1.0\n",
      "   +0.7782 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.2447 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.3456 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.2447 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.0420 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1959 if x1<=2.0\n",
      "   -0.0867 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3361 if x4-x2>=2.0\n",
      "   -0.2020 if c<=0.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.0840 if x4-x2<=2.0\n",
      "   -0.3866 if c<=0.0 & x1>=3.0 & x3-x1>=-1.0\n",
      "init state [2 0 1 1 0]\n",
      "(7,) (7,)\n",
      "init state [1 1 2 0 0]\n",
      "(13,) (6,)\n",
      "init state [1 0 1 1 0]\n",
      "(25,) (12,)\n",
      "init state [1 1 1 2 0]\n",
      "(43,) (18,)\n",
      "init state [ 0  3  1 -3  0]\n",
      "(66,) (23,)\n",
      "init state [2 0 0 2 0]\n",
      "(73,) (7,)\n",
      "init state [ 3  0 -1  2  0]\n",
      "(80,) (7,)\n",
      "init state [3 0 0 1 0]\n",
      "(87,) (7,)\n",
      "init state [ 2  3  1 -2  0]\n",
      "(100,) (13,)\n",
      "init state [ 1  2  2 -1  0]\n",
      "(105,) (5,)\n",
      "============ 123 ===========\n",
      "Run episode 123 with rewards 37, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.0681 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.1117 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.4908 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.1487 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   -0.2049 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.6632 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.2572 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.0238 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.3587 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1723 if c>=1.0 & x1>=1.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.3489 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   +0.0000 if x1<=0.0 & x2<=0.0\n",
      "   +0.0310 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1442 if x3-x1<=0.0 & x4-x2>=2.0\n",
      "   +0.1446 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.5223 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.3926 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0490 if c>=1.0 & x2>=1.0\n",
      "   +0.2624 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0883 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3767 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.2463 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   -0.2096 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.9626 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.8659 if x4-x2<=0.0\n",
      "   +0.1441 if x3-x1<=2.0\n",
      "   -0.4238 if x2<=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.1147 if x3-x1>=-1.0\n",
      "   +0.4055 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.1154 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.1868 if x1>=1.0 & x2>=3.0 & x3-x1>=1.0\n",
      "   +0.6568 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.1335 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0220 if x4-x2>=0.0\n",
      "   +0.2778 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.2537 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.0302 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.1490 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3400 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.2751 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3586 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2944 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1507 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.3250 if x3-x1>=1.0\n",
      "   -0.1240 if x1>=1.0 & x2>=2.0 & x3-x1>=2.0\n",
      "   +0.3725 if c<=0.0 & x2<=2.0 & x2>=2.0\n",
      "   -0.2619 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0\n",
      "   +1.0079 if c<=0.0 & x1>=3.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.8107 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.7643 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.5300 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2323 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.4084 if x1>=1.0 & x2<=1.0\n",
      "   +0.4369 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.3425 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.5125 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.5010 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.0137 if x1<=2.0\n",
      "   +0.0243 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2018 if x4-x2>=2.0\n",
      "   -0.0294 if c<=0.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   -0.0287 if x4-x2<=2.0\n",
      "   -0.2074 if c<=0.0 & x1>=3.0 & x3-x1>=-1.0\n",
      "   +0.2762 if x1>=3.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "init state [ 3  1 -3 -1  0]\n",
      "(27,) (27,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(81,) (54,)\n",
      "init state [1 1 1 0 0]\n",
      "(91,) (10,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(129,) (38,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(147,) (18,)\n",
      "init state [1 0 1 1 0]\n",
      "(157,) (10,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(174,) (17,)\n",
      "init state [ 1  2  1 -1  0]\n",
      "(188,) (14,)\n",
      "init state [0 1 2 0 0]\n",
      "(193,) (5,)\n",
      "init state [ 2  3  1 -3  0]\n",
      "(208,) (15,)\n",
      "============ 124 ===========\n",
      "Run episode 124 with rewards 27, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   +0.6156 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0605 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.4744 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.3482 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   -0.7217 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.1159 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.4870 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0764 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2943 if c>=1.0 & x1>=1.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.0159 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.0077 if x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0000 if x3-x1<=0.0 & x4-x2>=2.0\n",
      "   +0.2705 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.0196 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.9154 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.4324 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.2443 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3635 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2466 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0287 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3306 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.8185 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.6157 if x4-x2<=0.0\n",
      "   -0.0620 if x3-x1<=2.0\n",
      "   -0.0000 if x2<=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.4111 if x3-x1>=-1.0\n",
      "   +0.6857 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.5913 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.1041 if x1>=1.0 & x2>=3.0 & x3-x1>=1.0\n",
      "   +0.3933 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.6222 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.2777 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.7628 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.0010 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3296 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.0410 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.1671 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.0000 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2573 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0081 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2868 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.1934 if x3-x1>=1.0\n",
      "   +0.0191 if x1>=1.0 & x2>=2.0 & x3-x1>=2.0\n",
      "   +0.8386 if c<=0.0 & x2<=2.0 & x2>=2.0\n",
      "   +0.0426 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0\n",
      "   +0.6196 if c<=0.0 & x1>=3.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4333 if x1>=2.0 & x4-x2<=-3.0\n",
      "----------------- 3 --------------\n",
      "   +0.8467 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.8245 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.8650 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3340 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2822 if x1>=1.0 & x2<=1.0\n",
      "   +0.1931 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.4343 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.4889 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.4158 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.0672 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0000 if x4-x2>=2.0\n",
      "   -0.0774 if c<=0.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.1177 if x4-x2<=2.0\n",
      "   -0.2428 if c<=0.0 & x1>=3.0 & x3-x1>=-1.0\n",
      "   -0.0230 if x1>=3.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4193 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "init state [0 2 0 1 0]\n",
      "(16,) (16,)\n",
      "init state [ 0  3  1 -1  0]\n",
      "(32,) (16,)\n",
      "init state [1 0 2 0 0]\n",
      "(40,) (8,)\n",
      "init state [ 0  2  3 -1  0]\n",
      "(48,) (8,)\n",
      "init state [ 1  3  1 -2  0]\n",
      "(61,) (13,)\n",
      "init state [ 3  2 -1 -1  0]\n",
      "(78,) (17,)\n",
      "init state [0 1 1 1 0]\n",
      "(92,) (14,)\n",
      "init state [ 3  2 -1 -1  0]\n",
      "(100,) (8,)\n",
      "init state [ 3  2 -3  1  0]\n",
      "(114,) (14,)\n",
      "init state [ 3  2 -1  1  0]\n",
      "(118,) (4,)\n",
      "============ 125 ===========\n",
      "Run episode 125 with rewards 38, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   +0.0795 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.4836 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.4097 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0094 if x1<=2.0 & x1>=2.0 & x3-x1<=-1.0\n",
      "   -0.3909 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.0728 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.0484 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.1443 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   +0.1572 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0909 if c>=1.0 & x1>=1.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.0807 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.1392 if x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.2261 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.2275 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.5257 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.1963 if c<=0.0 & x3-x1<=-1.0 & x4-x2>=2.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   +0.2804 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.4022 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4659 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.5922 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1125 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1023 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.7241 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.2708 if x4-x2<=0.0\n",
      "   +0.0543 if x3-x1<=2.0\n",
      "   +0.0716 if x3-x1>=-1.0\n",
      "   +0.5020 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.3699 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.0902 if x1>=1.0 & x2>=3.0 & x3-x1>=1.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2433 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1249 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.2608 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.4859 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.2445 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.4225 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   +0.0513 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2395 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.0132 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0172 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0862 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.0349 if x3-x1>=1.0\n",
      "   +0.0000 if x1>=1.0 & x2>=2.0 & x3-x1>=2.0\n",
      "   +0.5234 if c<=0.0 & x2<=2.0 & x2>=2.0\n",
      "   +0.0756 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0\n",
      "   +0.5353 if c<=0.0 & x1>=3.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=2.0 & x4-x2<=-3.0\n",
      "   -1.1130 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.3620 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.6917 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.3069 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.6750 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5619 if x1>=1.0 & x2<=1.0\n",
      "   -0.2748 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.5984 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.2886 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.5679 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.0152 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0874 if c<=0.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.2534 if x4-x2<=2.0\n",
      "   +0.1113 if c<=0.0 & x1>=3.0 & x3-x1>=-1.0\n",
      "   +0.0497 if x1>=3.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2330 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   -0.3436 if x1>=2.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "init state [ 3  0 -1  2  0]\n",
      "(7,) (7,)\n",
      "init state [ 2  2 -2 -1  0]\n",
      "(44,) (37,)\n",
      "init state [1 0 1 1 0]\n",
      "(56,) (12,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(67,) (11,)\n",
      "init state [ 0  3  1 -1  0]\n",
      "(72,) (5,)\n",
      "init state [ 2  1 -1  2  0]\n",
      "(78,) (6,)\n",
      "init state [ 1  2  2 -2  0]\n",
      "(100,) (22,)\n",
      "init state [2 2 0 1 0]\n",
      "(102,) (2,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(116,) (14,)\n",
      "init state [ 1  0 -1  0  0]\n",
      "(125,) (9,)\n",
      "============ 126 ===========\n",
      "Run episode 126 with rewards 33, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   +0.4380 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.6298 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.4108 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1214 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.1496 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.7011 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.5320 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0359 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0156 if c>=1.0 & x1>=1.0 & x2<=2.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.7947 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.3648 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1388 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   +0.0910 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.0537 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.1224 if c<=0.0 & x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   -0.3063 if x1<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.1102 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.3166 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2880 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3926 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.2314 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.6705 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.3986 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.3412 if x4-x2<=0.0\n",
      "   +0.3393 if x3-x1<=2.0\n",
      "   -0.1024 if x3-x1>=-1.0\n",
      "   +0.6248 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   +0.2692 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.0000 if x1>=1.0 & x2>=3.0 & x3-x1>=1.0\n",
      "   -0.0772 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1569 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.6317 if x2<=2.0 & x3-x1<=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.6589 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.3645 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.3235 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3872 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.2989 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0006 if x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.0007 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0815 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3434 if c>=1.0 & x3-x1>=0.0\n",
      "   +0.5333 if x3-x1>=1.0\n",
      "   +0.6225 if c<=0.0 & x2<=2.0 & x2>=2.0\n",
      "   +0.2300 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.2211 if c<=0.0 & x1>=3.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0755 if x1>=2.0 & x4-x2<=-3.0\n",
      "   -0.5854 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1795 if x3-x1>=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.3080 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.6910 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.5088 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.8127 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2578 if x1>=1.0 & x2<=1.0\n",
      "   -0.0312 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.6502 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0782 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.5285 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.0619 if c<=0.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.3090 if x4-x2<=2.0\n",
      "   -0.3343 if c<=0.0 & x1>=3.0 & x3-x1>=-1.0\n",
      "   +0.0740 if x1>=3.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1591 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   -0.1392 if x1>=2.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.3355 if x1>=3.0 & x2>=1.0 & x4-x2>=1.0\n",
      "init state [0 0 0 3 0]\n",
      "(6,) (6,)\n",
      "init state [0 0 2 0 0]\n",
      "(17,) (11,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(39,) (22,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(46,) (7,)\n",
      "init state [ 1  2  2 -2  0]\n",
      "(99,) (53,)\n",
      "init state [2 2 0 1 0]\n",
      "(101,) (2,)\n",
      "init state [1 0 2 1 0]\n",
      "(139,) (38,)\n",
      "init state [0 1 2 1 0]\n",
      "(152,) (13,)\n",
      "init state [ 0  3  3 -2  0]\n",
      "(168,) (16,)\n",
      "init state [ 3  2 -1  1  0]\n",
      "(173,) (5,)\n",
      "============ 127 ===========\n",
      "Run episode 127 with rewards 37, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   +0.4171 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.7679 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2712 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.0417 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.3297 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.3657 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.1761 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.5042 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.1052 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.2230 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.1161 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.2775 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.0000 if c<=0.0 & x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.0000 if x1<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.2699 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.2875 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.4134 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1865 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4987 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1036 if c<=0.0 & x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3168 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.4548 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.5283 if x4-x2<=0.0\n",
      "   +0.1926 if x3-x1<=2.0\n",
      "   +0.5460 if x3-x1>=-1.0\n",
      "   +0.7609 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   +0.5272 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.2216 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3625 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.5253 if x2<=2.0 & x3-x1<=1.0\n",
      "   +0.6284 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.3160 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.5031 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.0139 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.2899 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.1854 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.1948 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6238 if c>=1.0 & x3-x1>=0.0\n",
      "   +0.0123 if x3-x1>=1.0\n",
      "   +1.0410 if c<=0.0 & x2<=2.0 & x2>=2.0\n",
      "   -0.3888 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.1345 if c<=0.0 & x1>=3.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=2.0 & x4-x2<=-3.0\n",
      "   -0.4311 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4423 if x3-x1>=2.0\n",
      "   -0.2754 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.6453 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.9500 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.6603 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.6947 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.1819 if x1>=1.0 & x2<=1.0\n",
      "   +0.4515 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.2957 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.6796 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.0973 if c<=0.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.3200 if x4-x2<=2.0\n",
      "   -0.2467 if c<=0.0 & x1>=3.0 & x3-x1>=-1.0\n",
      "   +0.0000 if x1>=3.0 & x2<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   -0.2289 if x1>=2.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.2516 if x1>=3.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.2624 if x2>=1.0 & x4-x2>=2.0\n",
      "init state [0 1 2 0 0]\n",
      "(5,) (5,)\n",
      "init state [ 1  2  2 -2  0]\n",
      "(25,) (20,)\n",
      "init state [ 0  3  3 -2  0]\n",
      "(39,) (14,)\n",
      "init state [ 1  3  2 -3  0]\n",
      "(57,) (18,)\n",
      "init state [ 3  1 -1  2  0]\n",
      "(67,) (10,)\n",
      "init state [ 2  2 -1  1  0]\n",
      "(88,) (21,)\n",
      "init state [ 2  1 -2  1  0]\n",
      "(117,) (29,)\n",
      "init state [ 2  3 -1 -2  0]\n",
      "(135,) (18,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(148,) (13,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(166,) (18,)\n",
      "============ 128 ===========\n",
      "Run episode 128 with rewards 24, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   +0.3189 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.5127 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2407 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.2466 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.6207 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.4543 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0348 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3778 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.4202 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1046 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.0343 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.2444 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.2230 if c<=0.0 & x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.0000 if x1<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.1419 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.3623 if x1<=1.0 & x2<=1.0 & x3-x1<=-1.0 & x3-x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.2329 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.5286 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1978 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.6507 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.4511 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.2788 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.3208 if x4-x2<=0.0\n",
      "   -0.1389 if x3-x1<=2.0\n",
      "   +0.0849 if x3-x1>=-1.0\n",
      "   +0.2802 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   +0.1773 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.0641 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2999 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0839 if x2<=2.0 & x3-x1<=1.0\n",
      "   +0.2884 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.5749 if x1>=3.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.4770 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.6181 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.4217 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.0481 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.0353 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.3517 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2532 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3359 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.2599 if x3-x1>=1.0\n",
      "   +0.6500 if c<=0.0 & x2<=2.0 & x2>=2.0\n",
      "   -0.0388 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0\n",
      "   +0.3402 if c<=0.0 & x1>=3.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0915 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0073 if x3-x1>=2.0\n",
      "   -0.0349 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n",
      "   -0.4345 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.7522 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.8821 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1969 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.5589 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.2035 if x1>=1.0 & x2<=1.0\n",
      "   +0.6389 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0853 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0\n",
      "   +0.5428 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.1188 if c<=0.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.5259 if x4-x2<=2.0\n",
      "   -0.2653 if c<=0.0 & x1>=3.0 & x3-x1>=-1.0\n",
      "   -0.1322 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   -0.2618 if x1>=2.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.1537 if x1>=3.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.3290 if x2>=1.0 & x4-x2>=2.0\n",
      "   +0.6168 if c<=0.0 & x1<=2.0 & x2>=3.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "init state [ 2  2  1 -1  0]\n",
      "(8,) (8,)\n",
      "init state [1 1 0 1 0]\n",
      "(14,) (6,)\n",
      "init state [ 2  2 -1  1  0]\n",
      "(32,) (18,)\n",
      "init state [ 3  0 -1  3  0]\n",
      "(42,) (10,)\n",
      "init state [1 1 1 2 0]\n",
      "(46,) (4,)\n",
      "init state [ 0  2  2 -2  0]\n",
      "(68,) (22,)\n",
      "init state [2 1 1 1 0]\n",
      "(73,) (5,)\n",
      "init state [ 1  2  2 -1  0]\n",
      "(78,) (5,)\n",
      "init state [1 2 1 1 0]\n",
      "(86,) (8,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(98,) (12,)\n",
      "============ 129 ===========\n",
      "Run episode 129 with rewards 30, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   +0.4896 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.4580 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3111 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.4872 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.0953 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.6598 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.3625 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1322 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.1328 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.3462 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.3307 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.2690 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.1250 if c<=0.0 & x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   -0.3251 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.2977 if x1<=1.0 & x2<=1.0 & x3-x1<=-1.0 & x3-x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3670 if c<=0.0 & x1>=3.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.1682 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.6055 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2536 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3026 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0976 if c>=1.0 & x3-x1<=0.0\n",
      "   -0.2318 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.4246 if x4-x2<=0.0\n",
      "   +0.0004 if x3-x1<=2.0\n",
      "   +0.1138 if x3-x1>=-1.0\n",
      "   +0.5540 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.2288 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.5338 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0264 if x2<=2.0 & x3-x1<=1.0\n",
      "   +0.2823 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.3377 if x1>=3.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.4968 if x3-x1>=1.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.6704 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2974 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.7910 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.0231 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   +0.1667 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0161 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3611 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2840 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.1316 if x3-x1>=1.0\n",
      "   +0.0001 if c<=0.0 & x2<=2.0 & x2>=2.0\n",
      "   +0.0053 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0\n",
      "   +0.1625 if c<=0.0 & x1>=3.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4409 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0375 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n",
      "   -0.0673 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3688 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.6878 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5558 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.6462 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2458 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.2803 if x1>=1.0 & x2<=1.0\n",
      "   +0.7693 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.5144 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.5531 if c<=0.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.4881 if x4-x2<=2.0\n",
      "   -0.4490 if c<=0.0 & x1>=3.0 & x3-x1>=-1.0\n",
      "   -0.0359 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.0797 if x1>=2.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.2463 if x1>=3.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.3857 if x2>=1.0 & x4-x2>=2.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2>=3.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.3455 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=3.0\n",
      "init state [1 0 2 1 0]\n",
      "(6,) (6,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(15,) (9,)\n",
      "init state [ 0  2  2 -2  0]\n",
      "(27,) (12,)\n",
      "init state [ 2  0 -1  1  0]\n",
      "(35,) (8,)\n",
      "init state [ 0  3  2 -2  0]\n",
      "(63,) (28,)\n",
      "init state [ 3  0 -1  2  0]\n",
      "(73,) (10,)\n",
      "init state [0 0 0 2 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(90,) (17,)\n",
      "init state [ 1  2 -1 -1  0]\n",
      "(109,) (19,)\n",
      "init state [1 0 1 0 0]\n",
      "(118,) (9,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(163,) (45,)\n",
      "============ 130 ===========\n",
      "Run episode 130 with rewards -3, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   +0.3768 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.3870 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0816 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0455 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.5518 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0485 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2216 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.1634 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0559 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.0695 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.4335 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.0893 if c<=0.0 & x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.5659 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.2196 if x1<=1.0 & x2<=1.0 & x3-x1<=-1.0 & x3-x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1>=3.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.4433 if x1<=1.0 & x3-x1>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.2971 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0093 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2182 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.6959 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0479 if c>=1.0 & x3-x1<=0.0\n",
      "   +0.1092 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0033 if x4-x2<=0.0\n",
      "   +0.5858 if x3-x1>=-1.0\n",
      "   +0.7275 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.0362 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.0384 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.5598 if x2<=2.0 & x3-x1<=1.0\n",
      "   +0.2930 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.0021 if x1>=3.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.3353 if x2<=2.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.7350 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.5699 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.1331 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1989 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   +0.1452 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.2729 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1839 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3541 if c>=1.0 & x3-x1>=0.0\n",
      "   +0.5544 if x3-x1>=1.0\n",
      "   -0.1292 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.0258 if c<=0.0 & x1>=3.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.7086 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0301 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n",
      "   +0.1142 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0753 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.6138 if x1<=1.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.7264 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.7635 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.8168 if x1<=2.0 & x4-x2<=0.0\n",
      "   -0.0940 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2471 if x1>=1.0 & x2<=1.0\n",
      "   +0.4233 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.2871 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.0732 if c<=0.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.2880 if x4-x2<=2.0\n",
      "   +0.3470 if c<=0.0 & x1>=3.0 & x3-x1>=-1.0\n",
      "   +0.0656 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.1933 if x1>=2.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1803 if x1>=3.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x2>=1.0 & x4-x2>=2.0\n",
      "   +0.0000 if x2<=0.0 & x3-x1>=1.0 & x4-x2>=3.0\n",
      "   +0.5792 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "init state [1 0 2 2 0]\n",
      "(15,) (15,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(34,) (19,)\n",
      "init state [ 0  3  1 -1  0]\n",
      "(47,) (13,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(75,) (28,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(87,) (12,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(147,) (60,)\n",
      "init state [3 1 0 1 0]\n",
      "(150,) (3,)\n",
      "init state [ 2  3  1 -1  0]\n",
      "(153,) (3,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(172,) (19,)\n",
      "init state [0 1 1 2 0]\n",
      "(192,) (20,)\n",
      "============ 131 ===========\n",
      "Run episode 131 with rewards 22, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.1972 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.1487 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.2497 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1591 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.0222 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0774 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1476 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   +0.1674 if x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.2261 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.1385 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.0898 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.0185 if c<=0.0 & x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.8443 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0000 if x1<=1.0 & x2<=1.0 & x3-x1<=-1.0 & x3-x1<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1291 if x1<=1.0 & x3-x1>=1.0\n",
      "   -0.3140 if c<=0.0 & x1<=1.0 & x4-x2<=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.1016 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0543 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3149 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4350 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0130 if c>=1.0 & x3-x1<=0.0\n",
      "   +0.2245 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0471 if x4-x2<=0.0\n",
      "   +0.3292 if x3-x1>=-1.0\n",
      "   +0.4374 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   +0.2872 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.0670 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1877 if x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0414 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.3802 if x1>=3.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0667 if x2<=2.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.8127 if x2>=3.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.6811 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.3239 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.1217 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.5035 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.1242 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0074 if x2<=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1054 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3158 if c>=1.0 & x3-x1>=0.0\n",
      "   +0.5016 if x3-x1>=1.0\n",
      "   +0.2500 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.3081 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4141 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n",
      "   +0.1682 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3836 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.2015 if x1<=1.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.4685 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.6063 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4950 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.5698 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.1817 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0217 if x1>=1.0 & x2<=1.0\n",
      "   +0.2859 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.2166 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.0668 if c<=0.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.3502 if x4-x2<=2.0\n",
      "   +0.0896 if c<=0.0 & x1>=3.0 & x3-x1>=-1.0\n",
      "   +0.1593 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.3671 if x1>=2.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.1683 if x1>=3.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.1827 if x2>=1.0 & x4-x2>=2.0\n",
      "   +0.1131 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.3219 if c<=0.0 & x4-x2>=2.0\n",
      "init state [2 0 0 2 0]\n",
      "(8,) (8,)\n",
      "init state [1 2 1 0 0]\n",
      "(11,) (3,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(82,) (71,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(161,) (79,)\n",
      "init state [0 0 2 1 0]\n",
      "(173,) (12,)\n",
      "init state [0 1 0 1 0]\n",
      "(199,) (26,)\n",
      "init state [0 1 3 0 0]\n",
      "(217,) (18,)\n",
      "init state [2 1 1 0 0]\n",
      "(225,) (8,)\n",
      "init state [2 1 1 0 0]\n",
      "(238,) (13,)\n",
      "init state [ 1  2 -1  1  0]\n",
      "(283,) (45,)\n",
      "============ 132 ===========\n",
      "Run episode 132 with rewards -3, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.3459 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +1.4880 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +1.7725 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.3573 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.5021 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   +0.0531 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0451 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.0157 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.2790 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.2717 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.0991 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.8431 if c<=0.0 & x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.7844 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.2966 if x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x4-x2<=-1.0\n",
      "   +1.2599 if x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   -0.0114 if x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.4189 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2838 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0453 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.7694 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.4701 if x4-x2<=0.0\n",
      "   +0.5658 if x3-x1>=-1.0\n",
      "   +1.0131 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.1723 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.4909 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2037 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4124 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.2300 if x1>=3.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.3663 if x2<=2.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "   -0.0202 if x2>=3.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -0.8259 if x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.2820 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.3702 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.4013 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.4288 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3085 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0086 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2665 if c>=1.0 & x3-x1>=0.0\n",
      "   +0.3604 if x3-x1>=1.0\n",
      "   -0.2372 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.1750 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0113 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n",
      "   -0.2604 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1212 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.4108 if x1<=1.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.2062 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0574 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.6458 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.7624 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.6248 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.5482 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.3927 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +1.6427 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.0791 if c<=0.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   -0.1670 if x4-x2<=2.0\n",
      "   +0.1711 if c<=0.0 & x1>=3.0 & x3-x1>=-1.0\n",
      "   -0.1005 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   -0.0168 if x1>=2.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.6222 if x1>=3.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.4227 if x2>=1.0 & x4-x2>=2.0\n",
      "   +1.2824 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +1.7320 if c<=0.0 & x4-x2>=2.0\n",
      "   -0.6720 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "init state [0 0 2 2 0]\n",
      "(6,) (6,)\n",
      "init state [ 3  1 -1  2  0]\n",
      "(10,) (4,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(23,) (13,)\n",
      "init state [0 0 3 0 0]\n",
      "(34,) (11,)\n",
      "init state [ 3  1 -3 -1  0]\n",
      "(56,) (22,)\n",
      "init state [1 0 2 1 0]\n",
      "(78,) (22,)\n",
      "init state [ 1  3  0 -3  0]\n",
      "(111,) (33,)\n",
      "init state [ 2  3  1 -3  0]\n",
      "(122,) (11,)\n",
      "init state [0 1 0 2 0]\n",
      "(128,) (6,)\n",
      "init state [ 2  0 -2  1  0]\n",
      "(144,) (16,)\n",
      "============ 133 ===========\n",
      "Run episode 133 with rewards 26, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   +0.4218 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +1.0417 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.7609 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0674 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.5411 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0263 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1402 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.1782 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0818 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.3493 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.0123 if c<=0.0 & x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.1973 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.2927 if x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0000 if x4-x2>=3.0\n",
      "   +0.1296 if c<=0.0 & x1<=1.0 & x4-x2<=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.4805 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4406 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1818 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.2946 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.6769 if x4-x2<=0.0\n",
      "   +0.4662 if x3-x1>=-1.0\n",
      "   +0.8152 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.0786 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.1139 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1907 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4955 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.7521 if x1>=3.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1414 if x2<=2.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.0081 if x2>=3.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -0.2553 if x4-x2>=1.0\n",
      "   +0.0918 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.9573 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.5206 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.0407 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.4519 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3600 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.3000 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.4103 if x3-x1>=1.0\n",
      "   -0.0148 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.1195 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0597 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n",
      "   -0.1819 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1892 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1758 if x1<=1.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.1073 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2018 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0\n",
      "   +0.5554 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.7088 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.2808 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.8959 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.7795 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.6807 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.7404 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.0746 if c<=0.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.4853 if x4-x2<=2.0\n",
      "   +0.3426 if c<=0.0 & x1>=3.0 & x3-x1>=-1.0\n",
      "   +0.1035 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.3308 if x1>=3.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.2108 if x2>=1.0 & x4-x2>=2.0\n",
      "   +0.4795 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.3936 if c<=0.0 & x4-x2>=2.0\n",
      "   -0.0365 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.2281 if c>=1.0 & x3-x1<=-3.0\n",
      "init state [ 3  1 -1  2  0]\n",
      "(4,) (4,)\n",
      "init state [ 2  2  0 -1  0]\n",
      "(10,) (6,)\n",
      "init state [ 0  2  2 -1  0]\n",
      "(19,) (9,)\n",
      "init state [ 2  1 -2  1  0]\n",
      "(28,) (9,)\n",
      "init state [0 1 3 1 0]\n",
      "(45,) (17,)\n",
      "init state [ 3  2 -2 -1  0]\n",
      "(63,) (18,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(75,) (12,)\n",
      "init state [0 0 0 3 0]\n",
      "(82,) (7,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(90,) (8,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(119,) (29,)\n",
      "============ 134 ===========\n",
      "Run episode 134 with rewards 13, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   +0.5122 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.8535 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.7512 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.3057 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.3474 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0583 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1853 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.3278 if x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0774 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   +0.0285 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.1885 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.0406 if c<=0.0 & x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.0727 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0871 if x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0111 if c<=0.0 & x1<=1.0 & x4-x2<=-2.0\n",
      "   +0.2591 if c<=0.0 & x2>=3.0 & x3-x1>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.6098 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2331 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3917 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.3215 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.4917 if x4-x2<=0.0\n",
      "   +0.5489 if x3-x1>=-1.0\n",
      "   +0.5586 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   +0.0000 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.0051 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2995 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1961 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.0560 if x1>=3.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.1996 if x2<=2.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.1358 if x4-x2>=1.0\n",
      "   +0.1411 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.5359 if x1>=3.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.4550 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.3010 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.2416 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3429 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   +0.0683 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.3294 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.5598 if x3-x1>=1.0\n",
      "   +0.1286 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2018 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n",
      "   +0.2960 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1680 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0000 if x1<=1.0 & x2<=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.2059 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1715 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0\n",
      "   -0.0331 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=0.0\n",
      "   -0.3237 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.4967 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4827 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.4785 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.8870 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.6118 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.6914 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.0021 if c<=0.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.3483 if x4-x2<=2.0\n",
      "   -0.0316 if c<=0.0 & x1>=3.0 & x3-x1>=-1.0\n",
      "   +0.1791 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.2675 if x1>=3.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.1619 if x2>=1.0 & x4-x2>=2.0\n",
      "   +0.8599 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.2518 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.1229 if c>=1.0 & x3-x1<=-3.0\n",
      "   -0.4741 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "init state [ 1  2 -1  1  0]\n",
      "(19,) (19,)\n",
      "init state [ 1  1 -1  2  0]\n",
      "(25,) (6,)\n",
      "init state [ 1  2 -1  1  0]\n",
      "(30,) (5,)\n",
      "init state [ 2  1 -1  2  0]\n",
      "(35,) (5,)\n",
      "init state [0 0 0 1 0]\n",
      "(47,) (12,)\n",
      "init state [0 0 1 3 0]\n",
      "(57,) (10,)\n",
      "init state [ 0  2  0 -1  0]\n",
      "(63,) (6,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(74,) (11,)\n",
      "init state [1 0 0 1 0]\n",
      "(81,) (7,)\n",
      "init state [ 3  2 -2 -2  0]\n",
      "(102,) (21,)\n",
      "============ 135 ===========\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 135 with rewards 21, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   +0.4989 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.8439 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.6501 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0461 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.1938 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0420 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   +0.1057 if x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.1745 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.2244 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.2839 if c<=0.0 & x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.7484 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.4351 if x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0781 if c<=0.0 & x2>=3.0 & x3-x1>=1.0\n",
      "   -0.7201 if x1<=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.3411 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.6767 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.5088 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.5531 if x4-x2<=0.0\n",
      "   +0.4378 if x3-x1>=-1.0\n",
      "   +0.9238 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.2654 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1748 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0373 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x1>=3.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x2<=2.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.0746 if x4-x2>=1.0\n",
      "   +0.2649 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   -0.5456 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.6760 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.5237 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.4182 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.2246 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.0815 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.2328 if c>=1.0 & x3-x1>=0.0\n",
      "   +0.5824 if x3-x1>=1.0\n",
      "   -0.1720 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0031 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n",
      "   -0.1349 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1007 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.1506 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=0.0\n",
      "   -0.2038 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=2.0\n",
      "   -0.1176 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.4782 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.6084 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.8691 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.6914 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5818 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.4438 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.1885 if x4-x2<=2.0\n",
      "   +0.0000 if c<=0.0 & x1>=3.0 & x3-x1>=-1.0\n",
      "   +0.1090 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.0000 if x1>=3.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.3152 if x2>=1.0 & x4-x2>=2.0\n",
      "   +0.4438 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.1727 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.2355 if c>=1.0 & x3-x1<=-3.0\n",
      "   +0.3077 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.5488 if c<=0.0 & x1<=1.0 & x1>=1.0 & x3-x1<=0.0 & x4-x2>=2.0\n",
      "init state [ 2  3  0 -2  0]\n",
      "(5,) (5,)\n",
      "init state [ 2  2 -1 -2  0]\n",
      "(50,) (45,)\n",
      "init state [0 1 1 1 0]\n",
      "(57,) (7,)\n",
      "init state [ 2  2 -1 -2  0]\n",
      "(85,) (28,)\n",
      "init state [2 1 1 1 0]\n",
      "(93,) (8,)\n",
      "init state [ 0  1  0 -1  0]\n",
      "(104,) (11,)\n",
      "init state [ 0  3  1 -1  0]\n",
      "(113,) (9,)\n",
      "init state [ 3  0 -1  0  0]\n",
      "(121,) (8,)\n",
      "init state [ 3  2 -1  0  0]\n",
      "(124,) (3,)\n",
      "init state [ 3  0 -1  1  0]\n",
      "(137,) (13,)\n",
      "============ 136 ===========\n",
      "Run episode 136 with rewards 29, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   +0.5371 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.8002 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2207 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1906 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.2299 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.1561 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2690 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.1715 if x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0835 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   +0.1295 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.0000 if c<=0.0 & x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.0981 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1430 if x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0601 if c<=0.0 & x2>=3.0 & x3-x1>=1.0\n",
      "   -0.2621 if x1<=0.0\n",
      "   +0.2056 if c<=0.0 & x1>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.3813 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0574 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.7824 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0474 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.1668 if x4-x2<=0.0\n",
      "   +0.0227 if x3-x1>=-1.0\n",
      "   +0.9224 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.1467 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2134 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0904 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x2<=2.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.1374 if x4-x2>=1.0\n",
      "   +0.1329 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   -0.3778 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2810 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "----------------- 2 --------------\n",
      "   +1.0909 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.9825 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.5711 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.4316 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3238 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.1803 if c>=1.0 & x3-x1>=0.0\n",
      "   +0.2796 if x3-x1>=1.0\n",
      "   -0.4055 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1758 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n",
      "   +0.2367 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2213 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0641 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1211 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0\n",
      "   +0.0028 if c<=0.0 & x1<=1.0 & x1>=1.0 & x2<=2.0\n",
      "   +0.4364 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.1607 if x1<=0.0 & x3-x1>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4095 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.3791 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.3891 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.9325 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5078 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.4483 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.3677 if x4-x2<=2.0\n",
      "   +0.2274 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.1896 if x1>=3.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x2>=1.0 & x4-x2>=2.0\n",
      "   +0.4483 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.0701 if c<=0.0 & x4-x2>=2.0\n",
      "   -0.0251 if c>=1.0 & x3-x1<=-3.0\n",
      "   -0.0950 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x1>=1.0 & x3-x1<=0.0 & x4-x2>=2.0\n",
      "   +0.5532 if x1>=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "init state [ 2  3  0 -3  0]\n",
      "(11,) (11,)\n",
      "init state [1 0 2 2 0]\n",
      "(21,) (10,)\n",
      "init state [ 3  1 -3  2  0]\n",
      "(52,) (31,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(76,) (24,)\n",
      "init state [0 1 1 2 0]\n",
      "(91,) (15,)\n",
      "init state [ 1  3  1 -2  0]\n",
      "(125,) (34,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(137,) (12,)\n",
      "init state [1 2 1 1 0]\n",
      "(197,) (60,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(230,) (33,)\n",
      "init state [ 3  2 -2 -1  0]\n",
      "(237,) (7,)\n",
      "============ 137 ===========\n",
      "Run episode 137 with rewards 35, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   +0.5305 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.9056 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2699 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0116 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.5674 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.1157 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0431 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.3619 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1980 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.1367 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.2218 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.4886 if x1<=1.0 & x3-x1>=1.0\n",
      "   -0.1619 if c<=0.0 & x2>=3.0 & x3-x1>=1.0\n",
      "   -0.2252 if x1<=0.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2<=-2.0\n",
      "   +0.1784 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.8322 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1746 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.9353 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0045 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.7553 if x4-x2<=0.0\n",
      "   +0.6208 if x3-x1>=-1.0\n",
      "   +0.2664 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   +0.0951 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.7333 if x2<=2.0 & x3-x1<=1.0\n",
      "   +0.5113 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.0802 if x4-x2>=1.0\n",
      "   -0.1065 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.0000 if x1>=3.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   +0.2271 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.8759 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +1.2284 if x1<=2.0 & x2>=2.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.6816 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.6927 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.0252 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.6102 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.4237 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.5416 if c>=1.0 & x3-x1>=0.0\n",
      "   +0.2613 if x3-x1>=1.0\n",
      "   +0.4432 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2351 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n",
      "   +0.1950 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0115 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.2076 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0009 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0\n",
      "   +0.3313 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.1644 if x1<=0.0 & x3-x1>=1.0\n",
      "   -0.1213 if x1>=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.8459 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.8012 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.8079 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.7332 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.3902 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.1208 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.2871 if x4-x2<=2.0\n",
      "   +0.2440 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   -0.0978 if x1>=3.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.5488 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.2468 if c<=0.0 & x4-x2>=2.0\n",
      "   -0.2168 if c>=1.0 & x3-x1<=-3.0\n",
      "   +0.7014 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.0997 if c<=0.0 & x1<=1.0 & x1>=1.0 & x3-x1<=0.0 & x4-x2>=2.0\n",
      "   +0.0919 if x1>=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5189 if x1<=0.0 & x2<=0.0\n",
      "init state [ 2  3  0 -1  0]\n",
      "(3,) (3,)\n",
      "init state [2 0 0 2 0]\n",
      "(9,) (6,)\n",
      "init state [ 3  2 -3 -2  0]\n",
      "(35,) (26,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(52,) (17,)\n",
      "init state [ 3  2 -2 -1  0]\n",
      "(79,) (27,)\n",
      "init state [ 2  1 -1 -1  0]\n",
      "(109,) (30,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(117,) (8,)\n",
      "init state [ 2  3 -2 -2  0]\n",
      "(138,) (21,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(146,) (8,)\n",
      "init state [0 1 1 1 0]\n",
      "(153,) (7,)\n",
      "============ 138 ===========\n",
      "Run episode 138 with rewards 35, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   +0.6042 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.9548 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2166 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2558 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.3481 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0500 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0610 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.1858 if x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0977 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   +0.0404 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.3209 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.2372 if x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0342 if c<=0.0 & x2>=3.0 & x3-x1>=1.0\n",
      "   -0.1928 if x1<=0.0\n",
      "   +0.6413 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   +0.5379 if x2>=3.0 & x3-x1<=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.2797 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0579 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4474 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0657 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.2242 if x4-x2<=0.0\n",
      "   +0.4094 if x3-x1>=-1.0\n",
      "   +0.4660 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.0471 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.3673 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1582 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.3161 if x4-x2>=1.0\n",
      "   -0.4927 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.0814 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0109 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +0.4890 if x1<=2.0 & x2>=2.0\n",
      "   +0.8296 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.9826 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.5361 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.2182 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.5459 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3518 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.2362 if c>=1.0 & x3-x1>=0.0\n",
      "   +0.0845 if x3-x1>=1.0\n",
      "   +0.0514 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0624 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n",
      "   +0.1190 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1256 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0037 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0949 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   +0.0958 if x1<=0.0 & x3-x1>=1.0\n",
      "   +0.0000 if x1>=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.2970 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.3457 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5232 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1013 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.4827 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.6241 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.6241 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.1771 if x4-x2<=2.0\n",
      "   +0.1302 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.0000 if x1>=3.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.6241 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.2974 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.0000 if c>=1.0 & x3-x1<=-3.0\n",
      "   +0.3395 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x1>=1.0 & x3-x1<=0.0 & x4-x2>=2.0\n",
      "   +0.1077 if x1<=0.0 & x2<=0.0\n",
      "   +0.2974 if x4-x2>=2.0\n",
      "init state [ 1  3 -1 -3  0]\n",
      "(17,) (17,)\n",
      "init state [ 2  3  1 -3  0]\n",
      "(30,) (13,)\n",
      "init state [ 1  0 -1  0  0]\n",
      "(48,) (18,)\n",
      "init state [1 1 0 2 0]\n",
      "(54,) (6,)\n",
      "init state [1 2 1 1 0]\n",
      "(59,) (5,)\n",
      "init state [ 2  3  0 -1  0]\n",
      "(66,) (7,)\n",
      "init state [0 0 2 0 0]\n",
      "(80,) (14,)\n",
      "init state [0 0 3 2 0]\n",
      "(106,) (26,)\n",
      "init state [1 2 0 1 0]\n",
      "(109,) (3,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(127,) (18,)\n",
      "============ 139 ===========\n",
      "Run episode 139 with rewards 24, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   +0.5226 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.6038 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.5642 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0035 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.0412 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.3101 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0930 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.3959 if x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.1349 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   +0.0506 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.1654 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.5213 if x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0267 if x1<=0.0\n",
      "   -0.0000 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.0030 if x2>=3.0 & x3-x1<=-2.0\n",
      "   -0.3578 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.2321 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3820 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3344 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1091 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.7294 if x4-x2<=0.0\n",
      "   +0.0480 if x3-x1>=-1.0\n",
      "   +0.6034 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.0353 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.5797 if x2<=2.0 & x3-x1<=1.0\n",
      "   +0.5367 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.4864 if x4-x2>=1.0\n",
      "   +0.2543 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.2573 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4438 if x1<=2.0 & x2>=2.0\n",
      "   +0.1837 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "   -0.6749 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.7289 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2418 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.3550 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3299 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3333 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.1107 if c>=1.0 & x3-x1>=0.0\n",
      "   +0.3914 if x3-x1>=1.0\n",
      "   -0.2942 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0469 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0\n",
      "   +0.3071 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5026 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.5266 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1352 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   +0.1221 if x1<=0.0 & x3-x1>=1.0\n",
      "   -0.3637 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.2715 if x1>=1.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.4092 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +1.0992 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.4618 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.4728 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.4690 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.3992 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.3645 if x4-x2<=2.0\n",
      "   +0.2167 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.4518 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.2348 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.0000 if c>=1.0 & x3-x1<=-3.0\n",
      "   +0.0120 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.0980 if c<=0.0 & x1<=1.0 & x1>=1.0 & x3-x1<=0.0 & x4-x2>=2.0\n",
      "   +0.3735 if x1<=0.0 & x2<=0.0\n",
      "   +0.2348 if x4-x2>=2.0\n",
      "   +0.2165 if x2<=0.0 & x3-x1<=-1.0 & x3-x1<=-2.0\n",
      "init state [ 3  2  0 -2  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(20,) (20,)\n",
      "init state [1 0 1 2 0]\n",
      "(29,) (9,)\n",
      "init state [ 3  1 -3 -1  0]\n",
      "(55,) (26,)\n",
      "init state [1 2 1 1 0]\n",
      "(60,) (5,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(72,) (12,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(94,) (22,)\n",
      "init state [ 3  1 -2  1  0]\n",
      "(112,) (18,)\n",
      "init state [0 0 0 2 0]\n",
      "(123,) (11,)\n",
      "init state [1 1 0 1 0]\n",
      "(127,) (4,)\n",
      "init state [2 2 1 0 0]\n",
      "(129,) (2,)\n",
      "============ 140 ===========\n",
      "Run episode 140 with rewards 40, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.2396 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.2320 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.6023 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.3907 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   +0.2262 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.1483 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1224 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   +0.1055 if x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.2333 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   +0.1806 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.7583 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.5766 if x1<=1.0 & x3-x1>=1.0\n",
      "   +0.2009 if x1<=0.0\n",
      "   -0.1372 if x2>=3.0 & x3-x1<=-2.0\n",
      "   -0.0862 if x1>=1.0 & x1>=2.0 & x2<=0.0 & x3-x1>=1.0\n",
      "   +0.8206 if x1<=0.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.2129 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4486 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4243 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1069 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.6148 if x4-x2<=0.0\n",
      "   -0.2212 if x3-x1>=-1.0\n",
      "   +0.9554 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.0966 if x2<=2.0 & x3-x1<=1.0\n",
      "   +0.2858 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.4849 if x4-x2>=1.0\n",
      "   +0.0401 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.2474 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6473 if x1<=2.0 & x2>=2.0\n",
      "   -0.0111 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "   +0.2165 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.3340 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.8200 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2900 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.3081 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1435 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.1656 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.3254 if c>=1.0 & x3-x1>=0.0\n",
      "   +0.2201 if x3-x1>=1.0\n",
      "   -0.3375 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1118 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1427 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1178 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2299 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   +0.0366 if x1<=0.0 & x3-x1>=1.0\n",
      "   -0.0422 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.0592 if x1>=1.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.3641 if c<=0.0 & x2<=1.0 & x3-x1>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.5901 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.2244 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.6624 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.6773 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.4506 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.3784 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.7993 if x4-x2<=2.0\n",
      "   +0.1398 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.3784 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.0979 if c<=0.0 & x4-x2>=2.0\n",
      "   -0.4816 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.0000 if c<=0.0 & x1<=1.0 & x1>=1.0 & x3-x1<=0.0 & x4-x2>=2.0\n",
      "   -0.4720 if x1<=0.0 & x2<=0.0\n",
      "   -0.0979 if x4-x2>=2.0\n",
      "   +0.0808 if x2<=0.0 & x3-x1<=-1.0 & x3-x1<=-2.0\n",
      "   +0.3946 if x1>=1.0 & x4-x2>=2.0\n",
      "init state [ 3  1 -2  1  0]\n",
      "(23,) (23,)\n",
      "init state [1 1 1 0 0]\n",
      "(31,) (8,)\n",
      "init state [ 0  1  3 -1  0]\n",
      "(45,) (14,)\n",
      "init state [ 1  3  0 -2  0]\n",
      "(55,) (10,)\n",
      "init state [ 2  0 -1  2  0]\n",
      "(94,) (39,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(124,) (30,)\n",
      "init state [ 2  3 -2 -2  0]\n",
      "(137,) (13,)\n",
      "init state [0 0 2 0 0]\n",
      "(191,) (54,)\n",
      "init state [1 1 2 0 0]\n",
      "(201,) (10,)\n",
      "init state [ 3  1 -3 -1  0]\n",
      "(214,) (13,)\n",
      "============ 141 ===========\n",
      "Run episode 141 with rewards 29, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.0799 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.6889 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0895 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0306 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.1396 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0749 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1890 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   +0.1896 if x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.3069 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   +0.4296 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.7962 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0099 if x1<=1.0 & x3-x1>=1.0\n",
      "   +0.4212 if x1<=0.0\n",
      "   +0.0219 if x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.0234 if x1<=0.0 & x4-x2>=2.0\n",
      "   +0.4574 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.4056 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2790 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0835 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0088 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.3831 if x4-x2<=0.0\n",
      "   +0.1390 if x3-x1>=-1.0\n",
      "   +0.9035 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.1743 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0189 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.2251 if x4-x2>=1.0\n",
      "   +0.2627 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.4326 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2709 if x1<=2.0 & x2>=2.0\n",
      "   -0.0603 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.0961 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.1679 if x1<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "----------------- 2 --------------\n",
      "   +1.1062 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.6183 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.2340 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.2981 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.2327 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.2082 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.2699 if x3-x1>=1.0\n",
      "   -0.3388 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.4273 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.8076 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.2668 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2060 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.2396 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.2140 if x1>=1.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.1714 if c<=0.0 & x2<=1.0 & x3-x1>=-1.0\n",
      "   -0.4751 if x2<=1.0 & x2>=1.0 & x3-x1>=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.7525 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4917 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.8212 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.7051 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5651 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.5651 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.5600 if x4-x2<=2.0\n",
      "   -0.0001 if c>=1.0 & x1<=2.0 & x2<=1.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.5651 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.2285 if c<=0.0 & x4-x2>=2.0\n",
      "   -0.2968 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.0219 if x1<=0.0 & x2<=0.0\n",
      "   +0.2285 if x4-x2>=2.0\n",
      "   +0.0048 if x2<=0.0 & x3-x1<=-1.0 & x3-x1<=-2.0\n",
      "   +0.2028 if x1>=1.0 & x4-x2>=2.0\n",
      "   +0.2611 if x2<=1.0 & x3-x1<=1.0 & x3-x1>=-2.0\n",
      "init state [ 1  2  0 -1  0]\n",
      "(7,) (7,)\n",
      "init state [2 1 1 0 0]\n",
      "(15,) (8,)\n",
      "init state [0 1 1 1 0]\n",
      "(22,) (7,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(53,) (31,)\n",
      "init state [0 1 2 0 0]\n",
      "(68,) (15,)\n",
      "init state [ 2  2  1 -1  0]\n",
      "(72,) (4,)\n",
      "init state [0 1 2 1 0]\n",
      "(82,) (10,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(98,) (16,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(134,) (36,)\n",
      "init state [0 2 1 0 0]\n",
      "(143,) (9,)\n",
      "============ 142 ===========\n",
      "Run episode 142 with rewards 33, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.2354 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.4591 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.0536 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2102 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.1588 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.1709 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1020 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.1372 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1936 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.1727 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.4028 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.6069 if x1<=0.0\n",
      "   -0.1347 if x2>=3.0 & x3-x1<=-2.0\n",
      "   -0.0454 if x1<=0.0 & x4-x2>=2.0\n",
      "   -0.0056 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.5932 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.1947 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2556 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0280 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.2987 if x4-x2<=0.0\n",
      "   +0.0514 if x3-x1>=-1.0\n",
      "   +0.5854 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.0762 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0593 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.0118 if x4-x2>=1.0\n",
      "   +0.2195 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   +0.0444 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.5955 if x1<=2.0 & x2>=2.0\n",
      "   +0.1765 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.2994 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0696 if x1<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.4663 if c>=1.0 & x2>=3.0 & x3-x1<=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +1.0100 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.9633 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   +0.0134 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.4323 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.2815 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.3233 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.4267 if x3-x1>=1.0\n",
      "   -0.3332 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0152 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0690 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.7462 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2418 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.1759 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.2532 if x1>=1.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.0523 if x2<=1.0 & x2>=1.0 & x3-x1>=2.0\n",
      "   +0.3154 if x1<=1.0 & x2<=2.0 & x3-x1>=0.0 & x3-x1>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3310 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.4242 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.2812 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2490 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.4208 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.3358 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.5945 if x4-x2<=2.0\n",
      "   +0.5918 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.2241 if c<=0.0 & x4-x2>=2.0\n",
      "   -0.0658 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.2653 if x1<=0.0 & x2<=0.0\n",
      "   +0.2241 if x4-x2>=2.0\n",
      "   +0.0236 if x2<=0.0 & x3-x1<=-1.0 & x3-x1<=-2.0\n",
      "   +0.0518 if x1>=1.0 & x4-x2>=2.0\n",
      "   +0.6607 if x2<=1.0 & x3-x1<=1.0 & x3-x1>=-2.0\n",
      "   +0.0517 if x1>=3.0 & x4-x2>=2.0\n",
      "init state [ 1  3 -1 -2  0]\n",
      "(29,) (29,)\n",
      "init state [1 1 0 1 0]\n",
      "(34,) (5,)\n",
      "init state [ 1  2  1 -1  0]\n",
      "(43,) (9,)\n",
      "init state [0 0 0 1 0]\n",
      "(54,) (11,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(63,) (9,)\n",
      "init state [ 2  2 -1 -2  0]\n",
      "(80,) (17,)\n",
      "init state [0 1 3 0 0]\n",
      "(93,) (13,)\n",
      "init state [1 2 0 1 0]\n",
      "(100,) (7,)\n",
      "init state [ 1  1 -1  2  0]\n",
      "(110,) (10,)\n",
      "init state [0 0 1 1 0]\n",
      "(116,) (6,)\n",
      "============ 143 ===========\n",
      "Run episode 143 with rewards 36, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   +0.4826 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.8829 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3098 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0107 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.2617 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.1258 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0330 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.3135 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.4992 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.4320 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.4038 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.3749 if x1<=0.0\n",
      "   -0.2116 if x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.0000 if x1<=0.0 & x4-x2>=2.0\n",
      "   +0.3199 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.3604 if x3-x1>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.6152 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2315 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0335 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0131 if x4-x2<=0.0\n",
      "   +0.3626 if x3-x1>=-1.0\n",
      "   +0.7184 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.2375 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.6130 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.0831 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.1374 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.9097 if x1<=2.0 & x2>=2.0\n",
      "   -0.1851 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1629 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0297 if x1<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.3545 if c>=1.0 & x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.5015 if x1<=0.0 & x2<=2.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.7836 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.6371 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.5657 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.1839 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.3955 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.4737 if x3-x1>=1.0\n",
      "   +0.0120 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1543 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0076 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.3030 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0336 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.3484 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.1132 if x1>=1.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.1357 if x2<=1.0 & x2>=1.0 & x3-x1>=2.0\n",
      "   +0.0022 if x1<=1.0 & x2<=2.0 & x3-x1>=0.0 & x3-x1>=1.0\n",
      "   -0.1542 if x3-x1>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.5629 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.6157 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1903 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.5299 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.1601 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.1601 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.3680 if x4-x2<=2.0\n",
      "   +0.3283 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.0813 if c<=0.0 & x4-x2>=2.0\n",
      "   -0.1694 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.4608 if x1<=0.0 & x2<=0.0\n",
      "   +0.0813 if x4-x2>=2.0\n",
      "   +0.0813 if x1>=1.0 & x4-x2>=2.0\n",
      "   +0.8593 if x2<=1.0 & x3-x1<=1.0 & x3-x1>=-2.0\n",
      "   +0.0000 if x1>=3.0 & x4-x2>=2.0\n",
      "   -0.1682 if x2<=0.0 & x3-x1>=2.0\n",
      "init state [2 0 1 2 0]\n",
      "(9,) (9,)\n",
      "init state [1 0 0 2 0]\n",
      "(18,) (9,)\n",
      "init state [ 3  2 -3  1  0]\n",
      "(31,) (13,)\n",
      "init state [ 3  2 -2 -2  0]\n",
      "(52,) (21,)\n",
      "init state [1 0 0 3 0]\n",
      "(60,) (8,)\n",
      "init state [3 0 0 2 0]\n",
      "(64,) (4,)\n",
      "init state [ 1  3  1 -2  0]\n",
      "(71,) (7,)\n",
      "init state [ 2  3 -1 -1  0]\n",
      "(82,) (11,)\n",
      "init state [0 0 2 2 0]\n",
      "(90,) (8,)\n",
      "init state [ 2  3 -1 -1  0]\n",
      "(99,) (9,)\n",
      "============ 144 ===========\n",
      "Run episode 144 with rewards 33, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   +0.3956 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.8802 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3859 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0369 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.4045 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0711 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1020 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.3631 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.3796 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.4432 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.6248 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0746 if x1<=0.0\n",
      "   +0.0053 if x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.0000 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   +0.3701 if x3-x1<=0.0 & x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.2458 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2912 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1641 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.2844 if x3-x1>=-1.0\n",
      "   +0.6737 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.0694 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1144 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.1970 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.2889 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6538 if x1<=2.0 & x2>=2.0\n",
      "   +0.3186 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.4535 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.2133 if x1<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0071 if c>=1.0 & x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.5244 if x1<=0.0 & x2<=2.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.3392 if x2>=3.0 & x3-x1>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.4558 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.8279 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.3476 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.0969 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.2249 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.3269 if x3-x1>=1.0\n",
      "   -0.3425 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0626 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4788 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0390 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1011 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.3881 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.0046 if x1>=1.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.0770 if x2<=1.0 & x2>=1.0 & x3-x1>=2.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   +0.0305 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4782 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.1605 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0062 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3213 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5433 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.3528 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.7112 if x4-x2<=2.0\n",
      "   +0.0406 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.0837 if c<=0.0 & x4-x2>=2.0\n",
      "   -0.1670 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.2370 if x1<=0.0 & x2<=0.0\n",
      "   -0.0837 if x4-x2>=2.0\n",
      "   +0.2296 if x1>=1.0 & x4-x2>=2.0\n",
      "   +0.3608 if x2<=1.0 & x3-x1<=1.0 & x3-x1>=-2.0\n",
      "   +0.0397 if x2<=0.0 & x3-x1>=2.0\n",
      "   +0.1521 if x1<=2.0 & x3-x1<=1.0 & x4-x2>=2.0\n",
      "init state [ 0  2  1 -1  0]\n",
      "(6,) (6,)\n",
      "init state [ 1  3  0 -2  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(28,) (22,)\n",
      "init state [1 1 2 1 0]\n",
      "(45,) (17,)\n",
      "init state [ 2  0 -1  1  0]\n",
      "(57,) (12,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(71,) (14,)\n",
      "init state [2 0 1 1 0]\n",
      "(76,) (5,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(123,) (47,)\n",
      "init state [2 0 1 2 0]\n",
      "(129,) (6,)\n",
      "init state [2 1 1 1 0]\n",
      "(132,) (3,)\n",
      "init state [ 1  1 -1  1  0]\n",
      "(140,) (8,)\n",
      "============ 145 ===========\n",
      "Run episode 145 with rewards 34, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   +0.1741 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.8828 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0741 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0799 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.3988 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.1418 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2300 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.3505 if x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.2173 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.3136 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.3077 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0229 if x1<=0.0\n",
      "   -0.0926 if x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.2136 if x3-x1>=3.0\n",
      "   -0.0000 if x3-x1<=0.0 & x4-x2>=3.0\n",
      "   +0.1925 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.1026 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1183 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.6067 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1525 if x3-x1>=-1.0\n",
      "   +0.5809 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.0032 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4307 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.1778 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.2242 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3841 if x1<=2.0 & x2>=2.0\n",
      "   +0.6273 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1432 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.2706 if x1<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.3306 if x1<=0.0 & x2<=2.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1892 if x2>=3.0 & x3-x1>=2.0\n",
      "   +0.4277 if x2<=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.8048 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.7144 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.5412 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3712 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.3928 if c>=1.0 & x3-x1>=0.0\n",
      "   +0.0552 if x3-x1>=1.0\n",
      "   -0.7917 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.4816 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1481 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.1564 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2827 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.7756 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.0812 if x1>=1.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.2303 if x2<=1.0 & x2>=1.0 & x3-x1>=2.0\n",
      "   +0.0921 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.2119 if x4-x2>=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.5537 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5201 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.4853 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2880 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.3834 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.2830 if x4-x2<=2.0\n",
      "   +0.3421 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.1824 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.3217 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.0294 if x1<=0.0 & x2<=0.0\n",
      "   +0.1824 if x4-x2>=2.0\n",
      "   +0.2807 if x1>=1.0 & x4-x2>=2.0\n",
      "   +0.7003 if x2<=1.0 & x3-x1<=1.0 & x3-x1>=-2.0\n",
      "   +0.0390 if x2<=0.0 & x3-x1>=2.0\n",
      "   +0.1433 if x1<=2.0 & x3-x1<=1.0 & x4-x2>=2.0\n",
      "   -0.3090 if x2<=0.0 & x3-x1>=0.0\n",
      "init state [0 1 2 0 0]\n",
      "(14,) (14,)\n",
      "init state [ 0  2  2 -2  0]\n",
      "(47,) (33,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(57,) (10,)\n",
      "init state [ 3  2 -1  0  0]\n",
      "(62,) (5,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(68,) (6,)\n",
      "init state [ 1  0 -1  1  0]\n",
      "(80,) (12,)\n",
      "init state [ 3  2 -1 -1  0]\n",
      "(87,) (7,)\n",
      "init state [1 0 2 2 0]\n",
      "(94,) (7,)\n",
      "init state [0 2 2 1 0]\n",
      "(100,) (6,)\n",
      "init state [1 1 1 0 0]\n",
      "(104,) (4,)\n",
      "============ 146 ===========\n",
      "Run episode 146 with rewards 38, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   +0.4496 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.7380 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2112 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2213 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.7863 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.1844 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1510 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.3273 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1874 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.1278 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.1025 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1092 if x1<=0.0\n",
      "   -0.0273 if x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   +0.5036 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.1965 if x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.0844 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1263 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1598 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.4219 if x3-x1>=-1.0\n",
      "   +0.5442 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   +0.2546 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.0969 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.1492 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6495 if x1<=2.0 & x2>=2.0\n",
      "   +0.0708 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.6767 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.5155 if x1<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0541 if x1<=0.0 & x2<=2.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.2997 if x2>=3.0 & x3-x1>=2.0\n",
      "   +0.0129 if x2<=2.0 & x3-x1<=1.0 & x3-x1<=2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.3623 if x1<=1.0 & x1>=1.0 & x2>=2.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.7080 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.4082 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.2756 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.4174 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.1031 if c>=1.0 & x3-x1>=0.0\n",
      "   +0.0398 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2997 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0416 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.1489 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1692 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.0765 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.4013 if x1>=1.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.1043 if x2<=1.0 & x2>=1.0 & x3-x1>=2.0\n",
      "   -0.0249 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.1619 if x4-x2>=2.0\n",
      "   +0.3547 if c<=0.0 & x2>=3.0 & x3-x1>=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.5201 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5430 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.5498 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.6501 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.5032 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.1163 if x4-x2<=2.0\n",
      "   +0.4265 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.4091 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.0667 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.4091 if x4-x2>=2.0\n",
      "   +0.1785 if x1>=1.0 & x4-x2>=2.0\n",
      "   +0.1623 if x2<=1.0 & x3-x1<=1.0 & x3-x1>=-2.0\n",
      "   -0.0440 if x2<=0.0 & x3-x1>=2.0\n",
      "   +0.0000 if x1<=2.0 & x3-x1<=1.0 & x4-x2>=2.0\n",
      "   -0.2236 if x2<=0.0 & x3-x1>=0.0\n",
      "   -0.2331 if x3-x1>=-1.0 & x4-x2<=1.0\n",
      "init state [ 2  3  1 -2  0]\n",
      "(13,) (13,)\n",
      "init state [ 1  0 -1  0  0]\n",
      "(30,) (17,)\n",
      "init state [ 3  1 -1  2  0]\n",
      "(36,) (6,)\n",
      "init state [ 2  3 -2 -2  0]\n",
      "(67,) (31,)\n",
      "init state [ 1  3  0 -3  0]\n",
      "(84,) (17,)\n",
      "init state [ 0  2  1 -1  0]\n",
      "(116,) (32,)\n",
      "init state [ 1  3  1 -2  0]\n",
      "(126,) (10,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(137,) (11,)\n",
      "init state [0 0 1 3 0]\n",
      "(155,) (18,)\n",
      "init state [1 0 1 0 0]\n",
      "(175,) (20,)\n",
      "============ 147 ===========\n",
      "Run episode 147 with rewards 22, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   +0.3839 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +1.1398 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.2118 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.3710 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.3776 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0645 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   +0.2414 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.3022 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.1219 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.4929 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.2569 if x1<=0.0\n",
      "   -0.0204 if x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.5831 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.0204 if x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.4009 if x1>=3.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.1763 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1132 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3617 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.5614 if x3-x1>=-1.0\n",
      "   +0.1879 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   +0.1679 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.0196 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.0140 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4146 if x1<=2.0 & x2>=2.0\n",
      "   +0.4976 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.3570 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.4173 if x1<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0750 if x1<=0.0 & x2<=2.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1>=2.0\n",
      "   +0.1427 if x1<=1.0 & x1>=1.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.8084 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.9217 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1509 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.2412 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.2866 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0928 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.4428 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3626 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1428 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0946 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6006 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.2028 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.0027 if x1>=1.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.0993 if x2<=1.0 & x2>=1.0 & x3-x1>=2.0\n",
      "   -0.0672 if x4-x2>=2.0\n",
      "   +0.0000 if c<=0.0 & x2>=3.0 & x3-x1>=2.0\n",
      "   -0.1818 if x1<=1.0 & x1>=1.0 & x2>=3.0 & x3-x1>=1.0 & x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.4182 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.8045 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.5555 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2683 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.2383 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.0559 if x4-x2<=2.0\n",
      "   +0.2383 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.0226 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.2709 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.0226 if x4-x2>=2.0\n",
      "   -0.0215 if x1>=1.0 & x4-x2>=2.0\n",
      "   +0.5158 if x2<=1.0 & x3-x1<=1.0 & x3-x1>=-2.0\n",
      "   +0.0000 if x2<=0.0 & x3-x1>=2.0\n",
      "   +0.2296 if x2<=0.0 & x3-x1>=0.0\n",
      "   -0.3481 if x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0188 if x1<=0.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "init state [1 1 1 0 0]\n",
      "(9,) (9,)\n",
      "init state [1 0 0 1 0]\n",
      "(14,) (5,)\n",
      "init state [0 1 2 0 0]\n",
      "(25,) (11,)\n",
      "init state [1 0 1 1 0]\n",
      "(43,) (18,)\n",
      "init state [ 2  3 -1  0  0]\n",
      "(56,) (13,)\n",
      "init state [ 0  3  2 -3  0]\n",
      "(69,) (13,)\n",
      "init state [ 1  3 -1 -1  0]\n",
      "(85,) (16,)\n",
      "init state [ 2  1 -1 -1  0]\n",
      "(94,) (9,)\n",
      "init state [1 2 2 0 0]\n",
      "(99,) (5,)\n",
      "init state [ 0  2  2 -1  0]\n",
      "(105,) (6,)\n",
      "============ 148 ===========\n",
      "Run episode 148 with rewards 36, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   +0.3396 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.6958 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.6805 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0525 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.2538 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   +0.3298 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.0355 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.7041 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.3083 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.1753 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1059 if x1<=0.0\n",
      "   +0.4135 if x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.4177 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.2273 if x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.0000 if x1>=3.0 & x4-x2>=2.0\n",
      "   -0.0495 if x3-x1>=1.0 & x4-x2<=-3.0\n",
      "----------------- 1 --------------\n",
      "   +0.2058 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3344 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3316 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.8830 if x3-x1>=-1.0\n",
      "   +0.2791 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.0112 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.0438 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.1349 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2730 if x1<=2.0 & x2>=2.0\n",
      "   -0.3968 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.5477 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.3776 if x1<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.2246 if x1<=0.0 & x2<=2.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.2834 if x1<=1.0 & x1>=1.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.3685 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2393 if x3-x1>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.6460 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2393 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.2268 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.5555 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.0797 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.2705 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3412 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0563 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.1507 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2215 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.1831 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.5422 if x1>=1.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.2257 if x2<=1.0 & x2>=1.0 & x3-x1>=2.0\n",
      "   +0.0000 if x4-x2>=2.0\n",
      "   -0.0689 if x1<=1.0 & x1>=1.0 & x2>=3.0 & x3-x1>=1.0 & x4-x2<=-2.0\n",
      "   -0.1807 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4191 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.8552 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.8448 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2878 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.2878 if c<=0.0 & x4-x2>=1.0\n",
      "   -0.1253 if x4-x2<=2.0\n",
      "   +0.2878 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.1637 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x4-x2>=2.0\n",
      "   +0.0000 if x1>=1.0 & x4-x2>=2.0\n",
      "   +0.2983 if x2<=1.0 & x3-x1<=1.0 & x3-x1>=-2.0\n",
      "   +0.3423 if x2<=0.0 & x3-x1>=0.0\n",
      "   -0.1203 if x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.1307 if x1<=0.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.3362 if x2>=2.0 & x4-x2<=0.0\n",
      "init state [ 1  3  1 -2  0]\n",
      "(7,) (7,)\n",
      "init state [ 1  3  2 -1  0]\n",
      "(14,) (7,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(52,) (38,)\n",
      "init state [1 0 0 3 0]\n",
      "(71,) (19,)\n",
      "init state [0 1 1 2 0]\n",
      "(83,) (12,)\n",
      "init state [1 2 0 1 0]\n",
      "(86,) (3,)\n",
      "init state [1 0 2 2 0]\n",
      "(104,) (18,)\n",
      "init state [0 0 1 1 0]\n",
      "(114,) (10,)\n",
      "init state [ 0  1  0 -1  0]\n",
      "(122,) (8,)\n",
      "init state [1 0 0 2 0]\n",
      "(131,) (9,)\n",
      "============ 149 ===========\n",
      "Run episode 149 with rewards 33, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   +0.2801 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.2830 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.1609 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.2786 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.3886 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   +0.1272 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.2406 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.0990 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.2888 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.1437 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.4316 if x1<=0.0\n",
      "   -0.1806 if x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.1267 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.3146 if x1>=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.0000 if x3-x1>=1.0 & x4-x2<=-3.0\n",
      "   +0.6724 if c<=0.0 & x1>=1.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.0625 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3572 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3595 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.4485 if x3-x1>=-1.0\n",
      "   +0.6524 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.0661 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.3933 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4356 if x1<=2.0 & x2>=2.0\n",
      "   -0.1166 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.2356 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0511 if x1<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.2723 if x1<=0.0 & x2<=2.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.2152 if x1<=1.0 & x1>=1.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.3626 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2412 if x3-x1>=2.0\n",
      "   +0.6260 if c<=0.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.6077 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.5028 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.4006 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.3393 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.3731 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.4603 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.6628 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0633 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.1131 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1353 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.1720 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.2477 if x1>=1.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.0479 if x2<=1.0 & x2>=1.0 & x3-x1>=2.0\n",
      "   -0.1839 if x1<=1.0 & x1>=1.0 & x2>=3.0 & x3-x1>=1.0 & x4-x2<=-2.0\n",
      "   -0.4424 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1165 if x3-x1>=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.3128 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.5824 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.8029 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.4043 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.3656 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.2423 if x4-x2<=2.0\n",
      "   +0.5421 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.0782 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.0017 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   +0.0782 if x4-x2>=2.0\n",
      "   +0.4234 if x2<=1.0 & x3-x1<=1.0 & x3-x1>=-2.0\n",
      "   +0.0532 if x2<=0.0 & x3-x1>=0.0\n",
      "   -0.1438 if x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.1622 if x1<=0.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.4901 if x2>=2.0 & x4-x2<=0.0\n",
      "   -0.1277 if x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "\n",
      "Done\n"
     ]
    }
   ],
   "source": [
    "rewards = train()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "39cee1c7",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "id": "3d20e8e0",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "------------------------\n",
      "   +0.3956 if c<=0.0 & x1>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.8802 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   +0.3859 if c<=0.0 & x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.0369 if c<=0.0 & x2>=1.0 & x4-x2>=1.0\n",
      "   -0.4045 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0711 if x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1020 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.3631 if x2>=3.0 & x4-x2<=-1.0\n",
      "   -0.3796 if c<=0.0 & x1<=1.0 & x2<=2.0\n",
      "   -0.4432 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.6248 if c<=0.0 & x1<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0746 if x1<=0.0\n",
      "   +0.0053 if x2>=3.0 & x3-x1<=-2.0\n",
      "   +0.0000 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   +0.3701 if x3-x1<=0.0 & x4-x2>=3.0\n",
      "------------------------\n",
      "   +0.2458 if c<=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2912 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1641 if x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.2844 if x3-x1>=-1.0\n",
      "   +0.6737 if c>=1.0 & x1<=2.0 & x1>=1.0\n",
      "   -0.0694 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1144 if x1>=1.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.1970 if x3-x1<=-2.0 & x3-x1>=-2.0\n",
      "   -0.2889 if c<=0.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6538 if x1<=2.0 & x2>=2.0\n",
      "   +0.3186 if c<=0.0 & x1>=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.4535 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.2133 if x1<=2.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0071 if c>=1.0 & x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.5244 if x1<=0.0 & x2<=2.0 & x3-x1<=2.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.3392 if x2>=3.0 & x3-x1>=2.0\n",
      "------------------------\n",
      "   +0.4558 if c<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.8279 if c<=0.0 & x2>=1.0 & x4-x2<=1.0\n",
      "   -0.3476 if c>=1.0 & x1<=2.0 & x3-x1<=1.0\n",
      "   -0.0969 if c>=1.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "   -0.2249 if c>=1.0 & x3-x1>=0.0\n",
      "   -0.3269 if x3-x1>=1.0\n",
      "   -0.3425 if c<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0626 if x1<=2.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4788 if x1>=2.0 & x2>=3.0 & x4-x2<=-1.0\n",
      "   +0.0390 if x1<=0.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1011 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-2.0\n",
      "   -0.3881 if c<=0.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.0046 if x1>=1.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.0770 if x2<=1.0 & x2>=1.0 & x3-x1>=2.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   +0.0305 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0\n",
      "------------------------\n",
      "   +0.4782 if c>=1.0 & x1>=3.0 & x4-x2<=0.0\n",
      "   +0.1605 if c>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0062 if x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3213 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5433 if x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.3528 if c<=0.0 & x4-x2>=1.0\n",
      "   +0.7112 if x4-x2<=2.0\n",
      "   +0.0406 if c<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.0837 if c<=0.0 & x4-x2>=2.0\n",
      "   -0.1670 if x1<=2.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=-2.0\n",
      "   -0.2370 if x1<=0.0 & x2<=0.0\n",
      "   -0.0837 if x4-x2>=2.0\n",
      "   +0.2296 if x1>=1.0 & x4-x2>=2.0\n",
      "   +0.3608 if x2<=1.0 & x3-x1<=1.0 & x3-x1>=-2.0\n",
      "   +0.0397 if x2<=0.0 & x3-x1>=2.0\n",
      "   +0.1521 if x1<=2.0 & x3-x1<=1.0 & x4-x2>=2.0\n"
     ]
    }
   ],
   "source": [
    "for i in range(4):\n",
    "    print('------------------------')\n",
    "    print(actor.best_model[i].rules_)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "id": "0b443f87",
   "metadata": {},
   "outputs": [],
   "source": [
    "def test(num_test_episodes=100):\n",
    "    \"\"\"\n",
    "    Test the learned policy using the trained actor model.\n",
    "\n",
    "    Args:\n",
    "        num_test_episodes (int): Number of episodes to test the model.\n",
    "\n",
    "    Returns:\n",
    "        float: Average reward over the test episodes.\n",
    "    \"\"\"\n",
    "    total_reward = 0\n",
    "\n",
    "    for episode in range(num_test_episodes):\n",
    "        state = env.reset()[0]  # Reset the environment and get the initial state\n",
    "        episode_reward = 0\n",
    "\n",
    "        for t in range(1, 100):  # Limit the number of time steps\n",
    "            # Convert state to tensor and predict action probabilities\n",
    "            #             state_tensor = torch.tensor(state, dtype=torch.float32).to(device)\n",
    "            action_probs = actor.predict(pd.DataFrame(np.array([state]), columns=column_names))\n",
    "            # Select action based on the highest probability\n",
    "            action = np.argmax(action_probs)\n",
    "            # Take the chosen action\n",
    "            next_state, reward, done, trunc, _ = env.step(action)\n",
    "            # Accumulate reward\n",
    "            episode_reward += reward\n",
    "            if done or trunc:\n",
    "                break\n",
    "            # Update state\n",
    "            state = next_state\n",
    "        total_reward += episode_reward\n",
    "        print(f\"Test Episode {episode + 1}, Reward: {episode_reward}\")\n",
    "    avg_reward = total_reward / num_test_episodes\n",
    "    print(f\"\\nAverage Reward over {num_test_episodes} Test Episodes: {avg_reward}\")\n",
    "    return avg_reward"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "id": "ef9e3e26",
   "metadata": {
    "scrolled": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Test Episode 1, Reward: 37\n",
      "Test Episode 2, Reward: 37\n",
      "Test Episode 3, Reward: 36\n",
      "Test Episode 4, Reward: 34\n",
      "Test Episode 5, Reward: 37\n",
      "Test Episode 6, Reward: 36\n",
      "Test Episode 7, Reward: 36\n",
      "Test Episode 8, Reward: 37\n",
      "Test Episode 9, Reward: 32\n",
      "Test Episode 10, Reward: 36\n",
      "Test Episode 11, Reward: 37\n",
      "Test Episode 12, Reward: 38\n",
      "Test Episode 13, Reward: 31\n",
      "Test Episode 14, Reward: 33\n",
      "Test Episode 15, Reward: 37\n",
      "Test Episode 16, Reward: 34\n",
      "Test Episode 17, Reward: -99\n",
      "Test Episode 18, Reward: -99\n",
      "Test Episode 19, Reward: 37\n",
      "Test Episode 20, Reward: 31\n",
      "Test Episode 21, Reward: 36\n",
      "Test Episode 22, Reward: 33\n",
      "Test Episode 23, Reward: 37\n",
      "Test Episode 24, Reward: 34\n",
      "Test Episode 25, Reward: 36\n",
      "Test Episode 26, Reward: 30\n",
      "Test Episode 27, Reward: 37\n",
      "Test Episode 28, Reward: 37\n",
      "Test Episode 29, Reward: 34\n",
      "Test Episode 30, Reward: 37\n",
      "Test Episode 31, Reward: 33\n",
      "Test Episode 32, Reward: 36\n",
      "Test Episode 33, Reward: 35\n",
      "Test Episode 34, Reward: 39\n",
      "Test Episode 35, Reward: 35\n",
      "Test Episode 36, Reward: 35\n",
      "Test Episode 37, Reward: 40\n",
      "Test Episode 38, Reward: 34\n",
      "Test Episode 39, Reward: 39\n",
      "Test Episode 40, Reward: 34\n",
      "Test Episode 41, Reward: 37\n",
      "Test Episode 42, Reward: 33\n",
      "Test Episode 43, Reward: 38\n",
      "Test Episode 44, Reward: 33\n",
      "Test Episode 45, Reward: 37\n",
      "Test Episode 46, Reward: 33\n",
      "Test Episode 47, Reward: 36\n",
      "Test Episode 48, Reward: -99\n",
      "Test Episode 49, Reward: -99\n",
      "Test Episode 50, Reward: 35\n",
      "Test Episode 51, Reward: 37\n",
      "Test Episode 52, Reward: -99\n",
      "Test Episode 53, Reward: 37\n",
      "Test Episode 54, Reward: 38\n",
      "Test Episode 55, Reward: 38\n",
      "Test Episode 56, Reward: 40\n",
      "Test Episode 57, Reward: 33\n",
      "Test Episode 58, Reward: 38\n",
      "Test Episode 59, Reward: 38\n",
      "Test Episode 60, Reward: 33\n",
      "Test Episode 61, Reward: 36\n",
      "Test Episode 62, Reward: 34\n",
      "Test Episode 63, Reward: 35\n",
      "Test Episode 64, Reward: 32\n",
      "Test Episode 65, Reward: -99\n",
      "Test Episode 66, Reward: 37\n",
      "Test Episode 67, Reward: 37\n",
      "Test Episode 68, Reward: 34\n",
      "Test Episode 69, Reward: 35\n",
      "Test Episode 70, Reward: 34\n",
      "Test Episode 71, Reward: 37\n",
      "Test Episode 72, Reward: 36\n",
      "Test Episode 73, Reward: 37\n",
      "Test Episode 74, Reward: 34\n",
      "Test Episode 75, Reward: 33\n",
      "Test Episode 76, Reward: 37\n",
      "Test Episode 77, Reward: 37\n",
      "Test Episode 78, Reward: 34\n",
      "Test Episode 79, Reward: 37\n",
      "Test Episode 80, Reward: 37\n",
      "Test Episode 81, Reward: 35\n",
      "Test Episode 82, Reward: 39\n",
      "Test Episode 83, Reward: 37\n",
      "Test Episode 84, Reward: 35\n",
      "Test Episode 85, Reward: 35\n",
      "Test Episode 86, Reward: 37\n",
      "Test Episode 87, Reward: 34\n",
      "Test Episode 88, Reward: -99\n",
      "Test Episode 89, Reward: 37\n",
      "Test Episode 90, Reward: 36\n",
      "Test Episode 91, Reward: 31\n",
      "Test Episode 92, Reward: -99\n",
      "Test Episode 93, Reward: 36\n",
      "Test Episode 94, Reward: 36\n",
      "Test Episode 95, Reward: 36\n",
      "Test Episode 96, Reward: 33\n",
      "Test Episode 97, Reward: 35\n",
      "Test Episode 98, Reward: 34\n",
      "Test Episode 99, Reward: 37\n",
      "Test Episode 100, Reward: 37\n",
      "\n",
      "Average Reward over 100 Test Episodes: 24.82\n"
     ]
    }
   ],
   "source": [
    "avg_test_reward = test(num_test_episodes=100)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "id": "31340922",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<matplotlib.lines.Line2D at 0x7f12d8ba08b0>]"
      ]
     },
     "execution_count": 30,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXkAAAD4CAYAAAAJmJb0AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8qNh9FAAAACXBIWXMAAAsTAAALEwEAmpwYAABiz0lEQVR4nO2dd5hcZdn/P88502d7T7LpJCGVGAIEpPemoNIUFCsvig2xgPiKP8v7+ioWbGABK4qAUlREeg+BBBLSQ3rb3sv0eX5/nDJnZme2ZHezm53nc1177c7MmZ1nzpz5nvt8n/u+HyGlRKFQKBQTE22sB6BQKBSK0UOJvEKhUExglMgrFArFBEaJvEKhUExglMgrFArFBMY11gNwUlFRIWfMmDHWw1AoFIojijVr1jRLKSuzPTauRH7GjBmsXr16rIehUCgURxRCiD25HlN2jUKhUExglMgrFArFBEaJvEKhUExglMgrFArFBEaJvEKhUExgRkzkhRC6EOJNIcQ/zdszhRCrhBDbhRB/FUJ4Ruq1FAqFQjE4RjKS/xyw2XH7/4AfSSmPAtqAj43gaykUCoViEIyIyAshaoGLgN+YtwVwJvCgucnvgUtH4rUmCl3hGI+sPTDWw1AoDivtvVEeXXdwrIcxIvRG4zy4Zj/jvV37SEXyPwa+DCTN2+VAu5Qybt7eD0zJ9kQhxHVCiNVCiNVNTU0jNJzxzyNrD/K5+9bS0Bke66EoFIeNh948wGf/8iZNXZGxHsqw+ff6er74wDq2NnSN9VD6ZdgiL4S4GGiUUq45lOdLKX8lpVwupVxeWZm1KndC0toTBSAcS4zxSMaeSDzBdX9YzX821o/1UHISjiW49p7X2HSwM+1+KSWfv+9NXt7ePEYjO7Jo640B0BGKpt1/sD3EB+9eRYf5eCbhWIIP3r2K1btbR32Mg6WlxzhRHWwPjfFI+mckIvl3Au8WQuwG7sOwae4ASoQQVtuEWkB5Ew7aeo2DPJboe6nX1hPtc994IJmUbGvoYtPBThq7sl+BNHcPPUL79Qs7eWJTAz96ctu4vfTd2dTD89uauHdVevV4OJbk4bUHeWIcn6DGE50hS+TTxXzVrhZefLuZbY3Zo+Ltjd28+HYzX37wLSLx9MCovTdKPJHM+rzRpLXHeA8H2wd/Nd7WEyWZPLzH+LBFXkp5i5SyVko5A7gKeEZKeTXwLHCZudm1wCPDfa2JhBWxxDIOzg0HOlj27SfZnuNgH0vue30f5/7oBS78yYuc/N1n2XCgI+3xV3Y0c9x3nuK1XYOPtva29PLTZ7ZTVehlS30Xa/a0jfSwRwTryuupzQ1pX9KuiPE57m8b39HceCGXyDd0GsFBbzT7la0VLe9s7uGXz++0708kJWfc/hy/enFn1ueNJlYwVt8xOJE/2B5ixf8+zWMb6kZzWH0YzTz5rwBfEEJsx/Do7x7F1xo3bG/s5vltA88tWJF8PCOS39HUjZRwoJ/o4KE39+e8rB1NDrT3omuCO69eRpHfza0PrSfhELzntzYhJfz+ld1pz5NS8pfX9tITiZPJbY9uwKUJ7rtuBYVeF396NWefpX7ZWt/Fi28Pfk6npTvCn1ftHfSVg3Vp3tAZYb3j5NYdNt7TgVG8ZK/vCPPY+sMrDKOFJe6dofRjwRLKULTvMQJQb85dnTirnJ89u509LT0ANHVFaOuN8dyW1Gf/1KYGtjd2j/jYM2k1v8MHOwb32T+5qYFIPMmelt7RHFYfRlTkpZTPSSkvNv/eKaU8Xkp5lJTycinl6M60jJPL/F88u50vP7huwO3azYM9lkyP5K2IsTeLIIJxUN/413X8c/3hz1DoCMUo8bu5YPEkvnbRfNbt7+DPr+21H9+9fQMPeL7B5M330Niaiua31Hdxy9/X87c39qf9v6auCM9ubeK6U2czq7KA9y6bwmPr62k5BMvnZ89u58a/DrzfLW75+3q++tB6dg/yC9fqsNCe
2txg/91livz+ttCoWU1/fX0fn7r3DTrDh//EPtJ05IjkLfuvJ5Irkg/j1gW3X3EM0XiSxzcY9lidKbBr97UTjiXoCsf45L1r+OXzO0brLdi0myJfN0i75slNxnHTepjt2AlR8bruqT/T8v9mcHD/rlF/re//Zwunfu9ZTv3es/zf41v6PF7XEabXcaA+t7WRz9/3Zp/t2i27Jp5d5LtziLw1URuJHX4Psr03RrHfDcAlSydz0uxyvvf4Ftp7o3RH4ixreoTjtG3c6vojwTuXQ4vxRbOitLf2p9s7W+sNS2r5jFIArl4xnWgiyUNvDn36pjMUo7k7MqgrnKc2NfCE+YUb7KRZa08UTcBxM0rtLyukPqfuSLxPdDoQdz2/g68/smHA7XrM6HbvYY4ARwPrRNWZy67JkYhQ1xGiusjHlBI/RT6XbY/VmcdWNJHkzb3tPL+tiVhC0ngYsnes72p9RobcwfYQl9/1Cruae+z7OsMxXt3ZAqRsHikl1/1hNc9uaRzVcU4IkadwMuW007PpqVF/qYfeOICuCQIend+9vLtPdkxDV5iwY2Lo5e3NPLz2IL0Zl6FWFBDPmIRpsSL5HN6ktX2ml3846AjFKA4YIi+E4NaL5tMVNnKF1+xu5SJtJa2TTuP/Vf4ALdZN8vnvAdhpom/tb0/7f1vqjUyVeTWFAMytLqSmyGeL/1DoMsVjR3P2y/R4IsmGAx2s3dfObY9upLLQC6REYiBaeqKUBjyct7CGLfVd7GvtNV839bnuaxu8CCeSkl+9sJM/rNyTdtLIRsg8Fva2HvkinyuSt46RXHZNXUeYycV+AGpLA7Y95jxJr9rVYu/LkUzRjCeSbDzYwfr9HWm2nJUpdLA9/Sru96/s5vXdbdz9Umqe4LmtTcSTEq9Ls63ajlCMJzY18IMnt45qwsGEEPnyOctpkYW4dj83qq/TG41zsCPMe98xhVsunE8oluiTOtfYGSGWkLZXHTYj7uau1CVaMintgzyaIdat3cZ2PTkOdiuLIPPkcDjoCKUieYCFk4tZNq2Ee1ftZe9bz1MrmgkeewXLT7mIP8fPRKx/ANr22JHO9sbuNF9+a30XFQUeKvw6/OkyuOd8vqH9Ck9r3yukgbAi6p1NPVkf/+kz27n4py9x6c9f5kB7iB9dsRSAusFG8t1RyoIezji6CoCXzM+9y2GhDMWXf2NvG609UXxujW88urFPEOAkZAYSh9vLHQ2sqx2nyEspaRxg4rWuI8SkEh8AU0r97DdPqPUdYXxujdOrw5z8+g28e8uXuFR7ifbOkUtcuPulXVz0k5d4189e4ozbn6M7EieZlLT3RinwuojEk/aVeTiW4P7V+wAjILSOyyc3NTAnGOKB4PeZ1P4GAM3md33DgU7WZVzljiQTQuQnlQR5RS6msumVUfXmLQGZVVnAilllFHhdfS7drQ/VivCt386Uw65wHEujMydeU5589oPdSrmMxsfGrilxiDzANSumG5elG/9ODBfeRe9i8ZRifh2/kCQCXvmpfSmelLDRkWe+taHLiOK3/BO2PwnRbk6PPM+N9TdD99AK46wJ0J1NfSP5WCLJvav2smJWGb/50HL+/blTOHlOBeVBD3WDLEZr7TFEvrbUiCateQOnrTaUDJsnNzXg1gV3Xn0sB9pD3PH02zm3tUR+b2v2E9hY8tb+9n4nvPe39fIPs8I1Gk/a78U5v9DWG7ODnWwin0xKGjoi1BQbIl9b6ueAOQdS1xHm/IKd/LznJuaG17NQbufHnl/wxejP05IChsPru1upLfXzydNnE40nOdAWojMcIylh/iTjKtSafP33hjraemPcdM5cymIH6bnrXMIb/81zWxv4YfB3LIms4b86fwKJWFq68aEmHAyGCSHyuibY5F9OQawVGjaO2uvsND222VVBvC6d0+ZV8tTmRjulrqEzjJcoZXTa4m4d1M7LR+tyDeiT32tlceSK5GN2JD9Gdk2GyF+4eBJlfp1z5Ep2lZ4E
vmJqin00inI2V14Ib/6R97/9BZ7xfZnb3XfRtvZRSCZJmDn386qL4NU7oXQGXPc8v5z9cwpkN/ztY5AcfKGYZZvsyCLyT2xsoLk7wn+dOpuzF1Qzf1IRAJNKfIOO5Ft6IpQXePC6dPxu3Y7crJOLz61xYAgi/9SmBlbMKueMo6u4Ynktd7+4K6dNFY6O30j+u//ewpcffCvn4395bS+fve9NIvFEmrA7I3ln1Xe2K5qWnijRRNK2a6aU+OmJJmjvjbG4/kFuD/03+Iq5NPotTk/8nPVTruIS7WXaD2wdibfIW/s7OG5GGWfPN67iDnaE7GBsgXksWZOvf3p1LzPKA9xw2kzuDP6a6rY16A9cwy2JX7K480W2FZ3EdHkA1vyOFjOSP3Z6Kf9Yd9C2cEeaCSHyAHUVJxp/7Hhm1F5jR2M3QsCM8iAA58yvprk7wlrTa27o6OU37tt5yPN1wmakbdk1TY6zdrvjAO9j1wwQyVvinq2IajRJJiWd4RjFgfRmoj63zpfnHKRGtBE7+j0AeFwa1UU+Hi26EgLlFESb6PRP4Tx9Neet+xw88TX2tvYSjiU50bcb9r0KJ1wPmk6iahG3xT4Mu56HP1wCb/wRoqkI9idPv81dGZkTyaSkO5rbrvnTq3uoLfVz6tz0iuqaIj9lLWvgtxdBa/951lYkD1Dsd9si1R2J43VpTCsL2BbCQGxv7GZncw/nLqgG4OYL5lPgc/G1h9dnLZTpHaciL6VkS30XdR3hnBPebb0xpDSCHKewOyep00XeeK9tPVEuv+sVdjf32Bk0qUg+AEiS//oS13f9nG0FxxH9yFPslJM5eU4VzUs/RRwd8cpPhv0e6zvCNHZFWFJbTI15kqnvCNPWG0OQ5J3BgywV2wnvX8fWug7W7Gnj6hOmo636BYvim/hG7ENsZgYf0J+BaSfy+OIfsTKxAPnc/6LtW8lSsZ3/XtrD/MQ2/v3y68MebzYmjMgXV03jbTkVOYoiv7O5hyklfnxuHYAz5lWha8K2bArW/ZZT9A1M1xqJdhoz5lZ1Xu5IPvWlTiSlfQLIHcmPvF0TjiX6TIRl0hWOIyV9InkiXVxe/yPafLXMOfVK++7aUj/resrhC5u4QtzOX+fczldm/Z1HXBfAqz+nffX9gGR53V/AUwhLrwagstDLXxOn03XqbdC+Bx79NDz2Jfv/Pra+rk/OeG8sgZTGyWVPS2/aZfr2xm5W7mzh/cdPQ9dE2vNmFsa5qft22PMS3P8hiGWPxK3PpSxoTNaWBNz259QZjlPoczGlxD9oT946Xs42Rb4s6OGrF8zn9d1tPJiRZgqpq8G6jlDWz11KmbMH0r7W3lGb1GvqjthBSa7+LdZx5RT5sqAnayQf8Oj2JPPWhi5e393Gv9bX2ZPjqYlXP4vFLso3/Y4/JM7h8cU/orS8km9dspDPnz2XoqqpPJg4jZKt98P6B+GP74VX7zqk92glCyypLaaq0IsmjHmctp4ol2ovc+5Ll/Ow9+tc/Mrl1N7zDn7k/gXX7vg8PP1NEnMvpPT0z1D4iX/CaV+B9/2G0gIf345fDaE2Lnj9Izzs/TpL/3MZD3u/zgnNDx3SGAdiwoj8tPIgzycWwZ5Xcn5Zh8uOxm5mVxbYt4sDbo6fUcbzW5ugeTvzN/6QA7IcAGHaRuEsdo0z6nFmybT1Ru0phZzZNabIj5Rds+FAB2fe/hwf/u1r/W7XbvYayfTk+c+t6J37KP3A3Xj8QftuS/RiiSQtPRGqCn0snFrJF7vfT3zSsSx8/as85/0CpTsfhWOvBZ9x2Wtlvew9+mPwubdg8eWw9d9gvt/OUKxP5oQ1+blwchHRRDItov7XW3UIAVcsn9rnPb238edUyxaip3wF6tennUycWJ9LuRnJF2VE8oU+N4sDbXyt9auwceAv6is7mpk/qYhJpmgBXHZsLe+YVsIvnt3eZ3vrGEpKsl4trNrVyon/+7Sd8WPx1KYGTvnes/zzrdEppHLaS1vr
O7Nu0+kQeevvqaX+NOvGmrOZXh6kxzzuLftt1a5W21KzJl5rS/1cqT9LTHj4fuxKqkuM4+6DJ85g0ZRiKgt8/DJxsWH3/e1jsONp2PAgh8L6Ax3ommDBpGLcukZloZeDHWFae6O8S19JvLCWm9xf497JX+VNjuYM9wY8sU5Y+n70S37G586Zy8wpk+CMr0JxLSUBDxvlTPZc+TS/nfF9Pqt9Fa5+EK5+kFnn/NchjXEgJozITy8L8FJyESIRgf0jf9mTTEp2NfcwqzKYdv+SqcVsbzTSBRPCxSeiNwGgNxkiP5AnH3NEnc4iCSsLJZmU/O7lXbZXaZ0UYvHhR2fPbGngsrte4WBHmI0HO/vtqWGJWlokv+cVeOP38M7PwrQVadvXlgao6whT3xFGSqgu8rGktpgYLl5b/iNa9EoaXJPhXXfAWbfZz7NEvqkrAkLAUedAqBXqDd+3MxynuTuSNlbLFz+mtgRI9+XrO0OUBz32/7XZ/E/m1z/KnYl3s2/JZ+HkL8Cbf4TtfdNwrbxmy64p8bvtE3V3OMZJ2kY+9fYnOJG3SLw0sEXQ2BlhWpk/7T5NExw3o4yDHeE+kXcolmBKibH9nixplA2dYZIy3RLsjca57VHjGMysQB4pLJH3ujS25JhPsEW+OxXJTy0L0BWO21dcDZ1hSgNuSvxuO4Wy22wXsWZ3K/vbQnh0jTLTKix2xbhEf4WXPO+ki4Ad4VtUFnrZK6t5dt5/w7t+Akuvgea3DykpY93+DuZUFeD3GFfvk4r91HeE6els4WRtPcn5l7Cn7J38uuN4rum6gftOewauew7e/VMIlvf5f9YxVO+ZzkptGduKToQ55xg/FXOGPL7BMHFEvjzAW8nZxo2Da0f8/9d3hgnFEsxyRPIAR9cUEk0kidZtZId3IZvkDJpkMd5mY/0Uy5N3Fme0OyJ558SrNRHjc2t2JL+prpNv/GMTL5itEmyRH4E8+dv/s40pJX4+d9YcovEkDTmajjnHXBJwiPyWf4HuhdNu7rP9lFI/iaS0C6Cqi7wsnVpCedDD9f+o56LED7h7+u1w7IfBlfL5KwuMaM0+Kc463fi981niiSTdkTixhEy73O8yT4hLp5YYmzp8+ZbulJdu07oTHv4U3eWLuSP+PmPS7PSboXgqPPOdPmJg1S5YkfxUVwddvca+Ku16m2903kbMX8G98bPQ696Ajr6Wi5O2XiPnPpOyoIdYPE6oYQd0pqLvUDTB0WYtQbaCKKswzlmz8ZOnt3OgPcRFiyexek+bXZMwkmyp76KiwMuS2mK25bBrOs0TcFNXxP57alkASF2BNXRGqC7yEfDo9nFvnbh7ogme3tJITbEPzbTbxOZ/UihC/Lr7ZCDl1Vv4PTqFXhcvBs8zrhKrF0C4HXqH1sFSSsn6/e128AAwucTHwY4Q5QeewyMSuBddQk2xz66cPse04HJhfe7tvVGau43J/NFmwoj81LIArRTR5a2GurUj/v+t6HB2RiQ/r7oIkLjadrKLGgIenc3JafjajFzvbHZNe28Ul3nAOsXaiuRrSwN2JG+JaySenh8fG2Z6WEdvjM31nbz7mCkcO92oOO1vYi97JP8y1B4HnkCf7a1UQ6vhWHWRj0Kfm4dveCeTS/y09kRt4XJiRdz2SbGwGqoWwM7n0gqPnCfNbls8/JQG3OxwiLw9Ybr1cbjzZHjia/DXD4EQdFx8NzFcRvqbywunfRkOvgHbHqexK8ylP3+ZPS099udSVuCBg2u5ddvlfCv6XYh086mO2wnpQXZffD+/SVxovOjmf+Tcj1JKQ+QzTzx167ho81fY5P0ogbuOhV+ealtUoViCqWUB/G4962dkzftYYn+gPcRvXtzJ5cfW8u1LF+FxaekpelLC63ennUgOha31XRxdU8i8mkK21Hdl9f6t46bRYddYx4Y1+drQGaa60MsUrdn25Lscqam7mnuYWxCGX50OD34UXvkpja5JrEzMA+gTyYNxHFlXNvfuMPd1
S18rrD/2t4Vo642xuLbYvq+myIjkZzY9QyNliNrjmGxeZc2qDKbZudkoDRrfn9aeGC09USoKvP1uPxJMGJH3uXWqi7zs9swdlUjeig4zP8TZVUEma+24Er1sidUwrSzAZjmNYMfbkIiniqEcFkN7KGZ/uM4smVYzfXJaWcCeeLW+JNZ2KbtmeJH867tbkRJOmFXG9HJDpPsrm7cmGq2KV8IdULcOpp+UdXvLXnhjb0rkwTgZ/+2TJ/Gl8+Zx9YrpfZ5nRWFpvvusM2DPSjq7UtGo83FL/Au8bmZXFqTZNa09UcqDXlh9t/Elf/VOaFgP7/01FVOPAhxdBI95P5TOhGe+w6s7mlm7r52nNzfakXxZwA1PfI245uEssQb50+UcldjJA5O/RPXkWnbJSbQVHAWbHk17T50tdfR0GlGkdSViWQ8kE/CPz8MvT2VSy0ruT5xGy9yroKcRmqyrwQQBj8708kDWXPlIPD2S39PcQzwpee+yWkqDHi5eMomH3jjAyh0tvL67lbfWr4V/fYHkq3dm++gGhZ0CW1PIvJoiusLxPtXDUsq0idfOUAyfW6PSPPbtZmUdbdzU8T98c+dVHB9+ETA+U7cumFVhBFUfiP/dON52PgcN61lXeQkSjYBHp8jvIpOKQi9NnRHiiSS/32o+3pK7FiEb1lVoZiQvoz3M7XyVVz0ngqYxybySGCiKh1Qk39YbpbkrYhybo8yEEXmA6WVBNsiZ0LrDEKERZGdTN0GPTlWGt+t16ZxUYgjZ+lAF08sDbElOQ09GoWU74VgCty6IOzJn2npjdsSaHsmnIh0rhdKaoErZNCMz8bpqVwsel8bSqSVMLvGja4I9/RTbdGZG8ntXgUzCjHdm3d6KbjYeNCauyh2Ra9Dr4oYzjrKFPxNnFAYYlk0iQmLPq/ZdTd0pQbH82wKfi5kVQXY7eoa09ESp8cVh5/Ow/CPwpe3wqVdh7rl4XToVBV47RQ/dDaffAg3rmf3SF/ESZf2BDrsKuWz/07D7Rd6cdyM3xz4O3fU8wmnsrTidygIvXpfG+qLTYO9K6Dayq556aw/dPzmZHb/5CJBheyXi8ND1sOa3sOIGNl3xMrfFP8LWuZ8wxrPnFWKJJLGExO/WmVYWyBHJmyIfT6/NCJg+8odOnEFPNMH7f/0ql9+1kjvvMyaHmze/mHX/D4Y9LT1E4knm1RTaV2SZef690YTtu1vZNUU+t30MdYZjxDvquSv6VRZ1vkCnu4Ib4/dApIvucJwCr4sTZpVRRRuntD0CS66Em7bBdc+ze66xP2uKfRirjaZjHUNvN3azI1ZOHNeQI/kNBztw68JuuwGGJ3+O9gZeIqwtPBXAtnAvWDRpwP/pc+sEPDoH20P0RBPKrhkq08oDrAxNM27U5S7QOBR2NPUwu6og6wG1vMBoPLQtXsP08iCbpRmhNmwg7Jg0s6LPjl7DQtA1kZZC2doTocjnotjvpicaT4uE7CIo83c0S578w28eSGuK1B+rdrWydGoJPreOW9eYUuLv165p7zVK8L0uQzjY8xJobqg9Puv2PrdOZaGXWEIaqWda3/2Wi4pCr72v/rOxng3uhaC58ex62t4meyTvYlKJn6ZuI4KLJZJ0hGIsjb0BiQjMuxD8pVA1337upGJf+qIPS66AM25lYfO/+avnm+zYt5/WngjlPoHr6dugfA6Nc6/ivsSZ7P7AC3wp+gkKfW6EEEwtC/CstgKQsOkR7n5pFy/99XYmi2aO6loFiVjK+gl6DOto/f1w5n/D+f9DSZlRbHNAVkHhZNi70hZsvx3J9/aZII/Y1dXptRlWqu/SqSX849Mn86ePncCfPnYCtyw19l1Zx0aIG+N5cM3+rNXCubAEfRlbWPLWd/iG63cEVv0YGlMtKaxjVwjLkzeK6YpMke8IxYg+9W1miwM8e+zPeGTu/1Ep2+DZ/6U7EqfA5+KEmeV8yvUIOnHDTtNdMHkpk8sNCyWbVQNQWWAcQ+v3d5BAp16f
ZEy+DoHtjd3MKA/icaVkclKBxuddD/J2cgoNpcsAOHVOBU/fdJo9JzQQpQEPb5utkCuVXTM0ppcFeKmn1rgxwr58Q2c45wF1tLuBXumlnlKmlQXYISeTFC6S9RuIJ6U90WS1NmjrjVEScOPSRFok39ITpbzAS8DjIimNCM3ucWNGa5YXn82u+dKD6/jjyoHLo7vCMTYc6GDFzDL7PktAcmG0GXZEHbtfhinLsvrxFpb3WpUjYs9FpSny8USSL/x1LT9/uR7mXcCULb/jUu0lILfIVxd5kdLoC2JlMS3ofAl8JTDtxD6vNanYl77ogxBw2pf5qucrLBG7OLf9fva09nKZ91UjEjz7GxQHjfe8j0lEkxoFPsMOmF4WYGVXNUx+B/Lpb/LMU//i895/0KsFCcgQHHjD7kFe7o4YmUnHfABO/SJgev5Aa2/MyFbas5Kw6U37PTpzqwuJxJNszphEzbRr7BODKfIAi2uLOXlOBSfPqWBa1IhoXckI1K9HSslX/vYWP3hy26A/oy31XZSLTmY/9XG8b93Le1yvcNyuX8AvTjCK2JKpCtfaUj9NXRHae2MU+VORfLxlJ/4Nf+G+xJkkZ59NR/kx/DlxJnLVXVS3v0Gh180ZpU1c7XqGznlXQNks+/WnmMfWpOLsx1ZVkZfuSJxXdxkB2F5tit0VdbDsbOruk003e89fmaXV8534BygJGmMQQgzoxTspDbrtfvcqkh8i08qNyddYweQR9+Uj8SRed/bdNSV5kN2yBonGjPIgMVy0BWaQrDfayFoibwlTu5ld4da1DE/eiPCDXuPL2ROJ2zaJNeEaz9HWwLqst9oi9MfqPW0kJZwwK5XilcsKsHC2GSbSDQffhOnZrRoL6wqmOjN9cQCqTJHfVNdJTzRh9Ph4z100lC3nh+47ucz9SvrEayRO0KOja4KjYm/zHu1FGjrDtPZE0UkwtfkFmHueEQVmMLnE32fRh+5InD93HsNrvpP4kP4kG3fu5Zr436FqIRx9kb0frF41BV7j/04rD7C3LYS84o8k3QF+J79OSbKNf8y6jaQUyJ3P2qXrtQceh1gvHPcx+3WDHh2PSzOi/eknQddBoq3GSdvv1jl9XhVC0KdrZSSjutoSe1+O45W6t3iFY4y/960iFDNslee3NvUptrrp/nXc8ve30jJ3usIxnt3ayLeD9yOiPfBfz/P56Q/x/oLfGkU/O5+DtffS0RtjrtjHR30vEE0k2dfWywx3G+Vr7mAyzczbcidJofHz+CVUFxnBzffiV5EsmcEN9V/nBLGB4r9/AHdhJSUX3pY2rtoBRN6KkJ/bamSl7WWSkVU1yFYZsUSSva296dl0oTaKXvshLyUX8VxyadYMqcFQGvDYV3Rq4nWIWMUlHSULBx3JH2zPXkWYSTSexKNn310lvXvYKWsAQywBGgJz0Hc+w2rv9Xx6z+cIELaj085wnGK/2/Tq07NryoIeAh5DNHqjqUpUK3KP5bBrrC/hYBYkWLWzFbcuWDat1L5venmARKiDzoa9WZ/jbDPMvlUgEzn9eAuj/LxvittAVBYaUZj1BW3pjoInyD8W/oi1cjY3u/5MS2fqhNQdjtvR9JK13+D77l/S2rCX1u4oy8U2PNEOw6rJQk2xj65wPK3RmJUO2HXcZykSvdzBD5ia2Acn3whC2GmkVmFSoSOS740maNIr2XT63YTx0DLpNNqmns16OZPk9mfteZeSrX+FyqNhyrH26wphzF209ETtugNtnzEP4Tftr2XTStMWLYFUdk1mUzyfR6cPXfXQ08gq13Ja3TWw79W0nvhWz3OATQc7+dsb+/nLa/u4/K6VvPh2E89ubeQ9v3iFYN2rXBB/Bk76DFTO47S5laxq9rBhzqcMC++Zb5Os38CfPd/hI60/4lixlf1tIa7p+DXeF/+X57w3Mqf+X7w16TIaRRmzKgsIeHQ6CdJ86Z+Jo3Nb680Q7jSKhYrS/e6KAi/fvnQRVxzXt8gNUlla1vdh
p5xkWHYd+/ps2x2J91moZl9rL7GETI/Qn7wNEWrnl96PAKJvhtQgcab0qkh+iFSYO6yx4Gjj0jrcf25wOJbg7B8+z32vZxc2J9FEMs2bs4lHcXXuZb82BYDqYi8el8bKqvfTveiDPJVYxqT2N/i69y9pucKlATcuXetr1wQ9BM0vZ080bm/fZ+I1I0/eukS3cu374409bSyaUmwXeAAsFHt43Hszwd+caFR/ZpDWnGzjQ+AOwNQVfbZzYl1S55pgzYUVhf3zLaN7oTUJ2xpz8evEu6mQrUxvW2lv3xWJUehzw4E1+JvX4xJJirc+SEtPlPfqL5LUvXDUWVlfa7p5Ul65IyVult989LJTeU07hpP0TbR4JsNCozdPZiRvi7zZ02hvSy8bktM4I/JDQpfeQ1Whl5eTi9AOrqa7s4152gFcB1fDO64x7CEHZUEzyqtaAN5iPAcMkbcE++z51Ww40JnWR93Ok88Qe6ddY1NnrJ61z3sU270LYd9r9DpSU51XCX9atQevS+MHlx/D1c13EPjjBaz8w9e5vvOn3Ov9PyiZDqcaVcLvPbYWv1vnT6v2wnnfge4Gjn/qfegkibiL+ZTrUaZTxzFdz8OyD/F37Vzq/EfxB/09zK4soMDrso/HLn8tX/Hcyj7vHLjyj1CzKOtnd82K6XYgkYmz+K2iwMv2hBGEZZt8/Z/HNvPh36YXUKY6zpp2zbYnDHvtpM/QU2rM6ZQFM6q/B4nzCkBF8kOk3Nxhe31G/iz7VvW7fUcoRm80we7mgRs/RePJ1KSjk/Y9CJkgXDST0oAbr0vH59LY65lNwynf5ub4dew86sNcJZ6kvP5F2ycu80pmigZbtKWUtFmRvHn53xNJOPrOW+KefdEQ64s+mEh+e1N3eo761sc58fn3o5Ekqgfh3sv7FPRYS/8Rajf6gSy+DLz9+5C2Jz9Eu8b6gm5rMBrCdYXjdn+dN7zH0+0q5YzQE/b2XWYmBq/fg3QHWZ+cyYx9DxFrfJv36S8QXvIh8PbNyQc4a341R1UV8M1/bkz1TanvIujRmVLi5+VJHwZgde2HbLvHmGhN9Y8v8Bpf9mlmKuqell52NnXT5SplcmU5lYVeXkwuRiTjVDW8yGe9/wDNBUuu6jOeMiuS13SYejzFux7jMc8tLH/ycmjbbafpOaN5y66xjoFQLIGuCdzZrjzNhIQ63xw2u+dDVx2RFsMSCnh0ntrcgJSSrnCMh988wMVLJvO+xWVc6XqOY3yNfNX9F96nP4+27Br4yL/tOZkin5tLlk7mkbUH6ax8Byy6DIng49GbaF70Uc7S3+S77t+QFC4442vcFfgvvjvtV7xcp7FkSrH5+sb+DUUTrI7P5Jfzfwuzz8j6uQ1EVWEqsDhhZhlb48akNs19Rb6hI9wnYWGnufjM7IoCo4jq0c9A5Xw441bbMRiOXQOGzefLdiIeYSaUyBf5XHh0jbfcS8BfBm/+qd/tLQEdjI8djeeI5M0Z+9nzl3LhYuOS0ufWCceStke6+5gvsE+fxgcPfJOCZ27lev1Rznv6PP4c/TTFIeMqojMUJ56Uhifv6evJZ7YYzuxCGXLYNf01pGrvjdLaE2VWhSnQ4U545AZk+RzeHfkODy+8w+j6+Jtz4Mmv29kStie/7j6Ih2D5x3K+hsUxtSUcU1vM8hllA27rxBmFHW8+t7UnSmcoRiDgZ1v1RZwmVxPpMNb57I7EqfaEYMPfEEsu52H3RZSF93LKmzcRw4Xn9JtyvpbHpfGtSxaxrzXEz82+MVvqO5lbU4imCfxzT+OMyA/YPzPVfE3XBIVel23XWJ58bakfIYzWAzuaephZEUTTBJWFXt5IziGheblyz21cJF+AYz8CBZV9xlMe9Nj1EhxzFTFPCQ2yBH/nLvjtRRylNzCrIpgWcWfaNaFoMnsUD1C/DspmofkLWS+MYMi7y2jlcN7CGurMFhcPv3mA3miCa1ZMg72vIBJRXFf8Fj6/AXHjRrj4R1A8Je1f
X7NiOqFYgr+v2Q+X3sk9yx5mjZxH4ORP0S19rNA2s23ypVBYTbHfzdsNXXaHR8A+7nujcTOF8tAiZTBOlpowrphnVxVwIFaI9BZljeR7owm6I/G0Nsc7GnuoKPAYFuXqu6G7Ad5zF7h99jzAoYq8dQVQcRisGphgIi+EoLzAQ2MvsPQDxmIU3bnXT7QEtHmAhaOllLntGvOgedcZp/Cd9ywGTJGPJ2zh9fj83D3lm6zTF1Kx9c/c7L6PWNE0XCRZ2Pmy8W/ML3Z5gdOT7yvy0RxtDawveNQs/c+FVQ06u8q8DH3ph9DbjP7un0BBFW9GJsM1f4Oqo0m+8nMid55KuHkPoViCEr8LVt9j+MiTl/a7z8D4oj3y6ZOZWREccFsnzijsoiXGibPZ7H1S5HdTP+sy3CJBeM1fAMOTPzvylH3yWV96JiHhp7L3be4X5+Eq7j9/+cTZ5bx32RR++cIOntrUYFdygtF9cJecREXG1UhJwGNP/lp2jdelM7nYz96WHnY2pZrZVRZ4ieBhc+3lrPMu57ay78NFt+fYZ147L5/Fl/HMuY/zkdhXOHDJA8b7+91FvOcojVd3ttiilJldE44n0iddQ21w1ynwry/CgTegZgkBj4tNialQtYAZq77Ot113c+mCQjQBl9+1km/+cxMLJxcZaYE7ngXdY2QnlUyFgqqsY180pZhjppZw3+v7wOXhYLKEQp+LkrJK7k2eR0S62DXvo4DR5M3qd7PYLDay7BprERFrvx4KuiaoKPCyuLbEPOEJZOXRsOsFoz7BgbWurHP1tp3N3alAqGEjlEyzj/lJZkJBn3YZg6TEPDmUHwarBiaYyIPhcTV3R4yeKMk4rP1zzm3tSH4AH9sSVm8ukQ9UGPnXJj63RjiWcGQ56MjyOVwfu4k7lj3OGZEf0HLFo+zQZrKo20gJbLX7o3jtyLDbYdfEBrBrQo6ulf1ZNlY16KyKAmjfCyt/YRSZTFnGjHIzw2bq8fDBh/j+UX+CZJK2f3wNgKN7V0Pz1kFF8cPBisKmlvlZZF7Kt3RH7Qlr7+QFrE7OJbD6F9DdhC/UwEWtf4QZp8CkJZQUFfO0+3RCWpCHg5cP6jW/dtECjq4p4uN/WE1bb4x51YbInzCznK9dNJ+z5qdXMxb73XaLG6cYTSsLsL2pm31tIdvPLQ14cGmCxyZ/hlv8X6euZFnOcZQXeOiJJhxRufFbm7QYPvQohDu4au83SCbi9nEbyciPD0cT6TbAgTVGg7fXfw2dB2DSEoIene4Y8PGn2XHUh3m//gwrnrmSn5xbxJXHTeXqE6bz7UsXGXUhO583JoL7SZe1OG1OBdsauojGk3SGjeInIQT3Bq7hrOgP0MtmAti58kaHR6MDqRXcNJmpxsMReYBvXbqIL5471z7h9S77L+P4XZt+hW81RXMW2O1scjQjbNpmTJKbvOcdU/h/715o25FDxTo5lB/iSWKoTDiRLy/wGAd/xRyYfrIxWZKjOtTK4x0okrcipT7ZNVIanRhrFqfdnWnX+N260XkvEucnL9VzQJtCRYGX17wrOCq8EXpa7EWBSwMeAmYKZUt3pM/C3fFEdrsm7MgQaulH5Hc29eDWhXGAPvd/xsTfWV8HMBe+SE3obY1VcHfiAibteZSr9ac49a2vGBHNovf2u7+Gi64JppcHOW1upT0J29RtlMUX+VxUFnr579hH0CId8LeP8pXoz3ARNzpaYkz0fit2NTdW/ApXYV9LJBtlQQ8PXH8ilyydDMA7zMwjXRN8/JRZ9onXwtnDJ+h4bHp5gI0HO0kkU5kZmhlVNnVF0hYfyTUOSJ2ow45iKGoWwbvuoLJ1DV9y/dV+rDq8g397bsYdMSaPjUjeIfKNRnsErnve6Pi57FoCXpdxJeAJsHreTVwT+yquUAsXr7qabyyo4xvvXmjsg+5Gow2E1ShuAKaVB0lKY76i0zFZX1YUZL+stG9bv+dWF9oRvFWha7UeztznQ+W8hTUssSN56Jp1
oZEs8Mx3IJKqzrWuuK11Ztt7o7T0RI3PLxE3ArnKufb2ZUEP1540I2th5GCwbJ7Mq8PRYsKJvB3JgxHNt+7MuVqU1S62tSfa73qQVoplH7umaYvRD2P+xWl3+1x6RiSvce1JM/jbJ0/igetP5D83nkrQ62KNbwUaSdj2uOPLrBE0IxpnLxA7uyY5iEi+nyuTnU1GFZ8rETayZJZcAcVGAVlNsc9oW+soRf9F/N20yCK+476HhKcYPvwvcB9aBDMUHrj+RG69cIGdYtbSHbVFo6rQx2Y5ndcWfA12vcDJYh0vzvgslBtdSKuLvDSENDZ1B4d0Se1z6/z4yqWsvOVMjhmgetFKJ/WbFcMW08uDdoTvLKSpLPTS2BXJ3pzMQabI9ylsWnIF+2ddxfWufxJv3Q3ACaEXma/tZWrvJuM50US6J9+4BYJVht1wyhcgWEGB10WP2TqjO5JgZXIhPdc+ZXTivPdyePknRhCz6wXzzZze7/5IvX9r8rnHtNdc9vsH7NtFPmP/WZOukLJrrKLB4Yq8hXXCC8WSRuZPTyN7/vFd+3Hru2Nlce1wZta07zFSLyvmjchYINWkrOJIieSFEFOFEM8KITYJITYKIT5n3l8mhHhSCPG2+bt0oP81EliRvJQSFrwbimrhhe9l7SXdYXbBS8r0Hu+ZWCLfx67Z9Cgg4Oh3pd3tdWuEHYsWe12GEBw7vZTjZpTZHvVe71yatQrY+ljqNXQNX+smhJBpaXKZjclyefIwsF0zqzIIbz8BsR5YdJn9WHWRj3hS2lWZTV0RInqQ/459mJWJBex61wNGJH8YqCjw4vfoBDwuAh49zZO3hH9V8flETvw8D8RPZdeMVKaKlbK5t7XXXs1psAgh0hbzyIUViRZkWAqWyAFpcxGVhV52t/QQS0hKA7knFK1LeOtqLBRNb1EA0LjgWgC8ew2rb37M6BtfGTEm8cOxZLon37gprZUDmKswmUVQveYcTqBqJnzsCZj/Lnjyv+HXZ8LKnxnVwpOW9rM3HO/fTEnd29pLZyhu7ydL5DMj+SVTUyJvBTdWJF/oO/SJVyfWvgvHklC7nLWeZWmdQq32xlaxotXeYVZlATSZ68Q67JrhUlng5bS5lZx0VMWI/c/+GIlIPg7cJKVcAKwAbhBCLABuBp6WUs4BnjZvjzqVBV6iZsERLq8RuexblTWad65O058vnzOS3/yo4VUWpvu1PrdOJJawe4rkSpPyuHRe966AHc8Qj5iFNbseQ9x1Mld6VlLvWNItGrcak6V78xZOkbcE4oY/v5G2HmpaFd+GvxnR3YyT7ceri4wvohXNN3dHOHdhDY8lV/D+2NcIVBwegc+kvMDD3tZe4klpFpFplAU9NHVFaDnhZr4Uv54ChyA48/JHy/e0VsgqzIg2rWK4qkJvmkhVFnjtthH9ZWWkInlDcEKxBB6Xlr50YeXRNMkiAnUrIRFjQdJoR1AT22c/xz7mkknjijND5C1BDcUSdEeNdWpdugaeIFz+e7jwdmNO6+CbxoIW2uBS/SoLvXZLZKshmbU/ICXuVkHZkikl9nN9bg0hUssBDteTd/5f670CbNdmMClxEJIJpJR97JodpqU5tdRv7DtIs2uGi0vX+P1Hj2eFo+J8NBm2yEsp66SUb5h/dwGbgSnAJcDvzc1+D1w63NcaDKnLe9Oyecc1RjT/3Hf7RPPOhSf68+Wtidc0kW/ZAQ0bjKgnA8OTT6Q8+WyVh4BLF7zgORlivUzd9wgABevuAeBG8Rda2oxOmrqjx00qlVKmNaoKpUXyEWKJJP/ZUM+dz+2wTwBWFd+8UmFE8gsvTfvyWj1mGjsNWyGelBw3vZQ5VYa33Gd918NERYHXjq4s0bAaUFmZRM6I2inyh5oBMRDWvsgUIiuSz+xlUlnotQ+//sZktZ61go5QNN4nHdLvcfFqcgEl9Suhbh1+IiSkYErcqG0IO0W+Y6/RPiEzkjfnfXojcXoi8bR5BYSA4z8B178IN26E
i3/c365IQwhht8iwGpIBXHXcNG6//Bj7xHfBohq+dekiFk0pSnuu363bEfVI2TXW/rOCrp3JSXiIQftewrGk/blYds3Opm6mlweNk17zNiicBL7irP/7SGBEPXkhxAzgHcAqoFpKaa1KUA9kbbYshLhOCLFaCLG6qalp2GOwKsiarcjc5YVTb4L9rxktYB10hmK2cPcr8tkmXjebPcOzibxLMydeE/btbLh1jbViIUxexsJdv2Oe2Itr3ysw7yKqaeHS8MOAIQpWfrwzgo85JpStE4pVFm9Fvh2hGP9YZ1SOdr/xIJ/SH+a4xgcgHoZF70sbT40pjvWdYfuAryz0cfGSyRT5XHZGxOGmPJiKgi3RqCn2sbe1115dqDAtkk9ZNKNVNm5Fopl2TaHPzbSygJ37bVHlGFNJP5F8kd+FSxNpnnwgI0jwu3VeSS7EF240liwEnksuZWoyJfL2icGadK1akPY/rEi+J5qgN5Kw+yX1obh2wKK3TKaWBdjZ1E1vNGEfMzXFPi47ttbepiTg4YMrpveZvAx4dPtKNHPfHiopT94sdksYk+u0bE/Ljbftmuae1OJATVuhYuSi+LFgxEReCFEA/A34vJQyrZ+ANKpzss5sSil/JaVcLqVcXlk5uEyI/khFQg7Rnn2m8bt1Z9q2HaEYM8zIqz+7JpLNrtnxDNQsyepRO/PkXZowIoIsWH3mOeULFIf38wv3HUjdA+/+Ca+4V/BJ16NU0kZFgdde0zURj/Fp/SEm0ZIm+NYBPKnER2tP1C7LDnjMUvNkkjmrb+PL7vuZsub7UDSlT5tgyzdt6AzbB3xVkZcbzpjNUzedlm4ZHEYqCz12NpEl8u+YVsLWhi4OtPedpCv2u+35k9GO5LNFm4/c8E5uPCddGJwtZfsbkxBGT5SUyPctbPJ7dFYmTdF+8172yGpeTc6nlE4ItZl2jXnMNW4yB5DuKQccBXdGg7eREVQwrmZ2mhWkQ736CzjGMVJ2jXUlbX1HNses6tdtth+va8LuLbWnpcewNKU0IvnKkZt0HQtGROSFEG4Mgb9XSvl38+4GIcQk8/FJQO6qpBGkotD4AqVF5l7zkjCS3i+7MxxnamkAlyb6jeStisI0kW/d1ecS2CKVJ5/st2zZpZm9a+ZdRLN/BrO1OsSCSyBYwX0ln8BNgv9x30N5wG1bRkt6XuSL7ge4WF+ZNvkaiSXwujTKg15ae6J2Pvz1p81m3b52tq9fiT/Wzh3aB+GiHxjVe1r6x+/WNSoKPDR0RmyRryzw4tK1tAKlw41z9RwrO+OEmeVICc9tMQ4rpyAIIWzLZvRE3mO+bl8RKw16+nzuziresgEqJe0mZRiZH5n/y+fW2S1r6PZWQzLGa4l5RgMugObthJ0nhsbNhl3pK0r7H0G7dUacnmiGXTNMnJPPQxd5Y9weXcveRuQQ8DsmXpNJycFokDZZQKJpm321PaXET3N3hD2mpTmrImjUFES7lcgL43rrbmCzlPKHjoceBa41/74WeGS4rzUYygIehHDYNQAe83LTkRsLhl1THHCncutz0Ce7Jh41DoDSGVm3t/Lk0ybAsmC3GtY0Xqr5sHHn8dcB0BWYxvfiV3COvoYzI0/Zgn5up3EOrRFttvCDEaX4PbohEN1RdjZ1U1Hg5dqTZuB36zz4gFEAsqn8fDju4zDz1Kxjqir0pUXylYcpl7c/nOXfzkjeo2s8u9UQ+cyI2rJsRmt5tf4i+WxY+1ETA0eoZY5IPmx+rk6sCs79xcsBeF3OY58wWgzI5m3GcWc9p7HvpCukxLQ3mqAn0tcSGg7W5DOQdWm+/rDe60hZNYDdIjwUS9jVrTvkZJJNqUh+enmAeFLaaxLPripITbqOYPrkWDASkfw7gQ8CZwoh1po/FwLfBc4RQrwNnG3eHnVcukZpwJMembs8oHshkt6V0sq7Lg96B+XJ25FFxz5j6buSvmuUQsoD7AzHcvf0xrBrLPF+o+Qczhd3GtWmQMDr4p7E
BbwpFvD+1l9QE90D+9cwL2pcfleL1jS7JhxL4HPptkBYFXvFfjc/unIpV5Ztp8k/k09clH1NVovqIi8NnWEauyIEPPqIRniHirP825p49bl1jplabBeRZQqnNYlceoidAgfC8uQHaylYIl8a8Ay4SlZZml2T6GPXeFwaLk2wrfgkpOZiZXIBHb4pRKVOomkb0XgSn0s3Cnmat2YVeevk1BM1Jl5HapITUt044dAj+ZGyaiB94rXHnKjfmZyE1rI9TeQBu9Xy7IoCaMhudR1pjER2zUtSSiGlXCKlXGr+PCalbJFSniWlnCOlPFtK2ToSAx4MVjSbhrfQuPQySSQlXZE4RT43FYVemvvJLe+TXdNurr6UI5K3Iv6O3tiAkbyVEhmJJWl3p+amgx4dicYdhV8gJjzc0f0l+PeX6BEB1iZnMUm0ptk1oVgSv0enrMBDKJZgc12nneFx/rwSZva+ReWS8wdsFmYURBl2zVC7R44Wznaszi//CTNTKWiZnvLcqkKmlPhH7JI/k7Kgh0Kvi6k5Wt1mEvC4KPC6BtWD3FnQ15vFrgFDuNYWnkHTx95gn6ymIOBjr6wm3mikU/o9upFskIhmj+RNUe+NJOiNJkb0ZD6lxI91HisaYq67322MYyRPOvbEq9mIDIz+8npvI9EeI3KfXmacmFbtbKU86KG462144fvGvFvw8OSzjxYTruIVMqpeLbyFaXaNc2HqiqCH5q4hZNe07TZ+l/YfybeHov1G8i5HJB+JJ9JWnrLbrgZr+fGsX3JA1MCBNTzpPYcdcgo1ojWttUHY9uQNEemJJlIZAvtWGdk0g6harCr00dIToa4jNC6sGkjZNQVeV9ok9gmzyuz7M6PjT54+m8c+e8qojcnn1nnhy2fwPkfGyEBUFnr7LYSyqC4yFjLpicSz2jVg9JcPxROEfIYAFfvd7JSTEGbDvCLZBX//L8OPn3dBn+c71yywVtYaKTwuzV7IfaiRvJXlM5Ii79aNK59w3MgkAsOuAdBbjf1ltYk+0B5ieVkY7r3MqBm46s99ev4faUxIkS8v8PTt3+ItSBf5sEPkC7209ERytujtUwzVtsfoyleYvbuhLfK9sdwtXzFOGs7uks4UTetgL/a76fVN4hOub8OFt/NHz1XUy1KqaCcWS+X5W2LgrPC0y+p3Pmv0Lx9gJScwBEZK2FLXNY5EPr2QxuLY6aW4NJH10t7j0lIrWY0SpeZi7IPl0qVTuGBR/x0xASaXGFZTXUeIUDRBIEckH4om7MyvYr+bHXIy7o5dFNHN6Ru/Bl11cMUf0prnWVhBRE+2PPkRwLI/hpp2m7JrRvaz87l1QtFkWiQP4G43igWdk8UfTdxv9JD/wP1G180jnAkp8hUF3r6RubcoLbvGKoQq8rspD3oIx5L0OPq/OOlj17TtNnp85KgCtKL39gHsGpcubF89EktmjeSLzArP7qQHjv8E7TJAs1aBWySQPamEpVA05clb2AU5u16AKctzLpzhxJqw7IrED8tK8oOh2O82erhniHnA42JxbfGQLYGx4nNnz+GjJ88ccDurXqGuI2xPqGfidxttCazsECuS15Ix1ng/yeSmF+H8/4XaY/s8F4xj2a0L2ntjxJNyFEQ+iM+tDXlRDMuuGUlPHlJpzVZe/B5ZTVK48HcaadUVBV77BDO/9w0j7XrSkhEdw1gx9rNqo0BFgYcu81LXPsi8hdB50N6m0+xbU+x325FiS3ck62Wi1co1zZPPYdWA0aAMjMUs+vOEXZrhyUspjYXCHdtal89WS1urZ008KWlzVUISRFc9YMz8h+MJ+4QFxlVCbWnAWLi4YeOg2wM7q0XHSySvacbap9ku/b91yaJ+++cfiVhWR117OGeGls+jE4ol7Ui+JODhicQimqqW8mjTJBaeey0rju9r0zgJeFx2T/yRtGsArj91NmfMy953vv8xjbxdA2Zas8OTj+OiJ1DL9Lr/8LjnP5Q+PJ/Kwk8Rb9lDUXg/zPzM
iL7+WDJhI3nIaLnrSbdrUpG8y66KzJVh06effNvunJOukN6rpj9P3jppxBKSSDyRYdcYB7m14HfU0aCs02UUjWldqZOWkU+tUWa+l+nlAcNKaN9j+PFVg8sQcIr8WObGZ3JUVQEzHFkbFoumFB+2HiCHC+sz2G8uMp/N8gu4dcLRhB2AFPndHKSCvy29h2/FP0ikZvmArxP06HbHx5GO5KeVB+ylCoeC1W5hJFMoIXXlY3XeBGgqWkBRaD9+Iujbn+AdvnpO1M2MmpmjN59zuJmQkbyVcnfL39dTWeDl5guOpjJz4tXhyVuWiTO3/r7X9jK3ppBl00rT+8mHO4yVdnKkT0K6sPdfDGX4ufFkkmg8STCY+jisL12Rz0U0nkxrNdzlrYQo6N0pkbcKrwq9Lty6SPnxjVaDpeyFW5mUmz5zIinHTSQP8Jtrl6Md4RNgg8Xj0qgo8Nrrjvo9fQMFv8fo8WIV6llXOVY31f7mgiwCXkckPw5SZQF7/mGk7Rq/x+gn5Wxj8ORRt9Jd81keWr2Hl8SnOD/5AiF9HzJQgRjk9+VIYHx8siPMktpiFk8pZn9bLy++3UR1kZcvZ6RQ2pG8z43AEA9nJP/dx7dw7oJqlk0rNdZ31TWjz0Zb/+mTkC7s/X3ZrD7ksbhl1zg9edOuCbjpCMVJSiPtM55IEvWWEe3Scfek1vm0+pUIIbjquGmcNNuMbofYRU/TBFWFXuo6wuNK5AMjWHZ/JDC5xGc3Zct2DFmRqXPiFVJrJPR3BWkR9LrY2dht/z0esD7nzO6ew8XnMvaXZddoAjrjLtqTBYQ85TDzDE498CwxbwIx85Q+1eBHMhPnnTioLvLxj8+czDM3nc5ZR1dz/+p9xN2Fhm0RNyKdjlAMlyYIeFKTlVZuvZSS7nDcLpRIW8R7gPRJyIzk+y+GAqPRWCSexOPw5K3sghK/B7fL3C6RJJ6Q+DxuGinF3VNnb++cf/jWpYu4wFxUnKYtRp+aIXTRswqJxpPI5xs1RT67/1BWT97Orjn0SD7o0ekyRW+kPflDZTQqXsGYwwjHkvSaC6oEzUVTQlFzYnvJVQRCdRTHGo1lJCcQE1LknVyzYhrN3VE2t5qFQ2Y032kuQCGEwOPSCHh0O3c+Ek8ST0rH4tiJQRdCAWkTqAMVQ4Eh3tGMSP4dU0v43mVLOHlOhe3VxxJJookkAY9OnSzDEzIieasndtYvduPmIffeqC70IsThW4NS0ZfJJX67oVa2qxi/RzMi+Vh6JN9uR/KDsGs8fe3BscZOofSOcAqly+gn1W2mixorY8Vt0efoi1LtT2aeNqKvPdZMeJE/dU4lU8v8vLTXtGJMX77Dsf4kGLP5PaZfZ5U+p0XyzkIob3HW3GOL9InX/lIojf8ZNydenSKvaYIrlk/FrWuOk4EknpQEPC4aZBm+3nr7/qR0XDXccwG89GMjs6Z526D9eIujawqZVRHM2T1TMfpMKk5Nemf15LPkycPQRN7ZXniks1kOldrSgLmI++AqiQeL5ckbNQE6AY9ObzSRauXsCcDiy6H8KHsZyYnC+PhkRxFNE3zg+Omse+J58GCLfGc4nlaoUeB10RW2RN4Qd0vkI3FHDntb/+mTMPiJV8uuiSaSRGLJvitPmbis7eJJEkmJ34zkfeF14FjZxufWjUnhva8Yiw8ffdGQMmssPnPWHK4/fWId6EcaNQ6Rz9XWIDNPHhx2zSDsF2ckP5INyobDvJpC1t527ojXPliefE8kQdBjJCd0R+Ipuwbggu8Z67lOsAn+vAjVzjy6ih7ML40jki9y+H4FPpc9KdMVifEh/T8c1bsWcETyUkLd2pwthi0Gm0LpdkbyiWTOnHprOyszwO/WqZdluBIhCLenLzNoZdP0NMIrPzH+HmKDJbeu5d1E53jDypWHHBOv5ufjzBIDaDctx1wL1Thx+vDjxa6Bofe7GQx+05NPRfKmXROLp451l2dQBYNHGnkh8h6XRrc0vzSmJ9+Vza6J
pCL5L7oe4KrQfcZTrInXpi3Q0zTgxIxbT63J6eu3GCo1oZrpyaeN3xZ506P1GiIPQOdBO5L3u/XUIhGeAnjTaC98pPfDzkdqipx2TbZIPlVVrWsCn1tDE8ax6tZzL1TjxGpSpmsi57E3UfC6jTmMXrN3ftDrMlbFimavKJ5ITOxP1kQXgi5MkTfbDXeYE68WQaddE4pQJHpZnNwMsZDRV8alGe0BIGcvdidWJNWvXWNuY11BeHNE/VYkb0/EuV3U2SJfl27XNG0BTyEs/4jRDrlw8hG9PmW+UlPss12D7JF8qj+S12Wk91rHWn+BhRMrkg969D7L8E00/G6daDxJV9hYBavAq9Nj2jXZegNNJPJD5HVBjxXJR7qQUqYtMgxGXq4lthGz/aiXGOxdaaQ36qbIl0wf0JOHlLhnmzSzcJu5uNYVhCdH9GV591Yk7/dojkh+v2PBcM3IpqmaD+/4kPH4EP14xfjArWt276BsIu/sdOrNCCh8g4xMLYtmPFk1o4W1b5q7I4Zd43XRGzWya8bLfMRokR8iLwTddiTfTSiWIJaQad5fgS9l18S72+z75Y5nDStFl7D7pUGXOw8mqrLEOxXJ5/DkzS9xyPLkPS4aKCXkKoZdLxAyxd+na0afmqr5RvHTihtg6dWDGq9i/GFl2ORqUAZWJG8da5bYD+5rbWXX5IPIW/urM5xKoeyOxNNX0Zqg5IfIayJt4tUSxUDGxFN3JI6Uknivsb5JTOrIHc8RiSc5Krkbwu2DzqG1rJdcwg2pFEormyeXL5qK+E0xd2kkhc7WinNgy7+IhdoBKEi2Qag1NTF8/v/A4ssGNV7F+GNSsRGYZM2ucdo17vRIfjCFUJDKrsknkQdjgZmgx0U4ZsyFBdwT+/3njcgn0YjpAYh0kTBXY3L2Ai/wusxGYUlkbzsALycXoTW8hT/ayqLoW8aGg6yGsyL4wVS8WlcQOUXe3M7y3q3c+bfKzod4mJJdjwNQ1Gn0xh4o+0dxZDCl1I/PnaqTcBKwRT5l11gBxWDb+1qraY2XatfRxDnfZUy8pt6zsmsmAJaYR/UARLvsJfdcDpG3GiL1ROLIkGHX/Ct5AgDvizzECV1PQPkcKBp40QdIiftgetd0DyTytl1jiLxLF7g1wR7/AiibRc0eY430wk5j6TeqFgxqjIrxzXWnzuLXH8reTdIS8p5oImXXZET0AxHIQ7sGDJvK+Z5Vds0EwBLzqKsgZyRvRTXdkTgi0gHAS4nFJDzFXB1/iIrYQXjn5wb9mr5BRFV9I/ns22amULo0DbfLXB92yZVUNr9GDS3427aBvwyClYMep2L8Ul3k45Q52T9Lp2jZ4u5SkXwufBl2jTN6V5H8BCAVyQdz2zVmJN8VjuMyRb6VQnad/Ws+L77Mdxf9C5Z9cNCvOTiRN712c0I1V8VrZjGUxyVw6xrRhITFlyOQ3Om5A+/+l40ofoKnwynSo8/MSN4/yIlXS9zyIpLPmH9ztnFQIj8BsEVeC0Ck27ZrnCJvtTbticRxRTuISDcRPDSVL+fJxLFoHn/ff9wPqUvn/hbytuya/ideXRkplC5Nw60J4okklM/m6Xm3USNa0dt3QbWyavIBZyTfJ4VysJG8ecyPl741o4kzyy3TrhnqEoVHGhP/08VIoQSI6EGINJGUliefElUrku+OxPHEOunAWHQjFIuniqGGgH3pPJgUSrM0fdB2jS5wu1KLgK8rv4hPRWex5WqJmLZiSONUHJk4helQs2uCXh1dE0NebPtIxFmvEvS67Iw1mPhrFUzsd2eiaQIhIGJm11grQTmTFqwze3ckTkWikx7NaDvaEzFy6oda9u1163hcGpqW2zrJTI0cyK4JxeL2bZcmiJnvIxRLoLl8iEXnD2mMiiMXo8rVaKd0qBOvXpfO7z5yHIsmT/yK6PT1k112gAUT367JC5EHI5qPaEZ2TcqTT4lqoUPkpya6CbuKgNQKUkON5GeUB5hR3n+7VFdmMdQAKZRW
JG+lUFqRvLH0X144bwoTIQQBt25m15gplEOceAVyTuxONNI9eT2tulxl1wwTIcT5QoitQojtQoibR/v1cqFrgrBmTbwa4ujKMvHaHY4TTHQRdWeI/BB7q1936iz+/bn+e9xkTrzm7F3jysyuMRY6sUQ+54IhigmNJU6Znrw6FvqSWQwVUBOvI4MQQgd+DlwALADeL4QYk5lBQ+QDkIyTjIUA0qwUv1tHE0ZUXSC7SXiNS9h2sz/3UO0aIUTaxG42bJEfoHeNdX/IEcln2jUTffJI0RfrM08VQQ2trUE+kZZC6XWlNSVTFa/D43hgu5Ryp5QyCtwHXDLKr5kVXROENMM+kWGjp7wzkhdCEPS66AzFKKQbfCVAaqWdodo1gx2TdWKB3C0QrHFaKZQuXaTZNREl8nmJFZ32ieQneGR6KOiawKNrxo85V2ZF8BN9f422yE8B9jlu7zfvsxFCXCeEWC2EWN3U1DRqA7EjeUBEu+z7nBR6XTR29FIkQuArwefW7EUYRkPkwUijtLpI5rpa0M2JY8uusQ5Up12jorf8o49dY/+e2KJ1qHjdml3lC0ZEr2sibRJ2IjLmyiCl/JWUcrmUcnll5ehNArk0Qa8wJ0JziHzQ66Kns8UYl6+EgMflsGtG54tjWTFCpF9ZOBHCiNyt3jUuXeDShJ3vH44lJ3w0ouiLbddkTLhO9K6Kh4rfrdtVvmDUBwTcE7+X/miL/AFgquN2rXnfYUfXBCFhRfLd9n1OCnwuQqbIi0AJfreesmtGaVFrK8PGWvghFx5dSy+G0jWi5iLOoWhCRW95iGU3ZObJD2bpv3zE59b7NCbLh+BotI+G14E5QoiZQggPcBXw6Ci/ZlZ0IegVRtWqFjFEPjNyLvC6iJsLhuiBUgIeffTtGi09/S0Xbl3You7O8OTD8YnfE1vRl76evNnWQB0LWfG70ytdg17XhM+sgVHOk5dSxoUQnwb+A+jAPVLKjaP5mrnQdUEIK5LvBIrQRF+RR5ongGAZAY/OnpZeYPRE3mNG8gP9f2e7WSNP3mHXRFUKZT7iz7BrrEVwRmMh7IlAkd9FoWPflAbcREwLdCIz6rlDUsrHgMdG+3UGQheCZr0CXD4KW9YDtbZVYlHgdeHCEHlPQRk+t9HSAEZ34hUGTtF0irydXRO3InlVDJWP+DImXlfMKufua5ezpHbiV7AeCv/znsVpC5x/9cL5dtLDRGZiJ4g60DVBGC/MOoPq/U8D5xt2zdbHjQWvK+dR4NXxih4AfIXlBDzN9vNHy5N3Ozz5wWwHRjsEl9WFEsOTV5F8/mFH8uYJXtMEZ82vHsshjWvmVBem3Z5eHhyjkRxe8krkE0kJCy4gsO3fzBd78TWthweutLc5Y/pneBVT5IvKCXja7cdGK1J264P15M0vsjC+zB5dEE8mkVIanrwS+bzDb0+0qs9ekZu8ucbXNXORjXkXIBGco62h7I2fgbcYPvwYVC/i6NZnKBY9hKWbgmBB2gSWRx+dL5Il3oP15K3fLtOu6YrEkTK1spUif/BnZNcoFNnIm6ND1zBaDBdU0VKyhCtdz+Lf8Rgc/3GY8U5YcAlVXRuZJeroIIjPraXNvI+eJz9Iu8aVLvJuXSOWlDR3RQCoKPCOyvgU45fMiVeFIht5JPKanY2yr+oMpogW0L1wwieNDeacC8Bp2jq6RAFCiPRIfpRE3mo3nKulgf365snAOil4dEEskaS52yjWUiKff2RWvCoU2cibo0MXkDRFfm/l6QCEF18NBWaV7aRjiPiq8IgEPcLoJe9sXDRqIu+yRLv//2/l09u/dQ0pobErDEB5gWdUxqcYvxxVVUBJwE1VoW+sh6IYx+SNyLs0jbjZYrgtMINrorcQPu1rqQ2EoKP2dAB6daPNsHM1mVGreLUj+cHZNVZEb9k29R2GyFeqSD7vOG5GGWu/fi7FAZUXr8hN3oi8poGp8cSTkpeSi9F86SlV4ZlnAxDSjfv9Zp8LIRi1JkbuQebJ
p+way5M3bteZIl8aVJG8QqHoS96IvDOSt1aG6tMQbNbpRKSbXncZgN1z2qP331dmOAw+T96yafpG8qUBd1qxlEKhUFjkjTLomsCsHSIhpX2fk2BhCe+L3sazFVcBqQZQo+XHw9Dz5K2JWut2XUeIcmXVKBSKHOSXyFuRfCK7yBf4XGyQs5CBCuDwZC8MOoXSEnlXepZNfUeYCjXpqlAocpBnIm/8baVS6hkWjNdlLPBbYHaqC5ie/GhNukIqMh+4GMoUd2t7c0wNXREVySsUipzkTZmkLlKRfFJKuz1AJjeeM5fjZxqevFVsMqp2jWuIkXyGJ59ISpVZo1AocpI/Iu9ozRtPypyLbH/y9Nn23/7D4MkPvp98Zp58avzlKrNGoVDkIH/sGiHsYqhEPyLvxF55ZxTLxq0TyIB2jRnxp/LlU9tXFKpIXqFQZCdvRN65JmoiKe2IuD8OR3aNlcY5cJ68lV2TPvEKKpJXKBS5yRuR17T0SH4QgXzKrhnNiVcrhXKgitccefKgInmFQpGbvBF5ZyQfTybTVojJhUfX0DUxynnyVu+a/i0hV5+KV4fIB5XIKxSK7OSNyGuaMFoNA4lk3xz5bAghCLj10bVrBt3WIN2Ld7ZZqChUdo1CochO3oh8uief7JMjnwufZ3RFfsh2jZZu1/jdup3Pr1AoFJnkjchrQtg9a/pLocxk2bQSFk4uGrVxpeyawXry6XaNiuIVCkV/5E0I6NJSIp9MyrTslP745QeXj+awHJH8QHnyIuvvcuXHKxSKfsibSF7XMyL5UeoqOVQGnUKZZfk/UCtCKRSK/skfkXfYNYMthjocFPvdab9zkVnpav1WzckUCkV/DEvkhRDfF0JsEUK8JYR4SAhR4njsFiHEdiHEViHEecMe6TBxacJuMTyeRP6s+dU8+ul3MrnE3+92tk2T0aBMRfIKhaI/hhvJPwksklIuAbYBtwAIIRYAVwELgfOBXwghxnRJeU0TSGn48eNJ5HVNsKS2ZMDtrHYGVgQf9Lo4uqaQZdMHfq5CochfhjXxKqV8wnHzVeAy8+9LgPuklBFglxBiO3A8sHI4rzccLO87ISXxpOy7KtQ4x6P39eQf//ypYzkkhUJxBDCSnvxHgX+bf08B9jke22/e1wchxHVCiNVCiNVNTU0jOJx0rLbCiaQkKcdPJD9YMlsNKxQKxWAYMJIXQjwF1GR56FYp5SPmNrcCceDeoQ5ASvkr4FcAy5cvl0N9/mCxIvd4UhJPHIkin75oiEKhUAyGAUVeSnl2f48LIT4MXAycJaW0RPoAMNWxWa1535ihiVQkP548+cGiInmFQnEoDDe75nzgy8C7pZS9joceBa4SQniFEDOBOcBrw3mt4eJy2DUJObhWw+OJzPx4hUKhGAzDrXj9GeAFnhRGpPyqlPJ6KeVGIcT9wCYMG+cGKWVimK81LHSHyMeTMuvSf+MZd0YXSoVCoRgMw82uOaqfx74DfGc4/38k0bXUmqiJZPKIy66ZUR7kc2fN4Yx5lWM9FIVCcQSRV71rwEihHGyr4fGEpgluPGfuWA9DoVAcYeTNtb+dQpmQQ2o1rFAoFEcyeSPymcVQuspSUSgUeUDeiHyqGCpptBo+wuwahUKhOBTyRuRTKZTjq9WwQqFQjCZ5I/JWMVQ8mTwii6EUCoXiUMgbkbci+WTSSKMc7MpQCoVCcSSTNyKva+mRvKbsGoVCkQfkncgnj9BWwwqFQnEo5J3IxxOSZFLaFbAKhUIxkckbpcvsXaNawCgUinwgb6ROT2troCJ5hUKRH+SN0umORUOMVsPKk1coFBOfvBF5V1rvmiOv1bBCoVAcCnkj8lbKZCyRBFCRvEKhyAvyRuSt4qeoKfKq4lWhUOQDeSPyVq+aSEyJvEKhyB/yR+RNUY8ou0ahUOQReSfy0bgh8qqtgUKhyAfyVuRVgzKFQpEP5K3IK09eoVDkA/kn8omEcVvZNQqFIg/IH5EXKpJXKBT5R96IvMvs
VaM8eYVCkU+MiMgLIW4SQkghRIV5WwghfiKE2C6EeEsIsWwkXmc46KaoR1R2jUKhyCOGLfJCiKnAucBex90XAHPMn+uAO4f7OsMl065xqS6UCoUiDxgJpfsR8GVAOu67BPiDNHgVKBFCTBqB1zpkMouhlCevUCjygWGJvBDiEuCAlHJdxkNTgH2O2/vN+7L9j+uEEKuFEKubmpqGM5x+sUVetTVQKBR5hGugDYQQTwE1WR66FfgqhlVzyEgpfwX8CmD58uVygM0PGUvTo6qtgUKhyCMGFHkp5dnZ7hdCLAZmAuuE4XfXAm8IIY4HDgBTHZvXmveNGUIIdE0QjZt58krkFQpFHnDIdo2Ucr2UskpKOUNKOQPDklkmpawHHgU+ZGbZrAA6pJR1IzPkQ8cQeWXXKBSK/GHASP4QeQy4ENgO9AIfGaXXGRK6EKqfvEKhyCtGTOTNaN76WwI3jNT/HilcjkheefIKhSIfyKtkcU0TqWIoJfIKhSIPyCuRV5G8QqHIN/JK5DU18apQKPKMvBJ5lxJ5hUKRZ+SVyOsOT17ZNQqFIh/IO5FPpVDm1VtXKBR5Sl4pndOiUStDKRSKfCC/RN4h7LpaNEShUOQB+SXyjkheefIKhSIfyFuRVytDKRSKfCCvRN6lInmFQpFn5JXIO1sZKE9eoVDkA3kl8i6VXaNQKPKMvBJ5pw+vKl4VCkU+kFci79KVJ69QKPKLvBJ5FckrFIp8I69E3oreNWGs+apQKBQTnbwSeatfjUv1rVEoFHlCXqmdbr5bpfEKhSJfyCu5c6lIXqFQ5Bl5pXZWMZSadFUoFPlCXom8S4m8QqHIM/JK5K0USiXyCoUiX8grkbcieVUIpVAo8oVhi7wQ4jNCiC1CiI1CiO857r9FCLFdCLFVCHHecF9nJNDsPHkl8gqFIj9wDefJQogzgEuAY6SUESFElXn/AuAqYCEwGXhKCDFXSpkY7oCHgx3Jqw6UCoUiTxhuJP9J4LtSygiAlLLRvP8S4D4pZURKuQvYDhw/zNcaNrqaeFUoFHnGcEV+LnCKEGKVEOJ5IcRx5v1TgH2O7fab9/VBCHGdEGK1EGJ1U1PTMIfTP7bIK7tGoVDkCQPaNUKIp4CaLA/daj6/DFgBHAfcL4SYNZQBSCl/BfwKYPny5XIozx0qKoVSoVDkGwOKvJTy7FyPCSE+CfxdSimB14QQSaACOABMdWxaa943pmjKk1coFHnGcO2ah4EzAIQQcwEP0Aw8ClwlhPAKIWYCc4DXhvlaw8al7BqFQpFnDCu7BrgHuEcIsQGIAteaUf1GIcT9wCYgDtww1pk1oIqhFApF/jEskZdSRoFrcjz2HeA7w/n/I02qGCqvasAUCkUek1dqZxdD5dW7VigU+UxeyZ2K5BUKRb6RV2qniqEUCkW+oUReoVAoJjBK5BUKhWICk5cir1oNKxSKfCG/RF5Y2TVK5BUKRX6QXyKvInmFQpFn5JXIWz1rlCevUCjyhbwSebutgepdo1Ao8oS8EnmrCEp1oVQoFPlCXom8rlm/lcgrFIr8IM9E3ni7yq5RKBT5Qp6JvPU7r962QqHIY/JK7exIPq/etUKhyGfySu50e9GQvHrbCoUij8krtVPFUAqFIt/IS5FXbQ0UCkW+kJciryJ5hUKRL+SVyLtUq2GFQpFn5JXIq37yCoUi38hLkVd2jUKhyBfyUuRVJK9QKPIFJfIKhUIxgRmWyAshlgohXhVCrBVCrBZCHG/eL4QQPxFCbBdCvCWEWDYywx0eqWIoJfIKhSI/GG4k/z3g/0kplwJfN28DXADMMX+uA+4c5uuMCMqTVygU+cZwRV4CRebfxcBB8+9LgD9Ig1eBEiHEpGG+1rCZUuLnM2cexRnzqsZ6KAqFQnFYcA3z+Z8H/iOEuB3jhHGSef8UYJ9ju/3mfXXDfL1hoWmCm86dN5ZDUCgUisPKgCIvhHgKqMny0K3AWcCNUsq/CSGuAO4Gzh7KAIQQ12FYOkyb
Nm0oT1UoFArFAAgp5aE/WYgOoERKKYUQAuiQUhYJIX4JPCel/Iu53VbgdCllv5H88uXL5erVqw95PAqFQpGPCCHWSCmXZ3tsuJ78QeA08+8zgbfNvx8FPmRm2azAEP8xtWoUCoUiHxmuJ/8J4A4hhAsIY9ouwGPAhcB2oBf4yDBfR6FQKBSHwLBEXkr5EnBslvslcMNw/rdCoVAohk9eVbwqFApFvqFEXqFQKCYwSuQVCoViAjOsFMqRRgjRBOw5xKdXAM0jOJzRQI1xZFBjHBnUGIfPeBnfdCllZbYHxpXIDwchxOpceaLjBTXGkUGNcWRQYxw+4318oOwahUKhmNAokVcoFIoJzEQS+V+N9QAGgRrjyKDGODKoMQ6f8T6+iePJKxQKhaIvEymSVygUCkUGSuQVCoViAjMhRF4Icb4QYqu5puzNYz0eACHEVCHEs0KITUKIjUKIz5n3lwkhnhRCvG3+Lh3jcepCiDeFEP80b88UQqwy9+VfhRCeMR5fiRDiQSHEFiHEZiHEieNwH95ofsYbhBB/EUL4xno/CiHuEUI0CiE2OO7Lut/Gak3mHGP8vvlZvyWEeEgIUeJ47BZzjFuFEOeN1Rgdj90khJBCiArz9rhc2/qIF3khhA78HGNd2QXA+4UQC8Z2VADEgZuklAuAFcAN5rhuBp6WUs4BnjZvjyWfAzY7bv8f8CMp5VFAG/CxMRlVijuAx6WURwPHYIx13OxDIcQU4LPAcinlIkAHrmLs9+PvgPMz7su138ZqTeZsY3wSWCSlXAJsA24BML87VwELzef8wvzuj8UYEUJMBc4F9jruHpdrWyOlPKJ/gBOB/zhu3wLcMtbjyjLOR4BzgK3AJPO+ScDWMRxTLcaX/Uzgn4DAqN5zZdu3YzC+YmAXZoKA4/7xtA+tpS7LMLq6/hM4bzzsR2AGsGGg/Qb8Enh/tu0O9xgzHnsPcK/5d9r3GvgPcOJYjRF4ECPo2A1UjPV+7O/niI/kyb2e7LhBCDEDeAewCqiWqQVU6oHqsRoX8GPgy0DSvF0OtEsp4+btsd6XM4Em4LempfQbIUSQcbQPpZQHgNsxIro6oANYw/jajxa59tt4/Q59FPi3+fe4GaMQ4hLggJRyXcZD42aMTiaCyI9rhBAFwN+Az0spO52PSeN0PyY5rEKIi4FGKeWasXj9QeIClgF3SinfAfSQYc2M5T4EMH3tSzBOSJOBIFku78cbY73fBkIIcSuG5XnvWI/FiRAiAHwV+PpYj2WwTASRPwBMddyuNe8bc4QQbgyBv1dK+Xfz7gYhxCTz8UlA4xgN753Au4UQu4H7MCybO4ASc6UvGPt9uR/YL6VcZd5+EEP0x8s+BGPh+l1SyiYpZQz4O8a+HU/70SLXfhtX3yEhxIeBi4GrzZMRjJ8xzsY4oa8zvzu1wBtCiBrGzxjTmAgi/zowx8xm8GBMzjw6xmNCCCGAu4HNUsofOh56FLjW/PtaDK/+sCOlvEVKWSulnIGxz56RUl4NPAtcNtbjA5BS1gP7hBDzzLvOAjYxTvahyV5ghRAiYH7m1hjHzX50kGu/jZs1mYUQ52NYiO+WUvY6HnoUuEoI4RVCzMSY3HztcI9PSrleSlklpZxhfnf2A8vMY3Xc7Mc0xnpSYIQmRi7EmInfAdw61uMxx3QyxuXwW8Ba8+dCDN/7aYxFz58CysbBWE8H/mn+PQvjy7MdeADwjvHYlgKrzf34MFA63vYh8P+ALcAG4I+Ad6z3I/AXjDmCGIYQfSzXfsOYcP+5+f1Zj5EpNFZj3I7ha1vfmbsc299qjnErcMFYjTHj8d2kJl7HZD8O9KPaGigUCsUEZiLYNQqFQqHIgRJ5hUKhmMAokVcoFIoJjBJ5hUKhmMAokVcoFIoJjBJ5hUKhmMAokVcoFIoJzP8H2X/6G7gybRkAAAAASUVORK5CYII=\n",
      "text/plain": [
       "<Figure size 432x288 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "# Trailing moving average of `rewards`: each point averages the most recent\n",
    "# `avg_window` entries (fewer at the start, where less history exists).\n",
    "avg_window = 5\n",
    "average_reward = []\n",
    "for idx in range(len(rewards)):\n",
    "    # Clamp the window start at 0 so early points average the history available so far.\n",
    "    avg_list = rewards[max(0, idx - avg_window + 1):idx + 1]\n",
    "    average_reward.append(np.average(avg_list))\n",
    "# Raw series first, then the smoothed series drawn on the same axes.\n",
    "plt.plot(rewards)\n",
    "plt.plot(average_reward)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9f18bae5",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "44b0354e",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "58e2db1b",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8385f8b3",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c1d27da3",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "fb4df6e4",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
