{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "67576132",
   "metadata": {},
   "outputs": [],
   "source": [
    "from math import inf\n",
    "import numpy as np\n",
    "import scipy\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "import torch.optim as optim\n",
    "import gymnasium as gym\n",
    "import pandas as pd\n",
    "from datetime import datetime\n",
    "from sklearn.base import BaseEstimator\n",
    "from realkd.boosting import WeightUpdateMethod\n",
    "from pandas import qcut\n",
    "from realkd.rules import SquaredLoss, AdditiveRuleEnsemble, Rule\n",
    "from realkd.search import Context\n",
    "from typing import Optional\n",
    "import warnings\n",
    "import random"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "8b8f01e2",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Global configuration shared by the cells below.\n",
    "statespace_size_g = 4  # passed as `size` when the GridWorld environment is created\n",
    "np.random.seed(2443249)  # seed NumPy's global random number generator\n",
    "torch.manual_seed(13451035)  # seed PyTorch's random number generator\n",
    "number_rules=16  # default `num_rules` of ActorRule\n",
    "regular = 50.0  # default regularisation strength `reg` of the boosting classes\n",
    "# presumably labels for the five entries of the observation built by GridWorldEnv._get_obs -- TODO confirm\n",
    "column_names=['x1','x2','x3-x1','x4-x2', 'c']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "24f75485",
   "metadata": {},
   "outputs": [],
   "source": [
    "def same_location(location1, location2):\n",
    "    \"\"\"Tell whether two locations agree in their first two coordinates.\n",
    "\n",
    "    :param location1: indexable location, or None\n",
    "    :param location2: indexable location, or None\n",
    "    :return: False when either argument is None, otherwise the result of comparing entries 0 and 1\n",
    "    \"\"\"\n",
    "    both_given = location1 is not None and location2 is not None\n",
    "    if not both_given:\n",
    "        return False\n",
    "\n",
    "    first_matches = location1[0] == location2[0]\n",
    "    return first_matches and location1[1] == location2[1]\n",
    "\n",
    "class GridWorldEnv(gym.Env):\n",
    "    \"\"\"Grid world in which the agent has to reach an item and then the target cell while carrying it.\"\"\"\n",
    "    def __init__(self, size):\n",
    "        \"\"\"\n",
    "        :param size: Side length of the square grid; coordinates range over 0 .. size - 1.\n",
    "        :functionality: Initializes the state attributes and the action space, calls reset() to\n",
    "                        place the target, agent and item, and then defines the observation space.\n",
    "        \"\"\"\n",
    "        self.item_location = None\n",
    "        self.agent_location = None\n",
    "        self.size = size\n",
    "        self.target_location = None\n",
    "        self.num_steps=0  # not updated anywhere in this class\n",
    "        self.carry_item=0\n",
    "        # We have 4 actions, corresponding to \"right\", \"up\", \"left\", \"down\"\n",
    "        self.action_space = gym.spaces.Discrete(4)\n",
    "        # Dictionary maps the abstract actions to the directions on the grid\n",
    "        # NOTE(review): step() never reads this dictionary; it hard-codes its own mapping\n",
    "        # (actions 0/1 change coordinate 0, actions 2/3 change coordinate 1), which differs from this one.\n",
    "        self._action_to_direction = {\n",
    "            3: np.array([1, 0]),  # right\n",
    "            0: np.array([0, 1]),  # up\n",
    "            2: np.array([-1, 0]),  # left\n",
    "            1: np.array([0, -1]),  # down\n",
    "        }\n",
    "        self.reset()\n",
    "#         self.observation_space = gym.spaces.Dict(\n",
    "#             {\n",
    "#                 \"agent\": gym.spaces.Box(0, size - 1, shape=(2,), dtype=int),\n",
    "#                 \"item\": gym.spaces.Box(0, size - 1, shape=(2,), dtype=int),\n",
    "#                 \"target\": gym.spaces.Box(0, size - 1, shape=(2,), dtype=int),\n",
    "#             }\n",
    "#         )\n",
    "        # One component per entry of the array returned by _get_obs().\n",
    "        # NOTE(review): entries 2 and 3 of that array are item-minus-agent offsets and can be\n",
    "        # negative -- confirm that Discrete(self.size) is the intended space for them.\n",
    "        self.observation_space = gym.spaces.Tuple(\n",
    "            [gym.spaces.Discrete(self.size),\n",
    "            gym.spaces.Discrete(self.size),\n",
    "            gym.spaces.Discrete(self.size),\n",
    "            gym.spaces.Discrete(self.size),\n",
    "            gym.spaces.Discrete(2),]\n",
    "        )\n",
    "    def _get_obs(self):\n",
    "        \"\"\"\n",
    "        :return: Array [agent[0], agent[1], item[0] - agent[0], item[1] - agent[1], carry_item].\n",
    "                 The target location is not part of the observation.\n",
    "        \"\"\"\n",
    "#         return {\"agent\": np.array(self.agent_location), \n",
    "#                 \"item\": np.array(self.item_location), \n",
    "#                 \"target\": np.array(self.target_location)}\n",
    "        return np.array([self.agent_location[0], self.agent_location[1],\n",
    "                        self.item_location[0]-self.agent_location[0], \n",
    "                         self.item_location[1]-self.agent_location[1],\n",
    "                        self.carry_item])\n",
    "    \n",
    "    def _get_info(self):\n",
    "        \"\"\"\n",
    "        :return: Dictionary with the single key 'distance'. While the item is not carried it is the\n",
    "                 L1 distance agent -> item plus the L1 distance item -> target; while the item is\n",
    "                 carried it is the L1 distance agent -> target.\n",
    "        \"\"\"\n",
    "        return {\n",
    "            \"distance\": np.linalg.norm(\n",
    "                np.array(self.agent_location) - np.array(self.item_location), ord=1\n",
    "            ) + np.linalg.norm(\n",
    "                np.array(self.target_location) - np.array(self.item_location), ord=1\n",
    "            )\n",
    "        } if not self.carry_item else {\n",
    "            \"distance\": np.linalg.norm(\n",
    "                np.array(self.agent_location) - np.array(self.target_location), ord=1\n",
    "            )\n",
    "        }\n",
    "    \n",
    "    def reset(self, seed: Optional[int] = None, options: Optional[dict] = None):\n",
    "        \"\"\"\n",
    "        :param seed: Optional seed; when given it seeds both `random` and NumPy's global generator.\n",
    "        :param options: Not used.\n",
    "        :return: Tuple (observation, info) built by _get_obs() and _get_info().\n",
    "        :functionality: Clears the carry flag, puts the target into the cell [size - 1, size - 1]\n",
    "                        and draws random locations for the agent and the item,\n",
    "                        ensuring no overlaps between them.\n",
    "        \"\"\"\n",
    "        if seed is not None:\n",
    "            random.seed(seed)\n",
    "            np.random.seed(seed)\n",
    "        self.carry_item=0\n",
    "        self.set_target_location([self.size-1, self.size-1])\n",
    "        self.set_agent_location(self.generate_random_location([self.target_location]))\n",
    "        self.set_item_location(self.generate_random_location([self.target_location, self.agent_location]))\n",
    "        return self._get_obs(), self._get_info()\n",
    "    \n",
    "    def set_target_location(self, new_location):\n",
    "        \"\"\"\n",
    "        :param new_location: The new location for the target.\n",
    "        :return: None\n",
    "        :functionality: Updates the target's location to the new location.\n",
    "        \"\"\"\n",
    "        self.target_location = new_location\n",
    "\n",
    "    def set_agent_location(self, new_location):\n",
    "        \"\"\"\n",
    "        :param new_location: The new location for the agent.\n",
    "        :return: None\n",
    "        :functionality: Updates the agent's location to the new location.\n",
    "        \"\"\"\n",
    "        self.agent_location = new_location\n",
    "\n",
    "    def set_item_location(self, new_location):\n",
    "        \"\"\"\n",
    "        :param new_location: The new location for the item.\n",
    "        :return: None\n",
    "        :functionality: Updates the item's location to the new location.\n",
    "        \"\"\"\n",
    "        self.item_location = new_location\n",
    "\n",
    "    def generate_random_location(self, exclude=()):\n",
    "        \"\"\"\n",
    "        :param exclude: A list of locations to be excluded when generating a new random location.\n",
    "        :return: A new random location as a list [x, y] that is not in the exclude list.\n",
    "        :functionality: Generates a random location within the bounds of the environment\n",
    "                        grid, ensuring that it does not match any of the locations in the exclude list.\n",
    "                        Locations are redrawn until a free one is found, so the loop does not end\n",
    "                        if every cell of the grid is excluded.\n",
    "        \"\"\"\n",
    "        \n",
    "        # Helper function to check if a location already exists in the exclude list\n",
    "        def location_exist(new_location):\n",
    "            for loc in exclude:\n",
    "                if same_location(loc, new_location):\n",
    "                    return True\n",
    "            return False\n",
    "        \n",
    "        # Generate an initial random location\n",
    "        location = [np.random.randint(0, self.size), np.random.randint(0, self.size)]\n",
    "        \n",
    "        # If the generated location exists in the exclude list, keep generating new ones until it doesn't\n",
    "        while location_exist(location):  \n",
    "            location = [np.random.randint(0, self.size), np.random.randint(0, self.size)]\n",
    "        \n",
    "        return location\n",
    "    def step(self, action): \n",
    "        \"\"\"\n",
    "        Update the agent's location based on the action taken and evaluate the reward.\n",
    "\n",
    "        :param action: Action taken by the agent: 0 / 1 decrease / increase coordinate 0 and\n",
    "                       2 / 3 decrease / increase coordinate 1. A move that would leave the grid\n",
    "                       (or any other action value) leaves the agent where it is.\n",
    "        :return: Tuple (observation, reward, terminated, False, info).\n",
    "        \"\"\"\n",
    "        # Movement logic for each action\n",
    "        if action == 0 and self.agent_location[0] > 0:\n",
    "            self.agent_location[0] -= 1\n",
    "        elif action == 1 and self.agent_location[0] < self.size - 1:\n",
    "            self.agent_location[0] += 1\n",
    "        elif action == 2 and self.agent_location[1] > 0:\n",
    "            self.agent_location[1] -= 1\n",
    "        elif action == 3 and self.agent_location[1] < self.size - 1:\n",
    "            self.agent_location[1] += 1\n",
    "        reward, terminated=self.get_reward()\n",
    "        info = self._get_info()\n",
    "        return self._get_obs(), reward, terminated, False, info\n",
    "        \n",
    "    def get_reward(self):\n",
    "        \"\"\"\n",
    "        :return: Tuple (reward, done).\n",
    "        :functionality: Evaluates the agent's current location to assign a reward:\n",
    "                        20 (and the carry flag is set) when the agent stands on the item without carrying it;\n",
    "                        20 (carry flag cleared, done=True) when it stands on the target while carrying the item;\n",
    "                        -1 in every other case.\n",
    "        \"\"\"\n",
    "        # If the agent is at the item location and not carrying the item, reward it and update its state\n",
    "        done=False\n",
    "        if same_location(self.agent_location, self.item_location) and not self.carry_item:\n",
    "            reward = 20\n",
    "            self.carry_item = 1                                                                                            \n",
    "        # If the agent is at the target location and carrying the item, reward it\n",
    "        elif same_location(self.agent_location, self.target_location) and self.carry_item:\n",
    "            reward = 20\n",
    "            self.carry_item=0\n",
    "            done=True\n",
    "        # Otherwise, penalize the agent\n",
    "        else:\n",
    "            reward = -1\n",
    "        \n",
    "        return reward, done\n",
    "        \n",
    "# Register the environment class under an id so that gym.make() can construct it.\n",
    "gym.register(\n",
    "    id=\"gymnasium_env/GridWorld-v0\",\n",
    "    entry_point=GridWorldEnv,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "db545637",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "<class 'gymnasium.wrappers.common.OrderEnforcing'>\n"
     ]
    }
   ],
   "source": [
    "# env = gym.make('CartPole-v1', render_mode='rgb_array')\n",
    "# Build the registered grid world with the configured grid size.\n",
    "env=gym.make(\"gymnasium_env/GridWorld-v0\", size=statespace_size_g)\n",
    "# Use the GPU when one is available, otherwise fall back to the CPU.\n",
    "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "print(device)\n",
    "# gym.make() hands back a wrapper object rather than a bare GridWorldEnv; show its type.\n",
    "print(type(env))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "7aa6c889",
   "metadata": {},
   "outputs": [],
   "source": [
    "# column_names = ['cp', 'cv', 'pa', 'pav']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "84732b72",
   "metadata": {},
   "outputs": [],
   "source": [
    "def orthonormalization(Q):\n",
    "    \"\"\"Orthonormalise the columns of Q one after another.\n",
    "\n",
    "    Every column has its projection onto the previously produced columns removed and is\n",
    "    then divided by its L-2 norm plus 1e-6 (the offset avoids a division by zero).\n",
    "\n",
    "    :param Q: two-dimensional array whose columns are processed from left to right\n",
    "    :return: array of the same shape as Q holding the processed columns\n",
    "    \"\"\"\n",
    "    n_rows, n_cols = Q.shape\n",
    "    basis = np.zeros(shape=(n_rows, n_cols))\n",
    "    # The first column has nothing to be projected against; it is only rescaled.\n",
    "    first = Q[:, 0]\n",
    "    basis[:, 0] = first / (norm(first) + 1e-6)\n",
    "    for col in range(1, n_cols):\n",
    "        previous = basis[:, :col]\n",
    "        column = Q[:, col]\n",
    "        residual = column - previous.dot(previous.T.dot(column))\n",
    "        basis[:, col] = residual / (norm(residual) + 1e-6)\n",
    "    return basis"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "973f1f9b",
   "metadata": {},
   "outputs": [],
   "source": [
    "def softmax1(action, values, other_values, location):\n",
    "    \"\"\"Row-wise softmax probability of `action`.\n",
    "\n",
    "    `values` is inserted as column `location` into `other_values`; the softmax is taken over\n",
    "    the columns of the resulting matrix and the entry at column `action` is returned per row.\n",
    "\n",
    "    :param action: column index (one per row, or a single index used for all rows) to read out\n",
    "    :param values: one value per row for the column that is inserted\n",
    "    :param other_values: two-dimensional array with the remaining columns\n",
    "    :param location: column position at which `values` is inserted\n",
    "    :return: array with one probability per row\n",
    "    \"\"\"\n",
    "    all_values = np.insert(other_values, location, values, axis=1)\n",
    "    # Subtracting the row maximum leaves the softmax unchanged but keeps np.exp from\n",
    "    # overflowing (which would turn the ratio into inf / inf = nan).\n",
    "    shifted = all_values - np.max(all_values, axis=1, keepdims=True)\n",
    "    exps = np.exp(shifted)\n",
    "    return exps[np.arange(values.shape[0]), action] / np.sum(exps, axis=1)\n",
    "\n",
    "def norm(x):\n",
    "    \"\"\"\n",
    "    Compute the Euclidean (L-2) length of a vector.\n",
    "    :param x: the vector to measure; it must support elementwise `*` and `.sum()`\n",
    "    :return: the square root of the sum of the squared entries\n",
    "    \"\"\"\n",
    "    squared_total = (x * x).sum()\n",
    "    return squared_total ** 0.5\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "5b0af6ac",
   "metadata": {},
   "outputs": [],
   "source": [
    "class PiLoss:\n",
    "    \"\"\"Policy loss -log(softmax probability of the chosen action) * advantage.\n",
    "\n",
    "    The class is a singleton: every call of PiLoss() returns the same instance.\n",
    "    \"\"\"\n",
    "    _instance = None\n",
    "\n",
    "    def __new__(cls):\n",
    "        if cls._instance is not None:\n",
    "            return cls._instance\n",
    "        cls._instance = super(PiLoss, cls).__new__(cls)\n",
    "        return cls._instance\n",
    "\n",
    "    @staticmethod\n",
    "    def __call__(action, values, advantage, other_values, current):\n",
    "        \"\"\"\n",
    "        :param action: the action chosen\n",
    "        :param values: the values provided by current model\n",
    "        :param advantage: factor the negative log-probability is multiplied with\n",
    "        :param other_values: the output by other models\n",
    "        :param current: the action represented by the current model\n",
    "        :return: -log(p + 1e-6) * advantage, where p is the softmax probability of `action`\n",
    "        \"\"\"\n",
    "        prob_chosen = softmax1(action, values, other_values, current) + 1e-6\n",
    "        return -np.log(prob_chosen) * advantage\n",
    "\n",
    "    @staticmethod\n",
    "    def g(action, values, advantage, other_values, current):\n",
    "        \"\"\"First-order term: -advantage * (1 - p) where action == current, advantage * p elsewhere.\n",
    "\n",
    "        p is the softmax probability of the action `current`.\n",
    "        \"\"\"\n",
    "        prob_current = softmax1(current, values, other_values, current)\n",
    "        when_chosen = -advantage * (1 - prob_current)\n",
    "        when_other = advantage * prob_current\n",
    "        return np.where(action == current, when_chosen, when_other)\n",
    "\n",
    "    @staticmethod\n",
    "    def h(action, values, advantage, other_values, current):\n",
    "        \"\"\"Second-order term advantage * p * (1 - p), p being the softmax probability of `current`.\"\"\"\n",
    "        prob_current = softmax1(current, values, other_values, current)\n",
    "        return advantage * prob_current * (1 - prob_current)\n",
    "\n",
    "    @staticmethod\n",
    "    def __repr__():\n",
    "        return 'pi_loss'\n",
    "\n",
    "    @staticmethod\n",
    "    def __str__():\n",
    "        return 'pi_loss'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "67942365",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Registry used by loss_function() to turn a string identifier into a loss object.\n",
    "loss_functions = {\n",
    "    'pi_loss': PiLoss()\n",
    "}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "693287f4",
   "metadata": {},
   "outputs": [],
   "source": [
    "def loss_function(loss):\n",
    "    \"\"\"Resolve a loss specification to a loss object.\n",
    "\n",
    "    :param loss: either a callable loss or a key of the `loss_functions` registry\n",
    "    :return: `loss` itself when it is callable, otherwise `loss_functions[loss]`\n",
    "    \"\"\"\n",
    "    return loss if callable(loss) else loss_functions[loss]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "ae0af97c",
   "metadata": {},
   "outputs": [],
   "source": [
    "def calc_risk(loss, action, rules, states, reg, advantage, others, current):\n",
    "    \"\"\"Regularised risk of a rule ensemble.\n",
    "\n",
    "    :param loss: callable evaluated as loss(action, scores, advantage, others, current)\n",
    "    :param rules: ensemble that is iterable (members expose `.y`) and callable on `states`\n",
    "    :param reg: factor of the penalty reg * sum(y ** 2) / 2 over the rule weights\n",
    "    :return: summed loss plus the weight penalty\n",
    "    \"\"\"\n",
    "    weights = np.array([member.y for member in rules])\n",
    "    data_term = sum(loss(action, rules(states), advantage, others, current))\n",
    "    penalty = reg * sum(weights * weights) / 2\n",
    "    return data_term + penalty"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "d06dc96b",
   "metadata": {},
   "outputs": [],
   "source": [
    "class FullyCorrectiveA2C:\n",
    "    \"\"\"Weight update that re-optimises the weights of all rules of an ensemble at once.\n",
    "\n",
    "    The weights minimise the summed loss plus the penalty reg * sum(w ** 2) / 2.\n",
    "    \"\"\"\n",
    "    def __init__(self, loss='pi_loss', reg=regular, solver='L-BFGS-B'):\n",
    "        \"\"\"\n",
    "        :param loss: loss object or identifier understood by loss_function()\n",
    "        :param reg: regularisation strength\n",
    "        :param solver: 'GD', 'Line', or any other value, which is passed to scipy.optimize.minimize as `method`\n",
    "        \"\"\"\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        self.solver = solver\n",
    "\n",
    "    @staticmethod\n",
    "    def get_risk(loss, action, q_mat, reg, advantage, others, current):\n",
    "        \"\"\"Return a function weights -> regularised risk, with scores q_mat.dot(weights).\"\"\"\n",
    "        def sum_loss(weights):\n",
    "            return sum(loss(action, q_mat.dot(weights), advantage, others, current)) + reg * sum(weights * weights) / 2\n",
    "\n",
    "        return sum_loss\n",
    "\n",
    "    @staticmethod\n",
    "    def get_gradient(g, action, q_mat, reg, advantage, other, current):\n",
    "        \"\"\"Return a function weights -> q_mat.T.dot(g(...)) + reg * weights.\"\"\"\n",
    "        def gradient(weights):\n",
    "            grad_vec = g(action, q_mat.dot(weights), advantage, other, current)\n",
    "            return q_mat.T.dot(grad_vec) + reg * weights\n",
    "\n",
    "        return gradient\n",
    "\n",
    "    @staticmethod\n",
    "    def get_hessian(h, action, q_mat, reg, advantage, other, current):\n",
    "        \"\"\"Return a function weights -> q_mat.T diag(h(...)) q_mat + reg * identity.\"\"\"\n",
    "        def hessian(weights):\n",
    "            h_vec = h(action, q_mat.dot(weights), advantage, other, current)\n",
    "            return q_mat.T.dot(np.diag(h_vec)).dot(q_mat) + np.diag([reg] * len(weights))\n",
    "\n",
    "        return hessian\n",
    "\n",
    "    def calc_weight(self, data, action, rules, advantage, other, current):\n",
    "        \"\"\"Compute new weights for all rules.\n",
    "\n",
    "        :param data: data on which every rule query is evaluated\n",
    "        :param action: actions taken, converted to an array\n",
    "        :param rules: indexable ensemble whose members expose `.q` (query) and `.y` (weight)\n",
    "        :param advantage: passed through to the loss\n",
    "        :param other: passed through to the loss\n",
    "        :param current: passed through to the loss\n",
    "        :return: array with one weight per rule; the rules themselves are not modified here\n",
    "        \"\"\"\n",
    "        g = self.loss.g\n",
    "        h = self.loss.h\n",
    "        loss = self.loss\n",
    "        y = np.array(action)\n",
    "        # One column per rule; adding np.zeros turns the query output into a float column.\n",
    "        q_mat = np.column_stack(\n",
    "            [rules[i].q(data) + np.zeros(len(data)) for i in range(len(rules))])\n",
    "        sum_loss = self.get_risk(loss, y, q_mat, self.reg, advantage, other, current)\n",
    "        gradient = self.get_gradient(g, y, q_mat, self.reg, advantage, other, current)\n",
    "        # NOTE: the Hessian is built but not used below (the `hess` argument of minimize is commented out).\n",
    "        hessian = self.get_hessian(h, y, q_mat, self.reg, advantage, other, current)\n",
    "        # NOTE(review): GoldenRatioSearch is not defined in the visible part of this notebook;\n",
    "        # the 'GD' and 'Line' branches need it to be available at call time.\n",
    "        if self.solver == 'GD':  # Gradient descent\n",
    "            w = np.array([r.y for r in rules])\n",
    "            # presumably chosen so that old_w differs from w and the loop is entered -- TODO confirm\n",
    "            old_w = np.ones_like(w) * (1.0 if len(w) - sum(w) > 1e-5 else 2.0)\n",
    "            i = 0\n",
    "            # At most 50 line-search steps along the normalised negative gradient.\n",
    "            while norm(old_w - w) > 1e-3 and i < 50:\n",
    "                old_w = np.array(w)\n",
    "                if norm(gradient(w)) == 0:\n",
    "                    break\n",
    "                p = -gradient(w) / norm(gradient(w))\n",
    "                w += GoldenRatioSearch(sum_loss, old_w, p, gradient).run() * p\n",
    "                i += 1\n",
    "        elif self.solver == 'Line':\n",
    "            # A single line-search step along the normalised negative gradient.\n",
    "            w = np.array([r.y for r in rules])\n",
    "            if norm(gradient(w)) != 0:\n",
    "                p = -gradient(w) / norm(gradient(w))\n",
    "                distance = GoldenRatioSearch(sum_loss, w, p, gradient).run()\n",
    "                w += distance * p\n",
    "        else:\n",
    "            # Any other solver name goes to scipy, with the current rule weights as the starting point.\n",
    "            w = np.array([r.y for r in rules])\n",
    "            w = scipy.optimize.minimize(sum_loss, w, method=self.solver, jac=gradient,  # hess=hessian,\n",
    "                                        options={'disp': False}).x\n",
    "\n",
    "        return w"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "2d0c04a8",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ObjectFunction:\n",
    "    \"\"\"Base class of search objectives.\n",
    "\n",
    "    It stores the loss terms g and h, the data and the target, all sorted by descending\n",
    "    ratio g / h. Subclasses implement __call__ and bound.\n",
    "    \"\"\"\n",
    "    def __init__(self, data, target, predictions, loss, reg, advantage, other_values, current, rules=None):\n",
    "        \"\"\"\n",
    "        :param data: object supporting `.iloc` row selection\n",
    "        :param target: object supporting `.iloc` row selection, aligned with `data`\n",
    "        :param predictions: current scores; zeros shaped like `target` are used when None\n",
    "        :param loss: loss object or identifier understood by loss_function()\n",
    "        :param reg: regularisation strength (stored only)\n",
    "        :param rules: accepted but not used by this base class\n",
    "        \"\"\"\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        if predictions is None:\n",
    "            predictions = np.zeros_like(target)\n",
    "        grad = np.array(self.loss.g(target, predictions, advantage, other_values, current))\n",
    "        # The small offset keeps the ratio below finite when h is zero.\n",
    "        hess = np.array(self.loss.h(target, predictions, advantage, other_values, current)) + 1e-6\n",
    "        descending = np.argsort(grad / hess)[::-1]\n",
    "        self.g = grad[descending]\n",
    "        self.h = hess[descending]\n",
    "        self.data = data.iloc[descending].reset_index(drop=True)\n",
    "        self.target = target.iloc[descending].reset_index(drop=True)\n",
    "        self.n = len(target)\n",
    "\n",
    "    def __call__(self, ext):\n",
    "        \"\"\"Objective value of an extension; to be provided by subclasses.\"\"\"\n",
    "        raise NotImplementedError()\n",
    "\n",
    "    def bound(self, ext):\n",
    "        \"\"\"Bound on the objective value; to be provided by subclasses.\"\"\"\n",
    "        raise NotImplementedError()\n",
    "\n",
    "    def search(self, method='greedy', verbose=False, **search_params):\n",
    "        \"\"\"Run the named realkd search method on the stored data and return its result.\"\"\"\n",
    "        from realkd.search import search_methods\n",
    "        context = Context.from_df(self.data, **search_params)\n",
    "        if verbose >= 2:\n",
    "            print(f'Created search context with {len(context.attributes)} attributes')\n",
    "        searcher = search_methods[method](context, self, self.bound, verbose=verbose, **search_params)\n",
    "        return searcher.run()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "eaec4413",
   "metadata": {},
   "outputs": [],
   "source": [
    "class OrthogonalBoostingObjective(ObjectFunction):\n",
    "    \"\"\"Search objective that relates the gradient sum of a candidate query to the norm of the\n",
    "    part of the query that is orthogonal to the rules already in the ensemble.\n",
    "    \"\"\"\n",
    "    def __init__(self, data, target, advantage, other_values, current, predictions=None, loss=SquaredLoss, reg=regular,\n",
    "                 rules=None,\n",
    "                 epsilon=1e-4, **kwargs):\n",
    "        \"\"\"\n",
    "        :param data: object supporting `.iloc` row selection\n",
    "        :param target: object supporting `.iloc` row selection, aligned with `data`\n",
    "        :param predictions: current scores; zeros shaped like `target` are used when None\n",
    "        :param loss: loss object or identifier understood by loss_function()\n",
    "        :param reg: regularisation strength (stored by the base class)\n",
    "        :param rules: rules already in the ensemble; None is treated as no rules\n",
    "        :param epsilon: offset added to the denominator in __call__\n",
    "        :param kwargs: must contain 'orth_basis' (one row per data row) when `rules` is non-empty\n",
    "        \"\"\"\n",
    "        # The base initialiser sets self.loss, self.reg and self.n.\n",
    "        super().__init__(data, target, predictions, loss, reg, advantage, other_values, current, rules)\n",
    "        self.rules = [] if rules is None else rules\n",
    "        self.epsilon = epsilon\n",
    "        predictions = np.zeros_like(\n",
    "            target) if predictions is None else predictions\n",
    "        g = np.array(self.loss.g(target, predictions, advantage, other_values, current))\n",
    "        h = np.array(self.loss.h(target, predictions, advantage, other_values, current)) + 1e-6\n",
    "        # Rows are sorted by descending g here, whereas the base class sorts by g / h.\n",
    "        # Everything indexed by an extension (g, h, data, target, orth_basis) must use this\n",
    "        # same permutation, so h is re-sorted as well instead of keeping the base class order.\n",
    "        order = np.argsort(g)[::-1]\n",
    "        self.g = g[order]\n",
    "        self.h = h[order]\n",
    "        self.data = data.iloc[order].reset_index(drop=True)\n",
    "        self.target = target.iloc[order].reset_index(drop=True)\n",
    "        # Use self.rules (never None) so that the default rules=None does not break len().\n",
    "        if len(self.rules) != 0:\n",
    "            orth_basis = kwargs['orth_basis']\n",
    "            self.orth_basis = orth_basis[order]\n",
    "            # Remove from g its projection onto the columns of the basis.\n",
    "            self.g = self.g - self.orth_basis @ self.orth_basis.T @ self.g\n",
    "        else:\n",
    "            self.orth_basis = np.zeros(self.n)\n",
    "\n",
    "    def __call__(self, ext):\n",
    "        \"\"\"Objective value of the rows `ext`.\n",
    "\n",
    "        :return: -inf for an empty extension; without rules |sum g| / sqrt(sum h); with rules\n",
    "                 |sum g| / (orthogonal norm + epsilon), or 0 when that norm is at most 1e-4\n",
    "        \"\"\"\n",
    "        if len(ext) == 0:\n",
    "            return -inf\n",
    "        g_q = self.g[ext]\n",
    "        if len(self.rules) == 0:\n",
    "            h_q = self.h[ext]\n",
    "            return abs(g_q.sum()) / np.sqrt(h_q.sum())\n",
    "        length = self.fast_orth_norm(ext)\n",
    "        if length > 1e-4:\n",
    "            obj = abs(g_q.sum()) / (length + self.epsilon)\n",
    "        else:\n",
    "            obj = 0\n",
    "        return obj\n",
    "\n",
    "    def fast_orth_norm(self, ext):\n",
    "        \"\"\"Return sqrt(|len(ext) - sum_i s_i ** 2|), s_i being the sum of basis column i over `ext`.\n",
    "\n",
    "        Assuming the columns of orth_basis are orthonormal, this is the norm of the indicator\n",
    "        vector of `ext` after removing its projection onto the basis.\n",
    "        \"\"\"\n",
    "        deltas = self.orth_basis[ext]\n",
    "        length = len(ext)\n",
    "        okqi = abs(np.sum(deltas, axis=0))\n",
    "        q_para_norms = (okqi ** 2).sum()\n",
    "        q_orth_norms_sq = np.abs(length - q_para_norms)\n",
    "        return np.sqrt(q_orth_norms_sq)\n",
    "\n",
    "    def fast_para_norms_prefix(self, ext):\n",
    "        \"\"\"Same quantity as fast_orth_norm, computed for every prefix of `ext` via cumulative sums.\n",
    "\n",
    "        :return: array whose entry k belongs to the first k + 1 rows of `ext`\n",
    "        \"\"\"\n",
    "        deltas = self.orth_basis[ext]\n",
    "        length = len(ext)\n",
    "        okqi = np.cumsum(deltas, axis=0)\n",
    "        q_para_norms = (okqi ** 2).sum(axis=1)\n",
    "        q_orth_norms_sq = np.abs(np.arange(1, length + 1) - q_para_norms)\n",
    "        q_orth_norms = np.sqrt(q_orth_norms_sq)\n",
    "        return q_orth_norms\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "626cceb7",
   "metadata": {},
   "outputs": [],
   "source": [
    "class GeneralRuleBoostingEstimator(BaseEstimator):\n",
    "    \"\"\"Estimator that grows an additive rule ensemble one rule at a time.\n",
    "\n",
    "    Every round searches a query with the objective function, appends it as a rule and lets\n",
    "    the weight update method recompute the weights of all rules.\n",
    "    \"\"\"\n",
    "    def __init__(self, num_rules, objective_function, weight_update_method, loss='squared', reg=regular,\n",
    "                 search='greedy', max_col_attr=10,\n",
    "                 search_params=None, verbose=False):\n",
    "        \"\"\"\n",
    "        :param num_rules: ensemble size at which fit() stops adding rules\n",
    "        :param objective_function: class instantiated in fit(); its instances provide search()\n",
    "        :param weight_update_method: object providing calc_weight(data, target, rules, advantage, other_values, current)\n",
    "        :param loss: loss object or identifier understood by loss_function()\n",
    "        :param reg: regularisation strength, also written to the weight update method\n",
    "        :param search: name of the search method handed to the objective's search()\n",
    "        :param max_col_attr: stored, and used in the default `search_params`\n",
    "        :param search_params: keyword arguments for the search; defaults are built when None\n",
    "        :param verbose: when truthy, every newly created rule is printed\n",
    "        \"\"\"\n",
    "        if search_params is None:\n",
    "            search_params = {'order': 'bestboundfirst', 'apx': 1.0, 'max_depth': None, 'discretization': qcut,\n",
    "                             'max_col_attr': max_col_attr}\n",
    "        self.num_rules = num_rules\n",
    "        # Budget for fit(): every rule costs 1 + len(query) components.\n",
    "        self.num_components = 500\n",
    "        self.objective = objective_function\n",
    "        self.objective_function = objective_function\n",
    "        self.max_col_attr = max_col_attr\n",
    "        self.weight_update_method = weight_update_method\n",
    "        self.loss = loss_function(loss)\n",
    "        self.reg = reg\n",
    "        # Hand over the resolved loss object rather than the raw argument: the weight update\n",
    "        # accesses loss.g / loss.h, which a string identifier does not provide.\n",
    "        self.weight_update_method.loss = self.loss\n",
    "        self.weight_update_method.reg = reg\n",
    "        self.verbose = verbose\n",
    "        self.search = search\n",
    "        self.rules_ = AdditiveRuleEnsemble([])\n",
    "        self.search_params = search_params\n",
    "        self.history = []\n",
    "        self.time = []\n",
    "\n",
    "    def set_reg(self, reg):\n",
    "        \"\"\"Set the regularisation strength here, on the objective and on the weight update method.\"\"\"\n",
    "        self.reg = reg\n",
    "        self.objective.reg = reg\n",
    "        self.weight_update_method.reg = reg\n",
    "\n",
    "    def fit(self, data, target, advantage, other_values, current, has_origin_rules=False, verbose=False):\n",
    "        \"\"\"Add rules until `num_rules` rules exist or the component budget is used up.\n",
    "\n",
    "        :param data: training data handed to the objective, the queries and the weight update\n",
    "        :param target: training target handed to the objective and the weight update\n",
    "        :param advantage: passed through to the objective and the weight update\n",
    "        :param other_values: passed through to the objective and the weight update\n",
    "        :param current: passed through to the objective and the weight update\n",
    "        :param has_origin_rules: when False the ensemble, history and timings are cleared first;\n",
    "                                 when True the existing rules are kept and extended\n",
    "        :param verbose: verbosity handed to the search\n",
    "        :return: self\n",
    "        \"\"\"\n",
    "        if not has_origin_rules:\n",
    "            self.history = []\n",
    "            self.time = []\n",
    "            self.rules_.members = []\n",
    "            orth_basis = np.array([])\n",
    "        else:\n",
    "            # Start from an orthonormalised basis of the existing rules' query columns.\n",
    "            q_mat = np.column_stack(\n",
    "                [self.rules_[i].q(data) + np.zeros(len(data)) for i in range(len(self.rules_))])\n",
    "            orth_basis = orthonormalization(q_mat)\n",
    "        num_components = 0\n",
    "        while len(self.rules_) < self.num_rules and num_components < self.num_components:\n",
    "            start_time = datetime.now()\n",
    "            # Search for a rule\n",
    "            scores = self.rules_(data)\n",
    "            obj = self.objective(data, target, advantage, other_values, current, predictions=scores,\n",
    "                                 loss=self.loss, reg=self.reg, rules=self.rules_, orth_basis=orth_basis)\n",
    "            q = obj.search(method=self.search, verbose=verbose,\n",
    "                           **self.search_params)\n",
    "            if hasattr(self.objective, 'opt_weight') and callable(getattr(self.objective, 'opt_weight')):\n",
    "                y = obj.opt_weight(q)\n",
    "            else:\n",
    "                y = 1.0  # np.random.random()\n",
    "            q_vec = q(data)\n",
    "            num_components += (1 + len(q))\n",
    "            # Extend the basis by the part of the new query column orthogonal to the existing basis.\n",
    "            if len(orth_basis) == 0:\n",
    "                basis = q_vec / norm(q_vec)\n",
    "                orth_basis = np.array([basis]).T\n",
    "            else:\n",
    "                basis = q_vec - orth_basis.dot(orth_basis.T.dot(q_vec))\n",
    "                basis = basis / (norm(basis) + 1e-6)\n",
    "                orth_basis = np.hstack((orth_basis, np.array([basis]).T))\n",
    "            rule = Rule(q, y)\n",
    "            if self.verbose:\n",
    "                print(rule)\n",
    "            self.rules_.append(rule)\n",
    "            # Calculate weights\n",
    "            weights = self.weight_update_method.calc_weight(\n",
    "                data, target, self.rules_, advantage, other_values, current)\n",
    "            for i in range(len(self.rules_)):\n",
    "                self.rules_[i].y = weights[i]\n",
    "            # Keep a snapshot of the ensemble and the duration of this round.\n",
    "            self.history.append(AdditiveRuleEnsemble(\n",
    "                [Rule(q=rule.q, y=rule.y) for rule in self.rules_.members]))\n",
    "            end_time = datetime.now()\n",
    "            self.time.append(str(end_time - start_time))\n",
    "        return self\n",
    "\n",
    "    def predict(self, data):\n",
    "        \"\"\"Turn the ensemble scores into predictions via the loss's `predictions` method.\n",
    "\n",
    "        The loss in use has to provide `predictions`; PiLoss as defined in this notebook does not.\n",
    "        \"\"\"\n",
    "        loss = loss_function(self.loss)\n",
    "        return loss.predictions(self.rules_(data))\n",
    "\n",
    "    def decision_function(self, data):\n",
    "        \"\"\"Return the raw ensemble scores for `data`.\"\"\"\n",
    "        return self.rules_(data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "b50ce787",
   "metadata": {},
   "outputs": [],
   "source": [
    "# class Actor(nn.Module):\n",
    "#     def __init__(self, action_space, node=16):\n",
    "#         super(Actor, self).__init__()\n",
    "#         self.fc1 = nn.Linear(4, node)  \n",
    "# #         self.fc1_ = nn.Linear(node, node)\n",
    "#         self.fc2 = nn.Linear(node, action_space)\n",
    "\n",
    "#     def forward(self, state):\n",
    "#         x = F.relu(self.fc1(state))\n",
    "# #         x = F.relu(self.fc1_(x))\n",
    "#         x = self.fc2(x)\n",
    "#         return x"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "84b0ee0a",
   "metadata": {},
   "outputs": [],
   "source": [
    "def copy_rules(origin_rules):\n",
    "    \"\"\"Build a new ensemble whose rules carry the same queries and weights as `origin_rules`.\n",
    "\n",
    "    New Rule objects are created, so changing a weight in the copy leaves the original untouched.\n",
    "    \"\"\"\n",
    "    cloned = [Rule(q=origin_rules[idx].q, y=origin_rules[idx].y)\n",
    "              for idx in range(len(origin_rules))]\n",
    "    return AdditiveRuleEnsemble(cloned)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "bb3fcc8c",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ActorRule:\n",
    "    \"\"\"Actor made of one rule-boosting estimator per action.\n",
    "\n",
    "    `model` holds the estimators evaluated by __call__; `best_model` holds a second set of\n",
    "    estimators (built with reg=0.01) evaluated by predict().\n",
    "    \"\"\"\n",
    "    def __init__(self, action_space=4, num_rules=number_rules):\n",
    "        self.action_space = action_space\n",
    "\n",
    "        def build_estimator(reg_value):\n",
    "            # Both estimator lists share every setting except the regularisation strength.\n",
    "            return GeneralRuleBoostingEstimator(num_rules=num_rules,\n",
    "                                                objective_function=OrthogonalBoostingObjective,\n",
    "                                                weight_update_method=FullyCorrectiveA2C(), loss=PiLoss(),\n",
    "                                                reg=reg_value, search='greedy', max_col_attr=20, verbose=False)\n",
    "\n",
    "        self.model = [build_estimator(regular) for _ in range(action_space)]\n",
    "        self.best_model = [build_estimator(0.01) for _ in range(action_space)]\n",
    "\n",
    "    def __call__(self, state):\n",
    "        \"\"\"Return an array with the rule-ensemble output of every estimator in `model`.\"\"\"\n",
    "        outputs = [estimator.rules_(state) for estimator in self.model]\n",
    "        return np.array(outputs)\n",
    "\n",
    "    def predict(self, state):\n",
    "        \"\"\"Return an array with the rule-ensemble output of every estimator in `best_model`.\"\"\"\n",
    "        outputs = [self.best_model[idx].rules_(state) for idx, _ in enumerate(self.model)]\n",
    "        return np.array(outputs)\n",
    "\n",
    "\n",
    "def update_rules(estimator: GeneralRuleBoostingEstimator, x, y, adv, other_values, current):\n",
    "    \"\"\"Drop the weakest rule of an estimator, refit, and keep the result only if the risk does not grow.\n",
    "\n",
    "    :param estimator: estimator whose `rules_` are replaced in place\n",
    "    :param x: data handed to calc_risk, calc_weight and fit\n",
    "    :param y: actions / targets handed to calc_risk, calc_weight and fit\n",
    "    :param adv: advantages, passed through\n",
    "    :param other_values: passed through\n",
    "    :param current: passed through\n",
    "    :return: the same estimator object\n",
    "    \"\"\"\n",
    "    queries_lst = []\n",
    "    queries = {}\n",
    "    # Snapshot of the rules and their risk, used for the rollback at the end.\n",
    "    original_rules = copy_rules(estimator.rules_)\n",
    "    origin_risk = calc_risk(PiLoss(), y, original_rules, x, estimator.reg, adv, other_values, current)\n",
    "    # Merge rules whose queries have the same string form by summing their weights.\n",
    "    for i in range(len(estimator.rules_)):\n",
    "        q_str = str(estimator.rules_[i].q)\n",
    "        if q_str not in queries:\n",
    "            queries[q_str] = estimator.rules_[i].y\n",
    "            queries_lst.append(estimator.rules_[i].q)\n",
    "        else:\n",
    "            queries[q_str] += estimator.rules_[i].y\n",
    "    for k in queries:\n",
    "        queries[k] = abs(queries[k])\n",
    "    # The query with the smallest absolute summed weight is the one left out.\n",
    "    # NOTE(review): min() raises ValueError when the estimator has no rules yet.\n",
    "    min_weight_query = min(queries, key=queries.get)\n",
    "    rules = []\n",
    "    # The absolute weights assigned here only serve as the starting point of calc_weight below.\n",
    "    for i in range(len(queries_lst)):\n",
    "        q_str = str(queries_lst[i])\n",
    "        if q_str != min_weight_query:\n",
    "            rules.append(Rule(q=queries_lst[i], y=queries[str(queries_lst[i])]))\n",
    "    # With a single distinct query nothing would remain, so that query is kept.\n",
    "    if len(rules) == 0:\n",
    "        rules = [Rule(q=queries_lst[0], y=queries[str(queries_lst[0])])]\n",
    "    new_rules = AdditiveRuleEnsemble(rules)\n",
    "    weights = FullyCorrectiveA2C(loss_function('pi_loss'), estimator.reg).calc_weight(x, y, new_rules, adv,\n",
    "                                                                                      other_values, current)\n",
    "    for i in range(len(new_rules)):\n",
    "        new_rules[i].y = weights[i]\n",
    "    estimator.rules_ = new_rules\n",
    "    # fit() keeps the reduced ensemble and adds rules until the estimator's limits are reached.\n",
    "    estimator.fit(x, y, adv, other_values, current, has_origin_rules=True)\n",
    "    weights = FullyCorrectiveA2C(loss_function('pi_loss'), estimator.reg).calc_weight(x, y, estimator.rules_, adv,\n",
    "                                                                                      other_values, current)\n",
    "    for i in range(len(estimator.rules_)):\n",
    "        estimator.rules_[i].y = weights[i]\n",
    "    new_risk = calc_risk(PiLoss(), y, estimator.rules_, x, estimator.reg, adv, other_values, current)\n",
    "    # Roll back to the snapshot when the refitted ensemble has a higher risk.\n",
    "    if new_risk > origin_risk:\n",
    "        estimator.rules_ = copy_rules(original_rules)\n",
    "        print(\"origin\", origin_risk, 'new', new_risk, 'not updated')\n",
    "        # risk = sum(PiLoss.__call__(y, estimator.rules_[i].y))\n",
    "    return estimator"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "2824981f",
   "metadata": {},
   "outputs": [],
   "source": [
    "class Critic(nn.Module):\n",
    "    \"\"\"\n",
    "    State-value network: one hidden ReLU layer followed by a single linear output unit.\n",
    "\n",
    "    :param node: Number of hidden units.\n",
    "    :param state_dim: Number of input features per state. Defaults to 5, the value that was\n",
    "                      previously hard-coded, so existing ``Critic()`` calls are unaffected.\n",
    "    \"\"\"\n",
    "    def __init__(self, node=16, state_dim=5):\n",
    "        super().__init__()\n",
    "        self.fc1 = nn.Linear(state_dim, node)\n",
    "        self.fc2 = nn.Linear(node, 1)\n",
    "\n",
    "    def forward(self, state):\n",
    "        \"\"\"Map states (last dimension ``state_dim``) to value estimates (last dimension 1).\"\"\"\n",
    "        hidden = F.relu(self.fc1(state))\n",
    "        return self.fc2(hidden)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "6b6e2dd7",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Discount factor applied when per-step rewards are folded into returns.\n",
    "gamma = 0.99\n",
    "# Policy object used by train(); ActorRule is not defined in this cell.\n",
    "actor = ActorRule()\n",
    "# Value network and its optimizer. The same network is referenced later as value_func.\n",
    "critic = Critic().to(device)\n",
    "critic_optimizer = optim.AdamW(critic.parameters(), lr=0.001)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "24c116b8",
   "metadata": {},
   "outputs": [],
   "source": [
    "class ActorNet(nn.Module):\n",
    "    \"\"\"\n",
    "    Policy network: 5 input features -> one hidden ReLU layer -> 4 output logits.\n",
    "\n",
    "    :param hidden_dim: Number of hidden units.\n",
    "    \"\"\"\n",
    "    def __init__(self, hidden_dim=16):\n",
    "        super().__init__()\n",
    "        self.hidden = nn.Linear(5, hidden_dim)\n",
    "        self.output = nn.Linear(hidden_dim, 4)\n",
    "\n",
    "    def forward(self, s):\n",
    "        \"\"\"Return the unnormalised logits for the state batch ``s``.\"\"\"\n",
    "        activated = F.relu(self.hidden(s))\n",
    "        return self.output(activated)\n",
    "\n",
    "\n",
    "# Neural-network policy sampled by the actor-critic loop in the next cell.\n",
    "actor_func = ActorNet().to(device)\n",
    "# Alias, not a copy: value_func and critic are the same module object.\n",
    "value_func = critic"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "c565d5ef",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/fyan/.local/lib/python3.10/site-packages/gymnasium/utils/passive_env_checker.py:142: UserWarning: \u001b[33mWARN: The obs returned by the `reset()` method was expecting a tuple, actual type: <class 'numpy.ndarray'>\u001b[0m\n",
      "  logger.warn(f\"{pre} was expecting a tuple, actual type: {type(obs)}\")\n",
      "/home/fyan/.local/lib/python3.10/site-packages/gymnasium/utils/passive_env_checker.py:158: UserWarning: \u001b[33mWARN: The obs returned by the `reset()` method is not within the observation space.\u001b[0m\n",
      "  logger.warn(f\"{pre} is not within the observation space.\")\n",
      "/home/fyan/.local/lib/python3.10/site-packages/gymnasium/utils/passive_env_checker.py:142: UserWarning: \u001b[33mWARN: The obs returned by the `step()` method was expecting a tuple, actual type: <class 'numpy.ndarray'>\u001b[0m\n",
      "  logger.warn(f\"{pre} was expecting a tuple, actual type: {type(obs)}\")\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run episode 0 with rewards -63\n",
      "Run episode 1 with rewards -78\n",
      "Run episode 2 with rewards -69\n",
      "Run episode 3 with rewards 39\n",
      "Run episode 4 with rewards -201\n",
      "Run episode 5 with rewards -63\n",
      "Run episode 6 with rewards -201\n",
      "Run episode 7 with rewards -201\n",
      "Run episode 8 with rewards -120\n",
      "Run episode 9 with rewards -180\n",
      "Run episode 10 with rewards -142\n",
      "Run episode 11 with rewards -63\n",
      "Run episode 12 with rewards -201\n",
      "Run episode 13 with rewards 0\n",
      "Run episode 14 with rewards 28\n",
      "Run episode 15 with rewards -87\n",
      "Run episode 16 with rewards -41\n",
      "Run episode 17 with rewards -44\n",
      "Run episode 18 with rewards -29\n",
      "Run episode 19 with rewards 27\n",
      "Run episode 20 with rewards -121\n",
      "Run episode 21 with rewards -42\n",
      "Run episode 22 with rewards -201\n",
      "Run episode 23 with rewards -117\n",
      "Run episode 24 with rewards 23\n",
      "Run episode 25 with rewards 23\n",
      "Run episode 26 with rewards -41\n",
      "Run episode 27 with rewards -86\n",
      "Run episode 28 with rewards -77\n",
      "Run episode 29 with rewards -3\n",
      "Run episode 30 with rewards 25\n",
      "Run episode 31 with rewards -38\n",
      "Run episode 32 with rewards -180\n",
      "Run episode 33 with rewards 6\n",
      "Run episode 34 with rewards 19\n",
      "Run episode 35 with rewards -201\n",
      "Run episode 36 with rewards 6\n",
      "Run episode 37 with rewards -26\n",
      "Run episode 38 with rewards 21\n",
      "Run episode 39 with rewards -43\n",
      "Run episode 40 with rewards 14\n",
      "Run episode 41 with rewards -19\n",
      "Run episode 42 with rewards -180\n",
      "Run episode 43 with rewards -77\n",
      "Run episode 44 with rewards -137\n",
      "Run episode 45 with rewards -54\n",
      "Run episode 46 with rewards -78\n",
      "Run episode 47 with rewards 22\n",
      "Run episode 48 with rewards -11\n",
      "Run episode 49 with rewards -12\n",
      "Run episode 50 with rewards -201\n",
      "Run episode 51 with rewards 1\n",
      "Run episode 52 with rewards 36\n",
      "Run episode 53 with rewards 14\n",
      "Run episode 54 with rewards -50\n",
      "Run episode 55 with rewards -120\n",
      "Run episode 56 with rewards 26\n",
      "Run episode 57 with rewards -180\n",
      "Run episode 58 with rewards 38\n",
      "Run episode 59 with rewards -88\n",
      "Run episode 60 with rewards -4\n",
      "Run episode 61 with rewards 33\n",
      "Run episode 62 with rewards 9\n",
      "Run episode 63 with rewards -64\n",
      "Run episode 64 with rewards -88\n",
      "Run episode 65 with rewards 1\n",
      "Run episode 66 with rewards 33\n",
      "Run episode 67 with rewards 16\n",
      "Run episode 68 with rewards -201\n",
      "Run episode 69 with rewards -4\n",
      "Run episode 70 with rewards 12\n",
      "Run episode 71 with rewards 26\n",
      "Run episode 72 with rewards -17\n",
      "Run episode 73 with rewards -56\n",
      "Run episode 74 with rewards 28\n",
      "Run episode 75 with rewards -180\n",
      "Run episode 76 with rewards -201\n",
      "Run episode 77 with rewards -61\n",
      "Run episode 78 with rewards -22\n",
      "Run episode 79 with rewards -28\n",
      "Run episode 80 with rewards -99\n",
      "Run episode 81 with rewards 27\n",
      "Run episode 82 with rewards -11\n",
      "Run episode 83 with rewards -102\n",
      "Run episode 84 with rewards -201\n",
      "Run episode 85 with rewards -132\n",
      "Run episode 86 with rewards -201\n",
      "Run episode 87 with rewards 40\n"
     ]
    }
   ],
   "source": [
    "# opt1 updates the value network. value_func is the same module as critic, so this is a\n",
    "# second AdamW instance over the parameters that critic_optimizer also holds.\n",
    "opt1 = torch.optim.AdamW(value_func.parameters(), lr=0.001)\n",
    "# opt2 updates the neural-network policy actor_func.\n",
    "opt2 = torch.optim.AdamW(actor_func.parameters(), lr=0.001)\n",
    "def pick_sample(s):\n",
    "    \"\"\"\n",
    "    :param s: A single (unbatched) observation accepted by ``np.expand_dims``.\n",
    "    :return: The sampled action index.\n",
    "    :functionality: Feeds the observation through ``actor_func`` without tracking gradients,\n",
    "                    converts the logits to probabilities with softmax and draws one action.\n",
    "    \"\"\"\n",
    "    with torch.no_grad():\n",
    "        # Add a leading batch axis of length 1 before handing the state to the network.\n",
    "        batch = torch.tensor(np.expand_dims(s, axis=0), dtype=torch.float).to(device)\n",
    "        # Drop the batch axis again so only the per-action logits remain.\n",
    "        action_logits = actor_func(batch).squeeze(dim=0)\n",
    "        action_probs = F.softmax(action_logits, dim=-1)\n",
    "        sampled = torch.multinomial(action_probs, num_samples=1)\n",
    "    return sampled.tolist()[0]\n",
    "reward_records = []\n",
    "for i in range(200):\n",
    "    #\n",
    "    # Run one episode until the environment ends it or the step budget is used up\n",
    "    #\n",
    "    done = False\n",
    "    states = []\n",
    "    actions = []\n",
    "    rewards = []\n",
    "    s, _ = env.reset(seed=np.random.randint(0, 1e6))\n",
    "    num_steps = 0\n",
    "    while not done and num_steps <= 200:\n",
    "        states.append(s.tolist())\n",
    "        a = pick_sample(s)\n",
    "        s, r, term, trunc, _ = env.step(a)\n",
    "        done = term or trunc\n",
    "        actions.append(a)\n",
    "        rewards.append(r)\n",
    "        num_steps += 1\n",
    "    #\n",
    "    # Discounted returns, accumulated backwards from the last step.\n",
    "    # The buffer is explicitly float: np.zeros_like(rewards) inherits an integer dtype when the\n",
    "    # rewards are integers, which silently truncates every discounted value on assignment.\n",
    "    #\n",
    "    reward_len = len(rewards)\n",
    "    cum_rewards = np.zeros(reward_len, dtype=np.float64)\n",
    "    for j in reversed(range(reward_len)):\n",
    "        cum_rewards[j] = rewards[j] + (cum_rewards[j+1]*gamma if j+1 < reward_len else 0)\n",
    "\n",
    "    #\n",
    "    # Train (optimize parameters)\n",
    "    #\n",
    "\n",
    "    # Critic update: regress the value estimates onto the discounted returns\n",
    "    opt1.zero_grad()\n",
    "    states = torch.tensor(states, dtype=torch.float).to(device)\n",
    "    cum_rewards = torch.tensor(cum_rewards, dtype=torch.float).to(device)\n",
    "    values = value_func(states)\n",
    "    values = values.squeeze(dim=1)\n",
    "    vf_loss = F.mse_loss(\n",
    "        values,\n",
    "        cum_rewards,\n",
    "        reduction=\"none\")\n",
    "    vf_loss.sum().backward()\n",
    "    opt1.step()\n",
    "\n",
    "    # Actor update: the advantage is the return minus the value estimate, re-evaluated after\n",
    "    # the critic step and without gradient tracking so that only the policy receives gradients\n",
    "    with torch.no_grad():\n",
    "        values = value_func(states).squeeze(dim=1)\n",
    "    opt2.zero_grad()\n",
    "    actions = torch.tensor(actions, dtype=torch.int64).to(device)\n",
    "    advantages = cum_rewards - values\n",
    "    logits = actor_func(states)\n",
    "    # cross_entropy returns -log pi(a|s), so negating it gives the log-probabilities\n",
    "    log_probs = -F.cross_entropy(logits, actions, reduction=\"none\")\n",
    "    pi_loss = -log_probs * advantages\n",
    "    pi_loss.sum().backward()\n",
    "    opt2.step()\n",
    "\n",
    "    # Report and record the undiscounted episode return\n",
    "    episode_return = sum(rewards)\n",
    "    print(\"Run episode {} with rewards {}\".format(i, episode_return))\n",
    "    reward_records.append(episode_return)\n",
    "    # Stop early on a good episode, but only after more than 80 episodes of training\n",
    "    if episode_return > 35 and i > 80:\n",
    "        break"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "f28c7004",
   "metadata": {},
   "outputs": [],
   "source": [
    "def manhattan_distance(location1, location2):\n",
    "    \"\"\"\n",
    "    :param location1: Indexable pair (x, y) giving the first location.\n",
    "    :param location2: Indexable pair (x, y) giving the second location.\n",
    "    :return: Sum of the absolute coordinate differences along both axes.\n",
    "    :functionality: Computes the Manhattan (L1) distance between two points of a 2D grid.\n",
    "    \"\"\"\n",
    "    delta_x = abs(location1[0] - location2[0])\n",
    "    delta_y = abs(location1[1] - location2[1])\n",
    "    return delta_x + delta_y"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "id": "a3a7c7ce",
   "metadata": {},
   "outputs": [],
   "source": [
    "def accuracy_test(env, agent, test_num=10):\n",
    "    \"\"\"\n",
    "    :param env: Environment whose ``reset()`` returns ``(state, info)`` and whose ``step(action)``\n",
    "                returns ``(next_state, reward, done, trunc, info)``.\n",
    "    :param agent: Callable policy. It is called with a one-row DataFrame (columns\n",
    "                  ``column_names``) and the index of its largest output is taken as the action.\n",
    "    :param test_num: Integer number of test episodes to run.\n",
    "    :return: Float fraction of test episodes whose step count stayed within three times the\n",
    "             reference path length.\n",
    "    :functionality: Runs ``test_num`` greedy episodes of at most 99 steps each and counts an\n",
    "                    episode as a success when ``num_steps <= 3 * actual_length``.\n",
    "    \"\"\"\n",
    "    successes = 0\n",
    "\n",
    "    for _ in range(test_num):\n",
    "        # Start a fresh episode\n",
    "        state, _ = env.reset()\n",
    "\n",
    "        # Reference path length, intended as agent -> item, item -> target (4, 4), plus one.\n",
    "        # NOTE(review): column_names labels state[2] and state[3] as 'x3-x1' and 'x4-x2', which\n",
    "        # reads like offsets rather than absolute coordinates - confirm that this formula and\n",
    "        # the hard-coded (4, 4) target match the environment.\n",
    "        actual_length = manhattan_distance((state[0], state[1]), (state[2], state[3])) + manhattan_distance(\n",
    "            (state[2], state[3]), (4, 4)) + 1\n",
    "\n",
    "        num_steps = 0\n",
    "        for _step in range(1, 100):  # Limit the number of time steps\n",
    "            # Query the policy that was passed in instead of the module-level ``actor``\n",
    "            action_probs = agent(pd.DataFrame(np.array([state]), columns=column_names))\n",
    "            # Greedy choice: act on the largest output\n",
    "            action = np.argmax(action_probs)\n",
    "            next_state, reward, done, trunc, _ = env.step(action)\n",
    "            if done or trunc:\n",
    "                break\n",
    "            state = next_state\n",
    "            num_steps += 1\n",
    "        # Success when the episode used at most three times the reference path length\n",
    "        if num_steps <= 3*actual_length:\n",
    "            successes += 1\n",
    "\n",
    "    # Fraction of successful episodes\n",
    "    return successes / test_num\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "id": "73589768",
   "metadata": {},
   "outputs": [],
   "source": [
    "def softmax(logits):\n",
    "    \"\"\"\n",
    "    :param logits: Array-like of real-valued scores of any shape.\n",
    "    :return: 1-D float array of probabilities; all elements are normalised together and the\n",
    "             result is flattened.\n",
    "    :functionality: Numerically stable softmax. The maximum is subtracted before exponentiating,\n",
    "                    which leaves the result mathematically unchanged but prevents overflow\n",
    "                    (inf / inf = nan) for large logits.\n",
    "    \"\"\"\n",
    "    logits = np.asarray(logits, dtype=float)\n",
    "    if logits.size == 0:\n",
    "        # Nothing to normalise; return the same empty result the plain formula gives.\n",
    "        return logits.reshape([-1])\n",
    "    exp_logits = np.exp(logits - np.max(logits))\n",
    "    sum_logits = np.sum(exp_logits)\n",
    "    return (exp_logits / sum_logits).reshape([-1])\n",
    "\n",
    "def pick_sample(s):\n",
    "    \"\"\"\n",
    "    :param s: A single (unbatched) observation accepted by ``np.expand_dims``.\n",
    "    :return: The sampled action index.\n",
    "    :functionality: Scores the observation with ``actor``, converts the scores to probabilities\n",
    "                    with ``softmax`` and samples one action. This definition replaces the\n",
    "                    earlier ``pick_sample`` that used ``actor_func``.\n",
    "    \"\"\"\n",
    "    with torch.no_grad():\n",
    "        # One-row frame so the actor sees the named columns it expects\n",
    "        frame = pd.DataFrame(np.expand_dims(s, axis=0), columns=column_names)\n",
    "        action_probs = torch.tensor(softmax(actor(frame)))\n",
    "        drawn = torch.multinomial(action_probs, num_samples=1)\n",
    "    return drawn.tolist()[0]\n",
    "\n",
    "\n",
    "def train():\n",
    "    \"\"\"\n",
    "    :return: List with one entry per completed iteration: the summed reward of that iteration's\n",
    "             last rollout.\n",
    "    :functionality: Runs up to 150 training iterations. Each iteration collects 10 rollouts with\n",
    "                    ``pick_sample``, evaluates ``actor`` with ``accuracy_test``, snapshots the\n",
    "                    rules into ``actor.best_model`` when the accuracy is at least as good as the\n",
    "                    best so far, fits ``critic`` to the discounted returns and then updates every\n",
    "                    model in ``actor.model`` from the advantages. Training stops early once the\n",
    "                    mean accuracy of the five most recent evaluations reaches 0.99. The global\n",
    "                    ``env`` is closed before returning.\n",
    "    \"\"\"\n",
    "    reward_records = []\n",
    "    accuracies = []\n",
    "    best_accuracy = 0\n",
    "    for i in range(150):\n",
    "        # states/actions accumulate over all rollouts of this iteration;\n",
    "        # rewards only ever holds the current rollout.\n",
    "        states = []\n",
    "        actions = []\n",
    "        rewards = []\n",
    "        cum_rwds = np.array([])\n",
    "        for _rollout in range(10):\n",
    "            s, _ = env.reset(seed=np.random.randint(0, 1e6))\n",
    "            print('init state', s)\n",
    "            num_steps = 0\n",
    "            done = False\n",
    "            rewards = []\n",
    "            while not done and num_steps <= 200:\n",
    "                states.append(s.tolist())\n",
    "                a = pick_sample(s)\n",
    "                s, r, term, trunc, _ = env.step(a)\n",
    "                done = term or trunc\n",
    "                actions.append(a)\n",
    "                rewards.append(r)\n",
    "                num_steps += 1\n",
    "            # Discounted returns for this rollout. The buffer is explicitly float:\n",
    "            # np.zeros_like(rewards) inherits an integer dtype from integer rewards and would\n",
    "            # truncate every discounted value on assignment.\n",
    "            reward_len = len(rewards)\n",
    "            cum_rewards = np.zeros(reward_len, dtype=np.float64)\n",
    "            for j in reversed(range(reward_len)):\n",
    "                cum_rewards[j] = rewards[j] + (cum_rewards[j + 1] * gamma if j + 1 < reward_len else 0)\n",
    "            cum_rwds = np.hstack([cum_rwds, cum_rewards])\n",
    "            print(cum_rwds.shape, cum_rewards.shape)\n",
    "\n",
    "        #\n",
    "        # Evaluate the current policy and keep a copy of the best rules seen so far\n",
    "        #\n",
    "        print('============', i, '===========')\n",
    "        avg_accuracy = accuracy_test(env, actor)\n",
    "        accuracies.append(avg_accuracy)\n",
    "        print(\"Run episode {} with rewards {}, accuracy {}\".format(i, sum(rewards), avg_accuracy))\n",
    "        if avg_accuracy >= best_accuracy:\n",
    "            best_accuracy = avg_accuracy\n",
    "            for rr in range(actor.action_space):\n",
    "                rules = []\n",
    "                for n in range(len(actor.model[rr].rules_)):\n",
    "                    rule = actor.model[rr].rules_[n]\n",
    "                    rules.append(Rule(q=rule.q, y=rule.y))\n",
    "                actor.best_model[rr].rules_ = AdditiveRuleEnsemble(rules)\n",
    "            print('best')\n",
    "        # Early stop on the mean of the LAST five evaluations. The previous slice [:-5] took\n",
    "        # everything except the last five, which is empty during the first five iterations\n",
    "        # (NumPy then warns about the mean of an empty slice and returns nan).\n",
    "        if len(accuracies) >= 5 and np.average(accuracies[-5:]) >= 0.99:\n",
    "            break\n",
    "\n",
    "        #\n",
    "        # Train (optimize parameters)\n",
    "        #\n",
    "        # Critic update: regress the value estimates onto the discounted returns\n",
    "        critic_optimizer.zero_grad()\n",
    "        states = torch.tensor(states, dtype=torch.float).to(device)\n",
    "        cum_rewards = torch.tensor(cum_rwds, dtype=torch.float).to(device)\n",
    "        values = critic(states)\n",
    "        values = values.squeeze(dim=1)\n",
    "        vf_loss = F.mse_loss(\n",
    "            values,\n",
    "            cum_rewards,\n",
    "            reduction=\"none\")\n",
    "        vf_loss.sum().backward()\n",
    "        critic_optimizer.step()\n",
    "\n",
    "        # Rule-based actor update: advantages use the value estimates re-evaluated after the\n",
    "        # critic step, without gradient tracking\n",
    "        with torch.no_grad():\n",
    "            values = critic(states).squeeze(dim=1)\n",
    "        actions = torch.tensor(actions, dtype=torch.int64).to(device)\n",
    "        advantages = cum_rewards - values\n",
    "        states_array = states.cpu().detach().numpy()\n",
    "        x = pd.DataFrame(states_array, columns=column_names)\n",
    "        y = pd.Series(actions.cpu().detach().numpy())\n",
    "        adv = pd.Series(advantages.cpu().detach().numpy())\n",
    "        outputs = actor(x).T\n",
    "        for j in range(len(actor.model)):\n",
    "            m = actor.model[j]\n",
    "            # Every output column except column j is passed on as other_values\n",
    "            masks = np.ones_like(outputs, dtype=bool)\n",
    "            masks[:, j] = False\n",
    "            other_values = outputs[masks].reshape(-1, outputs.shape[1] - 1)\n",
    "\n",
    "            if len(m.rules_) == 0:\n",
    "                m.fit(x, y, adv, other_values, j)\n",
    "            else:\n",
    "                update_rules(m, x, y, adv, other_values, j)\n",
    "            print('-----------------',j,'--------------')\n",
    "            print(m.rules_)\n",
    "\n",
    "        reward_records.append(sum(rewards))\n",
    "    print(\"\\nDone\")\n",
    "    env.close()\n",
    "    return reward_records"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "id": "b411aa5d",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "init state [1 0 0 2 0]\n",
      "(57,) (57,)\n",
      "init state [1 1 0 1 0]\n",
      "(96,) (39,)\n",
      "init state [ 3  1 -2 -1  0]\n",
      "(209,) (113,)\n",
      "init state [ 2  3  0 -3  0]\n",
      "(293,) (84,)\n",
      "init state [1 1 2 1 0]\n",
      "(414,) (121,)\n",
      "init state [ 2  1 -2  1  0]\n",
      "(451,) (37,)\n",
      "init state [ 1  2  1 -1  0]\n",
      "(470,) (19,)\n",
      "init state [1 2 1 0 0]\n",
      "(518,) (48,)\n",
      "init state [0 2 3 0 0]\n",
      "(561,) (43,)\n",
      "init state [1 0 2 2 0]\n",
      "(590,) (29,)\n",
      "============ 0 ===========\n",
      "Run episode 0 with rewards 13, accuracy 0.0\n",
      "best\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/lib/function_base.py:518: RuntimeWarning: Mean of empty slice.\n",
      "  avg = a.mean(axis, **keepdims_kw)\n",
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/core/_methods.py:190: RuntimeWarning: invalid value encountered in double_scalars\n",
      "  ret = ret.dtype.type(ret / rcount)\n",
      "/tmp/ipykernel_316/4131041232.py:32: RuntimeWarning: invalid value encountered in sqrt\n",
      "  return abs(g_q.sum()) / np.sqrt(h_q.sum())\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 0 --------------\n",
      "   -0.0594 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.4180 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   -0.6871 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -1.1914 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.1761 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4522 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2636 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.5335 if x2>=3.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.3600 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   +0.1634 if c>=1.0 & x1>=3.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1393 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=1.0 & x2>=2.0 & x3-x1<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3895 if c<=0.0 & x1>=3.0 & x2<=1.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.1235 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3585 if x1>=1.0 & x2>=2.0 & x3-x1>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.1534 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4514 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_316/4131041232.py:32: RuntimeWarning: invalid value encountered in sqrt\n",
      "  return abs(g_q.sum()) / np.sqrt(h_q.sum())\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   +0.7121 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.7627 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.6238 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.5264 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=2.0\n",
      "   -0.2094 if x1>=2.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5640 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.2398 if x2>=2.0 & x3-x1>=3.0 & x4-x2>=0.0\n",
      "   +0.3201 if c<=0.0 & x1<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2617 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.1963 if c>=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-3.0\n",
      "   -0.1005 if x3-x1<=-3.0 & x4-x2>=1.0\n",
      "   +0.3070 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.2718 if x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   +0.1184 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2227 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.2776 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_316/4131041232.py:32: RuntimeWarning: invalid value encountered in sqrt\n",
      "  return abs(g_q.sum()) / np.sqrt(h_q.sum())\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.0047 if x1>=2.0 & x4-x2<=0.0\n",
      "   -0.3533 if c>=1.0 & x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   -0.6849 if x2>=1.0 & x3-x1<=2.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.2570 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.4576 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2666 if c>=1.0 & x3-x1>=2.0 & x4-x2<=-3.0\n",
      "   +0.4270 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.1599 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2334 if x4-x2>=-1.0\n",
      "   -0.1705 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2724 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.2003 if x1>=1.0 & x1>=3.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.3182 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0\n",
      "   -0.2711 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   +0.0962 if c<=0.0 & x1>=2.0 & x3-x1>=1.0\n",
      "   +0.1531 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=2.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_316/4131041232.py:32: RuntimeWarning: invalid value encountered in sqrt\n",
      "  return abs(g_q.sum()) / np.sqrt(h_q.sum())\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.2087 if x3-x1<=-1.0\n",
      "   +0.8321 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.8431 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.3068 if c>=1.0 & x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.3143 if c>=1.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.3536 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.4938 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4948 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2429 if c>=1.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=-2.0\n",
      "   +0.1815 if x1<=0.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.4540 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.3653 if x2>=1.0 & x3-x1>=3.0\n",
      "   -0.4999 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2128 if c<=0.0 & x1>=3.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.1267 if c<=0.0 & x2<=2.0 & x3-x1>=2.0 & x4-x2<=-1.0\n",
      "   +0.2725 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "init state [1 2 1 0 0]\n",
      "(23,) (23,)\n",
      "init state [ 2  1 -1  1  0]\n",
      "(39,) (16,)\n",
      "init state [2 1 1 1 0]\n",
      "(42,) (3,)\n",
      "init state [ 3  1 -3  2  0]\n",
      "(103,) (61,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(245,) (142,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(446,) (201,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(523,) (77,)\n",
      "init state [0 1 2 1 0]\n",
      "(531,) (8,)\n",
      "init state [0 2 2 1 0]\n",
      "(540,) (9,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(576,) (36,)\n",
      "============ 1 ===========\n",
      "Run episode 1 with rewards 6, accuracy 0.1\n",
      "best\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/lib/function_base.py:518: RuntimeWarning: Mean of empty slice.\n",
      "  avg = a.mean(axis, **keepdims_kw)\n",
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/core/_methods.py:190: RuntimeWarning: invalid value encountered in double_scalars\n",
      "  ret = ret.dtype.type(ret / rcount)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 0 --------------\n",
      "   -0.6206 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   +0.5636 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.9065 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4468 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6339 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1061 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1966 if x2>=3.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +2.4328 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   -0.0000 if c>=1.0 & x1>=3.0 & x2<=1.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.2174 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=1.0 & x2>=2.0 & x3-x1<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0000 if c<=0.0 & x1>=3.0 & x2<=1.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.3500 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0000 if x1>=1.0 & x2>=2.0 & x3-x1>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.2544 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4589 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.3734 if x2<=1.0 & x3-x1>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.5412 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1893 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.1022 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.1120 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=2.0\n",
      "   -0.1674 if x1>=2.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3181 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0000 if x2>=2.0 & x3-x1>=3.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1550 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.0000 if c>=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-3.0\n",
      "   +0.0004 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.1057 if x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   -0.2280 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1375 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   -0.1049 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.3636 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.1594 if c>=1.0 & x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   -0.6994 if x2>=1.0 & x3-x1<=2.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.1913 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.4057 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0000 if c>=1.0 & x3-x1>=2.0 & x4-x2<=-3.0\n",
      "   +0.2618 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.4093 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2346 if x4-x2>=-1.0\n",
      "   +0.1162 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1097 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0000 if x1>=1.0 & x1>=3.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0961 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0\n",
      "   -0.0754 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.0983 if c<=0.0 & x1>=2.0 & x3-x1>=1.0\n",
      "   -0.1083 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=2.0\n",
      "   -0.3483 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.0757 if x3-x1<=-1.0\n",
      "   +0.8935 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.7420 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.2327 if c>=1.0 & x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.1495 if c>=1.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.4420 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0532 if c>=1.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=-2.0\n",
      "   +0.4152 if x1<=0.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.6988 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1>=3.0\n",
      "   -0.6124 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if c<=0.0 & x1>=3.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.4471 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   +0.7248 if c>=1.0 & x1>=2.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "init state [1 0 0 1 0]\n",
      "(27,) (27,)\n",
      "init state [ 1  2 -1  1  0]\n",
      "(38,) (11,)\n",
      "init state [0 0 1 3 0]\n",
      "(93,) (55,)\n",
      "init state [1 0 1 1 0]\n",
      "(121,) (28,)\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(139,) (18,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(255,) (116,)\n",
      "init state [ 3  2 -1 -1  0]\n",
      "(276,) (21,)\n",
      "init state [ 1  0 -1  1  0]\n",
      "(293,) (17,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(444,) (151,)\n",
      "init state [ 2  0 -2  1  0]\n",
      "(457,) (13,)\n",
      "============ 2 ===========\n",
      "Run episode 2 with rewards 29, accuracy 0.2\n",
      "best\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/lib/function_base.py:518: RuntimeWarning: Mean of empty slice.\n",
      "  avg = a.mean(axis, **keepdims_kw)\n",
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/core/_methods.py:190: RuntimeWarning: invalid value encountered in double_scalars\n",
      "  ret = ret.dtype.type(ret / rcount)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 0 --------------\n",
      "   -0.2634 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   -0.0478 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.8359 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.2770 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2576 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1582 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0000 if x2>=3.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.7211 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   -0.0000 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=1.0 & x2>=2.0 & x3-x1<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0000 if c<=0.0 & x1>=3.0 & x2<=1.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0715 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0000 if x1>=1.0 & x2>=2.0 & x3-x1>=1.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1167 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0388 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.4404 if x2<=1.0 & x3-x1>=2.0\n",
      "   +0.6255 if c<=0.0 & x1<=2.0 & x2>=1.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.8658 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.2771 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0994 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0023 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=2.0\n",
      "   -0.0000 if x1>=2.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0279 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0000 if x2>=2.0 & x3-x1>=3.0 & x4-x2>=0.0\n",
      "   -0.0000 if c<=0.0 & x1<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0934 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.0000 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.0104 if x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   +0.4547 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.4157 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   -0.2779 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.0388 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   -0.5545 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.0000 if c>=1.0 & x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   -0.6897 if x2>=1.0 & x3-x1<=2.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.2539 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.3761 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0000 if c>=1.0 & x3-x1>=2.0 & x4-x2<=-3.0\n",
      "   -0.2293 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.1148 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2647 if x4-x2>=-1.0\n",
      "   -0.1538 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3370 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0117 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0\n",
      "   -0.1311 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   +0.1813 if c<=0.0 & x1>=2.0 & x3-x1>=1.0\n",
      "   -0.0086 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=2.0\n",
      "   -0.0342 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5760 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   -0.0199 if x3-x1<=-1.0\n",
      "   +0.3665 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.0953 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.3121 if c>=1.0 & x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.0750 if c>=1.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.0764 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.3510 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0734 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0003 if c>=1.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=-2.0\n",
      "   +0.2277 if x1<=0.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.4210 if x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.1079 if x2>=1.0 & x3-x1>=3.0\n",
      "   -0.2248 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1025 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   +0.4203 if c>=1.0 & x1>=2.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.4896 if x3-x1<=-3.0 & x4-x2>=-1.0\n",
      "init state [0 0 1 0 0]\n",
      "(17,) (17,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(100,) (83,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(130,) (30,)\n",
      "init state [ 2  0 -2  1  0]\n",
      "(152,) (22,)\n",
      "init state [0 2 1 1 0]\n",
      "(162,) (10,)\n",
      "init state [ 2  0 -1  2  0]\n",
      "(192,) (30,)\n",
      "init state [0 2 1 1 0]\n",
      "(208,) (16,)\n",
      "init state [ 0  2  1 -1  0]\n",
      "(218,) (10,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(240,) (22,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(263,) (23,)\n",
      "============ 3 ===========\n",
      "Run episode 3 with rewards 19, accuracy 0.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/lib/function_base.py:518: RuntimeWarning: Mean of empty slice.\n",
      "  avg = a.mean(axis, **keepdims_kw)\n",
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/core/_methods.py:190: RuntimeWarning: invalid value encountered in double_scalars\n",
      "  ret = ret.dtype.type(ret / rcount)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 0 --------------\n",
      "   -0.3855 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   +0.3676 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.9883 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.1045 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0609 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0890 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.4189 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   -0.2442 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=1.0 & x2>=2.0 & x3-x1<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x1>=3.0 & x2<=1.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0161 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2709 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1265 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0865 if x2<=1.0 & x3-x1>=2.0\n",
      "   +0.8511 if c<=0.0 & x1<=2.0 & x2>=1.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.3674 if c<=0.0 & x1<=1.0 & x2<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.5889 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1652 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.1738 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0040 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=2.0\n",
      "   +0.0000 if x1>=2.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1917 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0761 if c<=0.0 & x1<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0552 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.4467 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.2596 if x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   +0.1716 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.2343 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.0000 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   +0.0243 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   -0.7843 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.0759 if c>=1.0 & x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   -0.7550 if x2>=1.0 & x3-x1<=2.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0265 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.1439 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0853 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.2451 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2958 if x4-x2>=-1.0\n",
      "   -0.3097 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0288 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.2123 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0\n",
      "   -0.0269 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x3-x1>=1.0\n",
      "   -0.0096 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=2.0\n",
      "   -0.0636 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5541 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.8805 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   -0.0505 if x3-x1<=-1.0\n",
      "   +0.2121 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.5435 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1789 if c>=1.0 & x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.3151 if c>=1.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   -0.0000 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.1093 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0000 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0630 if x1<=0.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.3271 if x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.0000 if x2>=1.0 & x3-x1>=3.0\n",
      "   +0.2291 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5399 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   -0.0818 if c>=1.0 & x1>=2.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.1953 if x3-x1<=-3.0 & x4-x2>=-1.0\n",
      "   +0.8748 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "init state [ 3  0 -2  3  0]\n",
      "(20,) (20,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(82,) (62,)\n",
      "init state [ 1  3  1 -3  0]\n",
      "(151,) (69,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(258,) (107,)\n",
      "init state [0 1 1 0 0]\n",
      "(268,) (10,)\n",
      "init state [ 2  2 -1 -1  0]\n",
      "(289,) (21,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(300,) (11,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(309,) (9,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(354,) (45,)\n",
      "init state [ 0  3  0 -2  0]\n",
      "(423,) (69,)\n",
      "============ 4 ===========\n",
      "Run episode 4 with rewards -27, accuracy 0.1\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/lib/function_base.py:518: RuntimeWarning: Mean of empty slice.\n",
      "  avg = a.mean(axis, **keepdims_kw)\n",
      "/home/fyan/.local/lib/python3.10/site-packages/numpy/core/_methods.py:190: RuntimeWarning: invalid value encountered in double_scalars\n",
      "  ret = ret.dtype.type(ret / rcount)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 0 --------------\n",
      "   -0.3205 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   +0.0451 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -1.0288 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0066 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4494 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0343 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.1647 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   -0.0990 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=1.0 & x2>=2.0 & x3-x1<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2006 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1086 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4913 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0224 if x2<=1.0 & x3-x1>=2.0\n",
      "   +0.3517 if c<=0.0 & x1<=2.0 & x2>=1.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.0072 if c<=0.0 & x1<=1.0 & x2<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.6813 if c<=0.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.6883 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.2417 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.1479 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=2.0\n",
      "   -0.1713 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2624 if c<=0.0 & x1<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1423 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.2772 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.4148 if x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   +0.3320 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0180 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   -0.3528 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.4217 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   -0.0055 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   -0.6697 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.9427 if x1>=1.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   -0.1639 if c>=1.0 & x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   -0.7439 if x2>=1.0 & x3-x1<=2.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0774 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.3688 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2289 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.5938 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2857 if x4-x2>=-1.0\n",
      "   -0.2889 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1089 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2246 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0\n",
      "   +0.0233 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   +0.0000 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=2.0\n",
      "   -0.3554 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.8759 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.0236 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.3559 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3251 if x3-x1<=-1.0\n",
      "   +0.3614 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.2554 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1629 if c>=1.0 & x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   -0.0000 if c>=1.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   -0.5216 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.0528 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1032 if x1<=0.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.1758 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.0134 if x2>=1.0 & x3-x1>=3.0\n",
      "   -0.3283 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0091 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   -0.2637 if c>=1.0 & x1>=2.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.1114 if x3-x1<=-3.0 & x4-x2>=-1.0\n",
      "   +0.3452 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.6863 if c<=0.0 & x3-x1<=-1.0\n",
      "init state [0 0 0 1 0]\n",
      "(69,) (69,)\n",
      "init state [0 0 1 1 0]\n",
      "(94,) (25,)\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(164,) (70,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(184,) (20,)\n",
      "init state [0 3 1 0 0]\n",
      "(199,) (15,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(223,) (24,)\n",
      "init state [ 2  1 -2  0  0]\n",
      "(257,) (34,)\n",
      "init state [2 0 0 1 0]\n",
      "(262,) (5,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(333,) (71,)\n",
      "init state [ 2  3 -1 -2  0]\n",
      "(363,) (30,)\n",
      "============ 5 ===========\n",
      "Run episode 5 with rewards 12, accuracy 0.4\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.2562 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   -0.2052 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -1.1763 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.1912 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.7251 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2485 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3231 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   +0.1343 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=1.0 & x2>=2.0 & x3-x1<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2679 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0503 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1014 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if x2<=1.0 & x3-x1>=2.0\n",
      "   -0.0754 if c<=0.0 & x1<=2.0 & x2>=1.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.5812 if c<=0.0 & x1<=1.0 & x2<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.1598 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.3397 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.5876 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.1016 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0655 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0757 if c<=0.0 & x1<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1704 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.1791 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1578 if x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   -0.0000 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0000 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.0132 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.0000 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   +0.1752 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   -0.2439 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.2014 if x1>=1.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.8743 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   -0.1309 if c>=1.0 & x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   -0.5275 if x2>=1.0 & x3-x1<=2.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0000 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.0912 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3122 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.1119 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4220 if x4-x2>=-1.0\n",
      "   -0.0909 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0905 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0725 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0\n",
      "   +0.0000 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.1222 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3656 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.1342 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.3471 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.8307 if c<=0.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.1839 if x3-x1<=-1.0\n",
      "   +0.0110 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.5901 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.0927 if c>=1.0 & x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   +0.0000 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0962 if x1<=0.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.2231 if x1>=3.0 & x3-x1<=-2.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1>=3.0\n",
      "   -0.2047 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0375 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   -0.0930 if c>=1.0 & x1>=2.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.2495 if x3-x1<=-3.0 & x4-x2>=-1.0\n",
      "   +0.5294 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.8813 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.4516 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "init state [ 1  0 -1  1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(33,) (33,)\n",
      "init state [ 3  2 -1  0  0]\n",
      "(48,) (15,)\n",
      "init state [ 3  0 -1  2  0]\n",
      "(74,) (26,)\n",
      "init state [ 1  0 -1  0  0]\n",
      "(82,) (8,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(93,) (11,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(119,) (26,)\n",
      "init state [1 0 0 2 0]\n",
      "(125,) (6,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(136,) (11,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(186,) (50,)\n",
      "init state [ 2  2  0 -2  0]\n",
      "(230,) (44,)\n",
      "============ 6 ===========\n",
      "Run episode 6 with rewards -2, accuracy 0.4\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.5326 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   -0.5846 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -1.0533 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.1734 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1675 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.5387 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2681 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   -0.1958 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=1.0 & x2>=2.0 & x3-x1<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1615 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3619 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.3389 if c<=0.0 & x1<=2.0 & x2>=1.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.1647 if c<=0.0 & x1<=1.0 & x2<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x2>=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.1682 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.6397 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.4203 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0473 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.2268 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0090 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1392 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.0127 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.2914 if x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   +0.4134 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1638 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.0000 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   +0.0012 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   -0.0437 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=1.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -1.0279 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.7667 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.0517 if c>=1.0 & x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   -0.2276 if x2>=1.0 & x3-x1<=2.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2231 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.2021 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2140 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.3596 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2637 if x4-x2>=-1.0\n",
      "   -0.2853 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2255 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0832 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0\n",
      "   -0.2078 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5425 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.1659 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.2161 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.7323 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.4851 if c<=0.0 & x2<=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.3977 if x3-x1<=-1.0\n",
      "   -0.0576 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.3728 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.2075 if c>=1.0 & x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0 & x3-x1>=0.0\n",
      "   -0.1828 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2108 if x1<=0.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.6170 if x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.4960 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1657 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   +0.1700 if c>=1.0 & x1>=2.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.3613 if x3-x1<=-3.0 & x4-x2>=-1.0\n",
      "   +0.5255 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.6051 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.3932 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +1.1608 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "init state [ 2  3 -2  0  0]\n",
      "(28,) (28,)\n",
      "init state [ 3  1 -2  0  0]\n",
      "(50,) (22,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(64,) (14,)\n",
      "init state [2 2 1 0 0]\n",
      "(71,) (7,)\n",
      "init state [ 2  2 -2  1  0]\n",
      "(87,) (16,)\n",
      "init state [ 2  1  0 -1  0]\n",
      "(97,) (10,)\n",
      "init state [0 0 1 0 0]\n",
      "(115,) (18,)\n",
      "init state [ 3  2 -3  0  0]\n",
      "(137,) (22,)\n",
      "init state [1 3 1 0 0]\n",
      "(150,) (13,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(293,) (143,)\n",
      "============ 7 ===========\n",
      "Run episode 7 with rewards -101, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.4265 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   -0.5839 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.7127 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.2089 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0261 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0838 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6679 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   -0.3332 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=1.0 & x2>=2.0 & x3-x1<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0039 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0592 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2540 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.4211 if c<=0.0 & x1<=2.0 & x2>=1.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x2<=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3444 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.3649 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1298 if c>=1.0 & x3-x1>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.3298 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.5584 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.3329 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0851 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2030 if c<=0.0 & x1<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0489 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.3930 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.1701 if x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   +0.5919 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3334 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.1432 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   -0.5596 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=1.0 & x2>=3.0 & x3-x1>=0.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.5923 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1160 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   -0.4962 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.6828 if x2>=1.0 & x3-x1<=2.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5265 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.2341 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2435 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.3232 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1088 if x4-x2>=-1.0\n",
      "   +0.2682 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1158 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0526 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0\n",
      "   +0.1064 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1521 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.2187 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1506 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.2905 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.2169 if c<=0.0 & x2<=2.0\n",
      "   -0.6747 if x4-x2<=-3.0\n",
      "----------------- 3 --------------\n",
      "   +0.2403 if x3-x1<=-1.0\n",
      "   -0.0301 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.4637 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.3552 if c>=1.0 & x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.0055 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.5532 if x1<=0.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0574 if x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.4919 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.7123 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   +0.1469 if c>=1.0 & x1>=2.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0781 if x3-x1<=-3.0 & x4-x2>=-1.0\n",
      "   +0.2761 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.3627 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.5219 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +0.5760 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.9996 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "init state [1 2 1 1 0]\n",
      "(4,) (4,)\n",
      "init state [1 1 1 2 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(15,) (11,)\n",
      "init state [1 3 1 0 0]\n",
      "(20,) (5,)\n",
      "init state [2 1 0 2 0]\n",
      "(25,) (5,)\n",
      "init state [ 0  3  2 -3  0]\n",
      "(92,) (67,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(198,) (106,)\n",
      "init state [0 1 1 1 0]\n",
      "(203,) (5,)\n",
      "init state [ 1  3  1 -2  0]\n",
      "(228,) (25,)\n",
      "init state [0 1 2 0 0]\n",
      "(286,) (58,)\n",
      "init state [2 0 0 1 0]\n",
      "(293,) (7,)\n",
      "============ 8 ===========\n",
      "Run episode 8 with rewards 35, accuracy 0.7\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.0857 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   -0.4727 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.7342 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0712 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0109 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   -0.1485 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=1.0 & x2>=2.0 & x3-x1<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1039 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2279 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2>=1.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   -0.3839 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.2816 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0399 if c>=1.0 & x3-x1>=2.0\n",
      "   +0.6997 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.8263 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4904 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.1409 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.1320 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2923 if c<=0.0 & x1<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1072 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.5843 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   +0.3012 if x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   +0.2917 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3222 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.0405 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1>=0.0\n",
      "   -0.3740 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.3282 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4874 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.2037 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.4875 if x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.9472 if x2>=1.0 & x3-x1<=2.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.1876 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.5611 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0430 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.2957 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.6405 if x4-x2>=-1.0\n",
      "   -0.0000 if x1>=3.0 & x2>=1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0814 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1995 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1259 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.0629 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.2009 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.1949 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.0939 if c<=0.0 & x2<=2.0\n",
      "   -0.0149 if x4-x2<=-3.0\n",
      "   +0.2350 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.1470 if x3-x1<=-1.0\n",
      "   +0.2385 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.5628 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.2377 if c>=1.0 & x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   +0.0000 if x1<=0.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.2118 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3873 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   -0.3103 if c>=1.0 & x1>=2.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.0000 if x3-x1<=-3.0 & x4-x2>=-1.0\n",
      "   +0.7688 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.4274 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.1908 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +0.2820 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0850 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.3329 if c>=1.0 & x1<=2.0 & x3-x1<=1.0 & x4-x2<=-2.0\n",
      "init state [ 2  0 -1  0  0]\n",
      "(18,) (18,)\n",
      "init state [ 0  2  2 -2  0]\n",
      "(49,) (31,)\n",
      "init state [0 2 1 0 0]\n",
      "(54,) (5,)\n",
      "init state [ 2  1 -1  1  0]\n",
      "(66,) (12,)\n",
      "init state [ 3  2  0 -2  0]\n",
      "(105,) (39,)\n",
      "init state [ 2  2 -2  0  0]\n",
      "(114,) (9,)\n",
      "init state [1 1 1 1 0]\n",
      "(118,) (4,)\n",
      "init state [ 1  2 -1 -1  0]\n",
      "(143,) (25,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(150,) (7,)\n",
      "init state [ 1  2 -1 -1  0]\n",
      "(169,) (19,)\n",
      "============ 9 ===========\n",
      "Run episode 9 with rewards 23, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.3794 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   -0.4663 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.4480 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0937 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6758 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1708 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1039 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   -0.1418 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=1.0 & x2>=2.0 & x3-x1<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3367 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2730 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0634 if c<=0.0 & x1<=2.0 & x2>=1.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.2392 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.0745 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0745 if c>=1.0 & x3-x1>=2.0\n",
      "   +0.8633 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5393 if x3-x1<=1.0 & x3-x1>=-2.0 & x4-x2>=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.5893 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3739 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.2274 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.4552 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5503 if c<=0.0 & x1<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0996 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2>=3.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2>=-1.0\n",
      "   -0.0009 if x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   +0.4708 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2966 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.1442 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.6773 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1115 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   -0.0585 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1192 if x4-x2>=2.0\n",
      "   +0.6109 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.6008 if x2>=1.0 & x3-x1<=2.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.1499 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.1635 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0728 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.5271 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.7632 if x4-x2>=-1.0\n",
      "   -0.0630 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2384 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3651 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.0245 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0225 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.6273 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.4166 if c<=0.0 & x2<=2.0\n",
      "   -0.0187 if x4-x2<=-3.0\n",
      "   +0.4422 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.5477 if c<=0.0 & x1<=2.0 & x2<=1.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.2042 if x3-x1<=-1.0\n",
      "   +0.4086 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.2655 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.0123 if c>=1.0 & x1>=2.0 & x2>=3.0 & x4-x2<=-2.0\n",
      "   -0.0402 if x1<=0.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.4879 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3771 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   +0.0582 if c>=1.0 & x1>=2.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0867 if x3-x1<=-3.0 & x4-x2>=-1.0\n",
      "   +0.2054 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.3289 if c<=0.0 & x3-x1<=-1.0\n",
      "   -0.0499 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   -0.2749 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1391 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0742 if c>=1.0 & x1<=2.0 & x3-x1<=1.0 & x4-x2<=-2.0\n",
      "   +0.3765 if x2<=1.0 & x3-x1<=-2.0 & x4-x2>=1.0\n",
      "init state [1 2 1 1 0]\n",
      "(3,) (3,)\n",
      "init state [ 0  3  0 -3  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(42,) (39,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(69,) (27,)\n",
      "init state [ 3  1 -1  0  0]\n",
      "(76,) (7,)\n",
      "init state [ 2  0 -2  0  0]\n",
      "(86,) (10,)\n",
      "init state [ 2  3 -2 -1  0]\n",
      "(104,) (18,)\n",
      "init state [ 2  2 -1 -2  0]\n",
      "(141,) (37,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(158,) (17,)\n",
      "init state [1 0 1 1 0]\n",
      "(174,) (16,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(187,) (13,)\n",
      "============ 10 ===========\n",
      "Run episode 10 with rewards 29, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.1286 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   -0.1097 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.6945 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.1688 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6848 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1883 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1246 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=1.0 & x2>=2.0 & x3-x1<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1348 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.2617 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1321 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c>=1.0 & x3-x1>=2.0\n",
      "   +1.1246 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4186 if x3-x1<=1.0 & x3-x1>=-2.0 & x4-x2>=-2.0\n",
      "   +0.3063 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.3763 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1813 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.0565 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.1979 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0817 if c<=0.0 & x1<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1155 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.0629 if x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   +0.0000 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.3447 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.3354 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.6231 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2577 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.4816 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0000 if x4-x2>=2.0\n",
      "   +0.4024 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.5185 if x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.5733 if x2>=1.0 & x3-x1<=2.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0310 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.5980 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0469 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.2792 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.5408 if x4-x2>=-1.0\n",
      "   -0.2858 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.1198 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.6647 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.3477 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1207 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.2633 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.1967 if c<=0.0 & x2<=2.0\n",
      "   +0.3219 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.0039 if c<=0.0 & x1<=2.0 & x2<=1.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.7986 if x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4721 if x3-x1<=-1.0\n",
      "   -0.1974 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.2772 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.0315 if x1<=0.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.2872 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1794 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   +0.0983 if c>=1.0 & x1>=2.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.2977 if x3-x1<=-3.0 & x4-x2>=-1.0\n",
      "   +0.4844 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.4658 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.2516 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +0.7687 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1857 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.3251 if c>=1.0 & x1<=2.0 & x3-x1<=1.0 & x4-x2<=-2.0\n",
      "   -0.0941 if x2<=1.0 & x3-x1<=-2.0 & x4-x2>=1.0\n",
      "   -0.3217 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "init state [ 2  0 -2  2  0]\n",
      "(29,) (29,)\n",
      "init state [ 2  3  0 -1  0]\n",
      "(40,) (11,)\n",
      "init state [2 1 0 1 0]\n",
      "(44,) (4,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(68,) (24,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(74,) (6,)\n",
      "init state [0 1 2 0 0]\n",
      "(91,) (17,)\n",
      "init state [ 1  2 -1  1  0]\n",
      "(105,) (14,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(123,) (18,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(154,) (31,)\n",
      "init state [ 3  2 -3  1  0]\n",
      "(194,) (40,)\n",
      "============ 11 ===========\n",
      "Run episode 11 with rewards 2, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.2911 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   -0.0514 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.7506 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1215 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0967 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2960 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=1.0 & x2>=2.0 & x3-x1<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1150 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0223 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.1785 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.0364 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.8972 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3923 if x3-x1<=1.0 & x3-x1>=-2.0 & x4-x2>=-2.0\n",
      "   -0.0904 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   +0.5237 if x1>=3.0 & x2<=0.0 & x4-x2<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.6223 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1727 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.3198 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.4683 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0805 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.0000 if x3-x1<=0.0 & x4-x2<=-3.0\n",
      "   -0.2616 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.1527 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.2857 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.3172 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0565 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.1573 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.2577 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.0000 if x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   -0.4157 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.0053 if x2>=1.0 & x3-x1<=2.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.2557 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -0.0606 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1468 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.1169 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0818 if x4-x2>=-1.0\n",
      "   -0.3068 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1768 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3616 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.6122 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0920 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.3538 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.2568 if c<=0.0 & x2<=2.0\n",
      "   +0.5331 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.1163 if x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.8297 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3505 if x3-x1<=-1.0\n",
      "   +0.0439 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.3400 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.0953 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3698 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if c>=1.0 & x1>=2.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.2583 if x3-x1<=-3.0 & x4-x2>=-1.0\n",
      "   +0.3119 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.2967 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.3316 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +0.5766 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3334 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0078 if c>=1.0 & x1<=2.0 & x3-x1<=1.0 & x4-x2<=-2.0\n",
      "   -0.0020 if x2<=1.0 & x3-x1<=-2.0 & x4-x2>=1.0\n",
      "   +0.1338 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.4097 if x1>=1.0 & x3-x1>=0.0\n",
      "init state [0 1 0 1 0]\n",
      "(5,) (5,)\n",
      "init state [3 0 0 1 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(23,) (18,)\n",
      "init state [ 1  1 -1  1  0]\n",
      "(38,) (15,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(60,) (22,)\n",
      "init state [ 3  1 -3 -1  0]\n",
      "(100,) (40,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(128,) (28,)\n",
      "init state [ 3  0 -2  1  0]\n",
      "(185,) (57,)\n",
      "init state [0 0 1 1 0]\n",
      "(194,) (9,)\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(231,) (37,)\n",
      "init state [0 2 1 0 0]\n",
      "(237,) (6,)\n",
      "============ 12 ===========\n",
      "Run episode 12 with rewards 36, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.5190 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   +0.0547 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.8604 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0358 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0920 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2287 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.5359 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   -0.2269 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1198 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.1921 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.2154 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.9109 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3799 if x3-x1<=1.0 & x3-x1>=-2.0 & x4-x2>=-2.0\n",
      "   -0.0871 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   +0.0661 if x1>=3.0 & x2<=0.0 & x4-x2<=1.0\n",
      "   -0.4044 if c<=0.0 & x1>=3.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.8544 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3180 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.2154 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0955 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0794 if c<=0.0 & x1<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0144 if x1<=1.0 & x1>=1.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.1483 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0519 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.0690 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.5021 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2357 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.2357 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.3813 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.0282 if x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   -0.0166 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.4217 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.2317 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.0113 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.4621 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.4075 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.7287 if x4-x2>=-1.0\n",
      "   -0.1389 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.3556 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2716 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.1986 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1910 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.5623 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.2237 if c<=0.0 & x2<=2.0\n",
      "   +0.8782 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.1560 if x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.0162 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.3646 if x2<=0.0 & x3-x1>=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.2109 if x3-x1<=-1.0\n",
      "   +0.3973 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.2243 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.3323 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5977 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   +0.2729 if x3-x1<=-3.0 & x4-x2>=-1.0\n",
      "   +0.5362 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.4734 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.3815 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   -0.0225 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3445 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.2304 if c>=1.0 & x1<=2.0 & x3-x1<=1.0 & x4-x2<=-2.0\n",
      "   -0.1114 if x2<=1.0 & x3-x1<=-2.0 & x4-x2>=1.0\n",
      "   -0.1625 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1205 if x1>=1.0 & x3-x1>=0.0\n",
      "   +0.4099 if x1<=1.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "init state [ 0  2  3 -1  0]\n",
      "(12,) (12,)\n",
      "init state [ 1  3 -1 -3  0]\n",
      "(42,) (30,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(46,) (4,)\n",
      "init state [1 2 0 1 0]\n",
      "(73,) (27,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(82,) (9,)\n",
      "init state [2 0 0 3 0]\n",
      "(124,) (42,)\n",
      "init state [0 0 2 2 0]\n",
      "(142,) (18,)\n",
      "init state [ 2  3 -2  0  0]\n",
      "(155,) (13,)\n",
      "init state [1 1 2 0 0]\n",
      "(207,) (52,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(237,) (30,)\n",
      "============ 13 ===========\n",
      "Run episode 13 with rewards 12, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.5650 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   -0.1486 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3704 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.1920 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1983 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0182 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   -0.0250 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2260 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.2040 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.0820 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.9137 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0101 if x3-x1<=1.0 & x3-x1>=-2.0 & x4-x2>=-2.0\n",
      "   -0.0375 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   +0.5732 if x1>=3.0 & x2<=0.0 & x4-x2<=1.0\n",
      "   +0.0323 if c<=0.0 & x1>=3.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.8286 if x2<=2.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.4882 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.7053 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.1344 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.1576 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x1<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0987 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1299 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.0191 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.3854 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4128 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.3966 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0903 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.0297 if x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   +0.1441 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.3848 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1>=0.0\n",
      "   -0.5758 if x1>=3.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.0290 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.0067 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   +0.4591 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3562 if x4-x2>=-1.0\n",
      "   -0.5150 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.3454 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4651 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.1423 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.4513 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0082 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.2733 if c<=0.0 & x2<=2.0\n",
      "   +0.3270 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.0302 if x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1324 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.2078 if x2<=0.0 & x3-x1>=2.0\n",
      "   -0.6684 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.1702 if x3-x1<=-1.0\n",
      "   +0.1121 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.0592 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.3174 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0097 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   -0.1770 if x3-x1<=-3.0 & x4-x2>=-1.0\n",
      "   +0.6985 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.2910 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.1961 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   -0.0295 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0000 if c>=1.0 & x1<=2.0 & x3-x1<=1.0 & x4-x2<=-2.0\n",
      "   +0.2475 if x2<=1.0 & x3-x1<=-2.0 & x4-x2>=1.0\n",
      "   +0.3626 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1856 if x1>=1.0 & x3-x1>=0.0\n",
      "   -0.0752 if x1<=1.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.6578 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "init state [ 3  0 -3  2  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(63,) (63,)\n",
      "init state [2 0 1 0 0]\n",
      "(75,) (12,)\n",
      "init state [ 0  1  3 -1  0]\n",
      "(153,) (78,)\n",
      "init state [2 1 1 0 0]\n",
      "(164,) (11,)\n",
      "init state [0 3 1 0 0]\n",
      "(170,) (6,)\n",
      "init state [1 0 2 0 0]\n",
      "(199,) (29,)\n",
      "init state [0 0 1 1 0]\n",
      "(208,) (9,)\n",
      "init state [0 0 2 3 0]\n",
      "(222,) (14,)\n",
      "init state [ 2  3 -1 -1  0]\n",
      "(273,) (51,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(320,) (47,)\n",
      "============ 14 ===========\n",
      "Run episode 14 with rewards -5, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.3471 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   -0.0292 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.6888 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.1196 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1976 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2207 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   -0.0000 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2160 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.1759 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1402 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6846 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1174 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   +0.0184 if x1>=3.0 & x2<=0.0 & x4-x2<=1.0\n",
      "   +0.0483 if c<=0.0 & x1>=3.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3287 if x2<=2.0 & x4-x2>=0.0\n",
      "   -0.6683 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.1854 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4725 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.3236 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0590 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.4498 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.3365 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.3934 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.9210 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4589 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.3442 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0142 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.0064 if x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   +0.2804 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0234 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1>=0.0\n",
      "   -0.0597 if x1>=3.0 & x4-x2>=2.0\n",
      "   -0.3758 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.0470 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -0.2524 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4342 if x4-x2>=-1.0\n",
      "   +0.2168 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0972 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3956 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.3347 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.3092 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.4065 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.2182 if c<=0.0 & x2<=2.0\n",
      "   -0.0070 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.2363 if x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1131 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0936 if x2<=0.0 & x3-x1>=2.0\n",
      "   -0.0515 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.5238 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.0801 if x3-x1<=-1.0\n",
      "   +0.1967 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.4162 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.1350 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3944 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   -0.0661 if x3-x1<=-3.0 & x4-x2>=-1.0\n",
      "   +0.3620 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.3794 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.3063 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   -0.1039 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1281 if x2<=1.0 & x3-x1<=-2.0 & x4-x2>=1.0\n",
      "   +0.3018 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1759 if x1>=1.0 & x3-x1>=0.0\n",
      "   +0.5371 if x1<=1.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.8399 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.9045 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "init state [ 3  2  0 -1  0]\n",
      "(59,) (59,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(75,) (16,)\n",
      "init state [1 1 2 0 0]\n",
      "(81,) (6,)\n",
      "init state [ 0  1  3 -1  0]\n",
      "(135,) (54,)\n",
      "init state [ 1  2  0 -2  0]\n",
      "(148,) (13,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(191,) (43,)\n",
      "init state [0 0 0 1 0]\n",
      "(201,) (10,)\n",
      "init state [ 2  3 -1 -2  0]\n",
      "(230,) (29,)\n",
      "init state [ 2  1 -2  2  0]\n",
      "(248,) (18,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(262,) (14,)\n",
      "============ 15 ===========\n",
      "Run episode 15 with rewards 28, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.3861 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   -0.1266 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.7911 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0194 if c<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2251 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3538 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   +0.2044 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.5644 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1904 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.8290 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0733 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.1248 if x1>=3.0 & x2<=0.0 & x4-x2<=1.0\n",
      "   +0.2236 if c<=0.0 & x1>=3.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.6591 if x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3351 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.3651 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.3291 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4982 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.2131 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0009 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2198 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.3369 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.3026 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -1.0000 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2532 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.3061 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1219 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.0242 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.2346 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1>=0.0\n",
      "   -0.0000 if x1>=3.0 & x4-x2>=2.0\n",
      "   -0.0000 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.7886 if x1>=2.0 & x2<=1.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.0524 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.1099 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.5510 if x4-x2>=-1.0\n",
      "   +0.1415 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2411 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3375 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.2198 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1506 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.5578 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.0391 if c<=0.0 & x2<=2.0\n",
      "   -0.1821 if x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1823 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0142 if x2<=0.0 & x3-x1>=2.0\n",
      "   -0.0337 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.2598 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.4356 if x4-x2>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.2147 if x3-x1<=-1.0\n",
      "   -0.0879 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.1924 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.0016 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2882 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   +0.3364 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.5791 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.2493 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   -0.1333 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0810 if x2<=1.0 & x3-x1<=-2.0 & x4-x2>=1.0\n",
      "   +0.5444 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1375 if x1>=1.0 & x3-x1>=0.0\n",
      "   +0.1163 if x1<=1.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.7807 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0000 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.4495 if x2>=1.0 & x3-x1>=-1.0 & x4-x2>=2.0\n",
      "init state [ 1  2 -1  1  0]\n",
      "(14,) (14,)\n",
      "init state [ 1  3  2 -1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(40,) (26,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(81,) (41,)\n",
      "init state [ 3  1 -1  0  0]\n",
      "(88,) (7,)\n",
      "init state [0 1 2 0 0]\n",
      "(97,) (9,)\n",
      "init state [ 3  0 -2  2  0]\n",
      "(122,) (25,)\n",
      "init state [0 1 3 1 0]\n",
      "(138,) (16,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(178,) (40,)\n",
      "init state [3 1 0 1 0]\n",
      "(183,) (5,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(187,) (4,)\n",
      "============ 16 ===========\n",
      "Run episode 16 with rewards 38, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.2758 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   -0.4283 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.7723 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0454 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1375 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   +0.4952 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.5364 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.3006 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +1.0768 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0444 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.0788 if x1>=3.0 & x2<=0.0 & x4-x2<=1.0\n",
      "   -0.2740 if c<=0.0 & x1>=3.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2551 if x2<=2.0 & x4-x2>=0.0\n",
      "   +0.0499 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0000 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=-2.0\n",
      "   -0.3674 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.2402 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0828 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0898 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.3793 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0331 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.1855 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.3101 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.7566 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5183 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.5047 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.3296 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.2656 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.1129 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1>=0.0\n",
      "   -0.0257 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "   -0.0100 if x1>=2.0 & x2<=1.0 & x3-x1>=0.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.5023 if x2>=3.0\n",
      "----------------- 2 --------------\n",
      "   +0.2426 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.0749 if c<=0.0 & x1<=2.0 & x1>=1.0 & x1>=2.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.5062 if x4-x2>=-1.0\n",
      "   -0.2909 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.3192 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3842 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.3472 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1435 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.3568 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0933 if c<=0.0 & x2<=2.0\n",
      "   -0.2126 if x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.2386 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0992 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.3215 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1138 if x4-x2>=3.0\n",
      "   +0.6974 if x1<=0.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.1275 if x3-x1<=-1.0\n",
      "   +0.1349 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.0678 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.2874 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4242 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   +0.7829 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.6433 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.4453 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +0.0743 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.3587 if x2<=1.0 & x3-x1<=-2.0 & x4-x2>=1.0\n",
      "   +0.6212 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.0006 if x1>=1.0 & x3-x1>=0.0\n",
      "   -0.1005 if x1<=1.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.7720 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1546 if x2>=1.0 & x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.4170 if x4-x2>=3.0\n",
      "init state [ 3  2  0 -2  0]\n",
      "(85,) (85,)\n",
      "init state [0 1 3 0 0]\n",
      "(117,) (32,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(132,) (15,)\n",
      "init state [1 0 0 3 0]\n",
      "(140,) (8,)\n",
      "init state [2 0 0 3 0]\n",
      "(156,) (16,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(282,) (126,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(308,) (26,)\n",
      "init state [0 0 1 2 0]\n",
      "(320,) (12,)\n",
      "init state [0 2 0 1 0]\n",
      "(331,) (11,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(380,) (49,)\n",
      "============ 17 ===========\n",
      "Run episode 17 with rewards -7, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.3724 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   +0.6350 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.9298 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.2646 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x3-x1<=-2.0\n",
      "   -0.1036 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.3720 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.0369 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1119 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0988 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.1341 if x1>=3.0 & x2<=0.0 & x4-x2<=1.0\n",
      "   -0.3698 if c<=0.0 & x1>=3.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.4431 if x2<=2.0 & x4-x2>=0.0\n",
      "   +0.1179 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.3449 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.5569 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   -0.2088 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.2688 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0966 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.2695 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2195 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.5575 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.3138 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.4096 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2862 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.5009 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1118 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.0555 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.3669 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1>=0.0\n",
      "   +0.2352 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.2810 if x2>=3.0\n",
      "   -0.4751 if x4-x2<=-3.0\n",
      "----------------- 2 --------------\n",
      "   +0.0975 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -0.1909 if x4-x2>=-1.0\n",
      "   -0.3242 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.3565 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.1063 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.3458 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.6162 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.2776 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.4945 if c<=0.0 & x2<=2.0\n",
      "   -0.0538 if x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.6495 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.2865 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.3683 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1973 if x4-x2>=3.0\n",
      "   -0.0637 if x1<=0.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.5456 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.2977 if x3-x1<=-1.0\n",
      "   +0.0402 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.3634 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1888 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0064 if x1<=0.0 & x3-x1<=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   +0.6663 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.1496 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.4145 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   -0.3138 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0801 if x2<=1.0 & x3-x1<=-2.0 & x4-x2>=1.0\n",
      "   +0.1812 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.6603 if x1<=1.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.4211 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1819 if x2>=1.0 & x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.2061 if x4-x2>=3.0\n",
      "   +0.9300 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "init state [ 1  2  2 -1  0]\n",
      "(9,) (9,)\n",
      "init state [0 0 3 0 0]\n",
      "(22,) (13,)\n",
      "init state [ 2  3  0 -1  0]\n",
      "(42,) (20,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(53,) (11,)\n",
      "init state [ 0  3  0 -1  0]\n",
      "(66,) (13,)\n",
      "init state [0 0 1 2 0]\n",
      "(81,) (15,)\n",
      "init state [1 1 2 0 0]\n",
      "(87,) (6,)\n",
      "init state [ 1  3  0 -2  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(105,) (18,)\n",
      "init state [ 2  2 -1 -1  0]\n",
      "(137,) (32,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(180,) (43,)\n",
      "============ 18 ===========\n",
      "Run episode 18 with rewards -1, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.6374 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   +0.2872 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.6651 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0954 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4377 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.3782 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.0312 if x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3668 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3330 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.1065 if x1>=3.0 & x2<=0.0 & x4-x2<=1.0\n",
      "   +0.1109 if c<=0.0 & x1>=3.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1694 if x2<=2.0 & x4-x2>=0.0\n",
      "   +0.3750 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.3773 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.4909 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3929 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.4251 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.5641 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0460 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.1102 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0168 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.3216 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.2082 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.6394 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.6998 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.4759 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0911 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.2644 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1>=0.0\n",
      "   -0.0000 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.0923 if x2>=3.0\n",
      "   -0.0135 if x4-x2<=-3.0\n",
      "   +0.6266 if x1>=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.1173 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -1.0182 if x4-x2>=-1.0\n",
      "   +0.2853 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1158 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4424 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.3213 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1443 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.8968 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.2059 if c<=0.0 & x2<=2.0\n",
      "   +0.0401 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   +0.1427 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +0.0000 if x1<=0.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3654 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -1.0906 if c<=0.0 & x1<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.3557 if x3-x1<=-1.0\n",
      "   +0.2264 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.0000 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.6578 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5869 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.2724 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.2832 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +0.0208 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0276 if x2<=1.0 & x3-x1<=-2.0 & x4-x2>=1.0\n",
      "   +0.1147 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1484 if x1<=1.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0183 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0000 if x2>=1.0 & x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   -0.0000 if x4-x2>=3.0\n",
      "   +0.3710 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.5133 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "init state [2 0 1 2 0]\n",
      "(7,) (7,)\n",
      "init state [ 3  0 -2  0  0]\n",
      "(49,) (42,)\n",
      "init state [ 1  0 -1  0  0]\n",
      "(88,) (39,)\n",
      "init state [1 0 0 1 0]\n",
      "(100,) (12,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(128,) (28,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(138,) (10,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(162,) (24,)\n",
      "init state [ 0  3  3 -2  0]\n",
      "(196,) (34,)\n",
      "init state [ 2  2 -2 -1  0]\n",
      "(213,) (17,)\n",
      "init state [ 1  0 -1  1  0]\n",
      "(228,) (15,)\n",
      "============ 19 ===========\n",
      "Run episode 19 with rewards 27, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.6315 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   -0.1648 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.8919 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4697 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1123 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.5206 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.6283 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2715 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   +0.0798 if x1>=3.0 & x2<=0.0 & x4-x2<=1.0\n",
      "   +0.0000 if c<=0.0 & x1>=3.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1268 if x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3431 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.2144 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.4108 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0758 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.5303 if x1>=1.0 & x2<=0.0 & x3-x1>=-1.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.6259 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3594 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.1194 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0221 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0220 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0597 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.1921 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.7739 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0550 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.4510 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1>=0.0\n",
      "   +0.1089 if x2>=3.0\n",
      "   -0.2178 if x4-x2<=-3.0\n",
      "   +0.4696 if x1>=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.2884 if x1>=1.0 & x2<=2.0 & x3-x1>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.0000 if x1>=2.0 & x2>=3.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -0.3758 if x4-x2>=-1.0\n",
      "   +0.0884 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1396 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.6291 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.2155 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.2895 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.4943 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.4115 if c<=0.0 & x2<=2.0\n",
      "   -0.3813 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.2453 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.0803 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3613 if x4-x2>=3.0\n",
      "   +0.0312 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4248 if c<=0.0 & x1<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4406 if x1<=0.0 & x4-x2>=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.3404 if x3-x1<=-1.0\n",
      "   +0.4205 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.3247 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1973 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2088 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.7684 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.1755 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0617 if x2<=1.0 & x3-x1<=-2.0 & x4-x2>=1.0\n",
      "   -0.0816 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.2654 if x1<=1.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.2235 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2436 if x4-x2>=3.0\n",
      "   +0.7586 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.4388 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5168 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "init state [ 1  0 -1  1  0]\n",
      "(10,) (10,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(37,) (27,)\n",
      "init state [0 2 3 0 0]\n",
      "(62,) (25,)\n",
      "init state [2 1 0 1 0]\n",
      "(71,) (9,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(103,) (32,)\n",
      "init state [1 0 0 3 0]\n",
      "(140,) (37,)\n",
      "init state [ 2  2 -2  0  0]\n",
      "(150,) (10,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(200,) (50,)\n",
      "init state [0 0 3 2 0]\n",
      "(217,) (17,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(235,) (18,)\n",
      "============ 20 ===========\n",
      "Run episode 20 with rewards 24, accuracy 0.2\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 0 --------------\n",
      "   -0.3079 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   -0.0524 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.7596 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0787 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3447 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.3777 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.8081 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1432 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.0076 if x1>=3.0 & x2<=0.0 & x4-x2<=1.0\n",
      "   -0.2366 if x2<=2.0 & x4-x2>=0.0\n",
      "   -0.2919 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1173 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.7201 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2151 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1070 if x1>=1.0 & x2<=0.0 & x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.5606 if x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.8183 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.2167 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0138 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1198 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.2677 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0895 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.5624 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.4777 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1676 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.0791 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.6154 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1>=0.0\n",
      "   +0.2562 if x2>=3.0\n",
      "   -0.0903 if x4-x2<=-3.0\n",
      "   +0.7225 if x1>=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0927 if x1>=1.0 & x2<=2.0 & x3-x1>=2.0\n",
      "   -0.3752 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.1685 if x4-x2>=-1.0\n",
      "   +0.2374 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.3775 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5813 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.0914 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.2687 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0356 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.3016 if c<=0.0 & x2<=2.0\n",
      "   +0.0269 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0298 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.1388 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1797 if x4-x2>=3.0\n",
      "   +0.5397 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1086 if c<=0.0 & x1<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3303 if x1<=0.0 & x4-x2>=2.0\n",
      "   -0.8050 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.0178 if x3-x1<=-1.0\n",
      "   +0.3119 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.7473 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.3279 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2668 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.1294 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.3163 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +0.0000 if x2<=1.0 & x3-x1<=-2.0 & x4-x2>=1.0\n",
      "   +0.2218 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.2674 if x1<=1.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.2451 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5272 if x4-x2>=3.0\n",
      "   +0.3405 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.2794 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0396 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.3619 if x2<=2.0 & x2>=2.0 & x3-x1<=-3.0 & x4-x2>=0.0\n",
      "init state [1 1 1 0 0]\n",
      "(8,) (8,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(20,) (12,)\n",
      "init state [ 1  3 -1 -3  0]\n",
      "(113,) (93,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(146,) (33,)\n",
      "init state [ 1  2 -1 -2  0]\n",
      "(209,) (63,)\n",
      "init state [0 1 2 1 0]\n",
      "(223,) (14,)\n",
      "init state [1 0 0 3 0]\n",
      "(230,) (7,)\n",
      "init state [0 1 1 2 0]\n",
      "(245,) (15,)\n",
      "init state [1 0 2 0 0]\n",
      "(292,) (47,)\n",
      "init state [1 1 0 2 0]\n",
      "(310,) (18,)\n",
      "============ 21 ===========\n",
      "Run episode 21 with rewards 24, accuracy 0.1\n",
      "----------------- 0 --------------\n",
      "   -0.3170 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   +0.1939 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.9820 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.2259 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4585 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.5518 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.9132 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3104 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.1630 if x2<=2.0 & x4-x2>=0.0\n",
      "   +0.0946 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.2033 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.3126 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1687 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4268 if x1>=1.0 & x2<=0.0 & x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   -0.0598 if x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.6642 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.4624 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1734 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.6673 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.1822 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.1764 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.3858 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.2535 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0719 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.2083 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.4425 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1>=0.0\n",
      "   +0.8211 if x2>=3.0\n",
      "   +0.9568 if x4-x2<=-3.0\n",
      "   +0.0000 if x1>=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1230 if x1>=1.0 & x2<=2.0 & x3-x1>=2.0\n",
      "   +0.1638 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.6223 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.3634 if x4-x2>=-1.0\n",
      "   +0.2791 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0897 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4762 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.1939 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.2817 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.2831 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.2479 if c<=0.0 & x2<=2.0\n",
      "   -0.1598 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.3197 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.2185 if x4-x2>=3.0\n",
      "   +0.1699 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1788 if c<=0.0 & x1<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0577 if x1<=0.0 & x4-x2>=2.0\n",
      "   -0.6872 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.4375 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.5037 if x3-x1<=-1.0\n",
      "   +0.1713 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.4596 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.3236 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5012 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.1151 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.3668 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +0.0067 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.2844 if x1<=1.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.4664 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0026 if x4-x2>=3.0\n",
      "   +0.0771 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.3354 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2008 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if x2<=2.0 & x2>=2.0 & x3-x1<=-3.0 & x4-x2>=0.0\n",
      "   -0.5422 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "init state [2 1 0 1 0]\n",
      "(3,) (3,)\n",
      "init state [ 2  1 -2  2  0]\n",
      "(10,) (7,)\n",
      "init state [ 2  2 -1 -1  0]\n",
      "(42,) (32,)\n",
      "init state [1 0 0 2 0]\n",
      "(51,) (9,)\n",
      "init state [1 0 2 2 0]\n",
      "(73,) (22,)\n",
      "init state [1 1 1 0 0]\n",
      "(82,) (9,)\n",
      "init state [ 2  1 -2  0  0]\n",
      "(119,) (37,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(148,) (29,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(160,) (12,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(170,) (10,)\n",
      "============ 22 ===========\n",
      "Run episode 22 with rewards 32, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.1180 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   +0.0567 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.5343 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.0857 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.5869 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.4515 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +1.0888 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2226 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.4458 if x2<=2.0 & x4-x2>=0.0\n",
      "   -0.0954 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1432 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.0711 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0560 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x3-x1>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3052 if x1>=1.0 & x2<=0.0 & x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.7158 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2856 if x1>=2.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.4745 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1513 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.1910 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0000 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.4779 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.5484 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.9952 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0000 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0\n",
      "   +0.1992 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.4281 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1>=0.0\n",
      "   +0.7757 if x2>=3.0\n",
      "   -0.0000 if x4-x2<=-3.0\n",
      "   +0.1563 if x1>=1.0 & x2<=2.0 & x3-x1>=2.0\n",
      "   +0.2727 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1528 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.3180 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   -0.5752 if x4-x2>=-1.0\n",
      "   +0.4290 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0346 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3747 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.0137 if x1<=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0730 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.4345 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.4622 if c<=0.0 & x2<=2.0\n",
      "   -0.2242 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.1192 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1194 if x4-x2>=3.0\n",
      "   -0.2872 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2063 if c<=0.0 & x1<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4731 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.2381 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.4162 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.1329 if x3-x1<=-1.0\n",
      "   -0.0219 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   +0.3476 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.3671 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3150 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.3609 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.4544 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +0.0986 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.0100 if x1<=1.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.3712 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2359 if x4-x2>=3.0\n",
      "   -0.0988 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.1823 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3295 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.3188 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   +1.0821 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "init state [ 2  3  0 -3  0]\n",
      "(18,) (18,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(28,) (10,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(39,) (11,)\n",
      "init state [ 1  3 -1 -1  0]\n",
      "(55,) (16,)\n",
      "init state [0 0 0 3 0]\n",
      "(69,) (14,)\n",
      "init state [ 1  3 -1 -3  0]\n",
      "(112,) (43,)\n",
      "init state [1 1 2 1 0]\n",
      "(149,) (37,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(174,) (25,)\n",
      "init state [ 2  0 -1  0  0]\n",
      "(197,) (23,)\n",
      "init state [3 0 0 2 0]\n",
      "(209,) (12,)\n",
      "============ 23 ===========\n",
      "Run episode 23 with rewards 30, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.0736 if c>=1.0 & x1>=2.0 & x2>=2.0\n",
      "   +0.3437 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.7463 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.1680 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6903 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0925 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.4817 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2103 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.1385 if x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4196 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.2287 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.3291 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1042 if x1>=1.0 & x2<=0.0 & x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.3446 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2156 if x1>=2.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "   -0.4322 if c<=0.0 & x2>=3.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.2992 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.2770 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.1032 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.2776 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.4343 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.1707 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.7737 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3756 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.0177 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1>=0.0\n",
      "   +0.3055 if x2>=3.0\n",
      "   +0.1078 if x4-x2<=-3.0\n",
      "   +0.2373 if x1>=1.0 & x2<=2.0 & x3-x1>=2.0\n",
      "   +0.7682 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0268 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0254 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.5511 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.0151 if x4-x2>=-1.0\n",
      "   +0.0682 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.2247 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4447 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.0789 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.5587 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.1124 if c<=0.0 & x2<=2.0\n",
      "   -0.1737 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.3115 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0512 if x4-x2>=3.0\n",
      "   -0.3478 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1395 if c<=0.0 & x1<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4692 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.0522 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.3956 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.6242 if x1>=3.0 & x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3011 if x3-x1<=-1.0\n",
      "   +0.0444 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.4151 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1873 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2727 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.0086 if c<=0.0 & x3-x1<=-1.0\n",
      "   +0.2988 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +0.1231 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.2603 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1442 if x4-x2>=3.0\n",
      "   +0.2847 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0317 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0697 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1703 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   +0.6311 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.6104 if x1>=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "init state [ 2  3  0 -3  0]\n",
      "(20,) (20,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(56,) (36,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(65,) (9,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(93,) (28,)\n",
      "init state [ 1  0 -1  3  0]\n",
      "(111,) (18,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(152,) (41,)\n",
      "init state [2 1 0 2 0]\n",
      "(160,) (8,)\n",
      "init state [ 2  3 -1 -1  0]\n",
      "(165,) (5,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(184,) (19,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(193,) (9,)\n",
      "============ 24 ===========\n",
      "Run episode 24 with rewards 33, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   +0.2391 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.9090 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.1559 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.5238 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.2435 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.6734 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0263 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.2843 if x2<=2.0 & x4-x2>=0.0\n",
      "   -0.0405 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1625 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.5777 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0837 if x1>=1.0 & x2<=0.0 & x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.7306 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0191 if x1>=2.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "   -0.2358 if c<=0.0 & x2>=3.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1511 if x4-x2<=-3.0\n",
      "----------------- 1 --------------\n",
      "   +0.9145 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.2282 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.1255 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.3282 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.4562 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.6698 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.4363 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1468 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.1649 if x2>=3.0\n",
      "   +0.0485 if x4-x2<=-3.0\n",
      "   +0.1441 if x1>=1.0 & x2<=2.0 & x3-x1>=2.0\n",
      "   +0.6117 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0167 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.1571 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2744 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.2309 if x1<=0.0 & x3-x1>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.1832 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0404 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4308 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.2561 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.4774 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.0413 if c<=0.0 & x2<=2.0\n",
      "   -0.1658 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.2561 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.2520 if x4-x2>=3.0\n",
      "   -0.2393 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3401 if c<=0.0 & x1<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.8482 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0157 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.1217 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0519 if x1>=3.0 & x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.1694 if x3-x1<=-1.0 & x4-x2<=-3.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.0974 if x3-x1<=-1.0\n",
      "   -0.3175 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.1540 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1899 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3843 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.3205 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   -0.0455 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1996 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0763 if x4-x2>=3.0\n",
      "   +0.2607 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.4896 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1064 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0340 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   +0.8244 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2695 if x1>=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "   +0.6325 if c>=1.0 & x1>=1.0\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(64,) (64,)\n",
      "init state [0 1 0 2 0]\n",
      "(72,) (8,)\n",
      "init state [ 2  1 -2  0  0]\n",
      "(85,) (13,)\n",
      "init state [ 2  3 -2  0  0]\n",
      "(91,) (6,)\n",
      "init state [2 1 1 0 0]\n",
      "(96,) (5,)\n",
      "init state [0 1 2 2 0]\n",
      "(111,) (15,)\n",
      "init state [3 0 0 2 0]\n",
      "(119,) (8,)\n",
      "init state [ 2  0 -1  2  0]\n",
      "(126,) (7,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(145,) (19,)\n",
      "init state [1 0 0 3 0]\n",
      "(150,) (5,)\n",
      "============ 25 ===========\n",
      "Run episode 25 with rewards 37, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.0422 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.6045 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4891 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4520 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.5299 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +1.0238 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0818 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.3335 if x2<=2.0 & x4-x2>=0.0\n",
      "   -0.2427 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.2035 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.2878 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0522 if x1>=1.0 & x2<=0.0 & x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.6997 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c<=0.0 & x2>=3.0 & x3-x1<=-1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0060 if x4-x2<=-3.0\n",
      "   -0.2428 if x3-x1>=0.0 & x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.7696 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3616 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.4075 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.0000 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0819 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.5647 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.2273 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1622 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.7009 if x2>=3.0\n",
      "   +0.3771 if x4-x2<=-3.0\n",
      "   -0.0000 if x1>=1.0 & x2<=2.0 & x3-x1>=2.0\n",
      "   +0.3444 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1604 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1352 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.1834 if x1<=0.0 & x3-x1>=2.0\n",
      "   -0.3424 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.0643 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2445 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2404 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.0741 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0331 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.0740 if c<=0.0 & x2<=2.0\n",
      "   -0.2090 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   +0.1704 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.6062 if x4-x2>=3.0\n",
      "   +0.1601 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2995 if c<=0.0 & x1<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.9587 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.2208 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.3461 if x3-x1<=-1.0 & x4-x2<=-3.0\n",
      "   +0.5405 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.1332 if x3-x1<=-1.0\n",
      "   +0.0122 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2>=0.0\n",
      "   -0.2371 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.4470 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0903 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.2802 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +0.1929 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.2771 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2608 if x4-x2>=3.0\n",
      "   +0.3118 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.2193 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3025 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +1.0469 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1510 if x1>=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "   +0.2775 if c>=1.0 & x1>=1.0\n",
      "   +0.2970 if x3-x1<=-3.0\n",
      "init state [2 0 1 1 0]\n",
      "(11,) (11,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(30,) (19,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(40,) (10,)\n",
      "init state [ 2  0 -2  0  0]\n",
      "(113,) (73,)\n",
      "init state [2 0 1 0 0]\n",
      "(121,) (8,)\n",
      "init state [ 1  2 -1 -1  0]\n",
      "(134,) (13,)\n",
      "init state [ 1  3  0 -2  0]\n",
      "(176,) (42,)\n",
      "init state [0 1 0 1 0]\n",
      "(197,) (21,)\n",
      "init state [0 2 1 1 0]\n",
      "(203,) (6,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(221,) (18,)\n",
      "============ 26 ===========\n",
      "Run episode 26 with rewards 24, accuracy 0.7\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   +0.3278 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.6400 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.0250 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0841 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0343 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.5926 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2775 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.1298 if x2<=2.0 & x4-x2>=0.0\n",
      "   -0.0898 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1134 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.2939 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0000 if x1>=1.0 & x2<=0.0 & x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.8122 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0560 if x4-x2<=-3.0\n",
      "   -0.0000 if x3-x1>=0.0 & x4-x2>=3.0\n",
      "   -0.1866 if x2<=1.0 & x3-x1>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.3474 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.7063 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0658 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   -0.1729 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1576 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.3036 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.6547 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1487 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.4381 if x2>=3.0\n",
      "   +0.1011 if x4-x2<=-3.0\n",
      "   +0.3240 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0809 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0513 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.0000 if x1<=0.0 & x3-x1>=2.0\n",
      "   +0.0746 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.6621 if x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.5835 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0891 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3822 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.3491 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0628 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.3593 if c<=0.0 & x2<=2.0\n",
      "   -0.0393 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.0201 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   -0.0886 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2844 if c<=0.0 & x1<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4638 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.0207 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1462 if x3-x1<=-1.0 & x4-x2<=-3.0\n",
      "   -0.1360 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1867 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "----------------- 3 --------------\n",
      "   -0.4366 if x3-x1<=-1.0\n",
      "   +0.2421 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.7559 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1495 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.2112 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +0.7042 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1185 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0000 if x4-x2>=3.0\n",
      "   +0.2095 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0078 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0000 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2059 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1367 if x1>=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "   +0.5595 if c>=1.0 & x1>=1.0\n",
      "   -0.6900 if x3-x1<=-3.0\n",
      "   -0.6548 if x1>=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "init state [0 0 1 3 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(13,) (13,)\n",
      "init state [ 3  2 -1  1  0]\n",
      "(17,) (4,)\n",
      "init state [ 0  2  2 -2  0]\n",
      "(89,) (72,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(126,) (37,)\n",
      "init state [ 0  2  1 -1  0]\n",
      "(164,) (38,)\n",
      "init state [ 0  1  3 -1  0]\n",
      "(173,) (9,)\n",
      "init state [1 1 0 1 0]\n",
      "(179,) (6,)\n",
      "init state [0 1 2 2 0]\n",
      "(188,) (9,)\n",
      "init state [0 0 1 0 0]\n",
      "(197,) (9,)\n",
      "init state [ 3  1 -2 -1  0]\n",
      "(221,) (24,)\n",
      "============ 27 ===========\n",
      "Run episode 27 with rewards 18, accuracy 0.7\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.5977 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.5188 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.0576 if c<=0.0 & x1<=1.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0637 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.4769 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.9092 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2787 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.1972 if x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3150 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0740 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.0792 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.8681 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2047 if x4-x2<=-3.0\n",
      "   +0.1485 if x3-x1>=0.0 & x4-x2>=3.0\n",
      "   -0.3343 if x2<=1.0 & x3-x1>=2.0\n",
      "   -0.4475 if x1>=3.0 & x2>=2.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.2672 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4636 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.2118 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.1531 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.3311 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.4530 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.3568 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4748 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.6331 if x2>=3.0\n",
      "   +0.4829 if x4-x2<=-3.0\n",
      "   +0.4219 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0988 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1760 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.7432 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0179 if x2<=2.0 & x2>=2.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.6418 if x4-x2>=3.0\n",
      "----------------- 2 --------------\n",
      "   -0.4938 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0752 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.7354 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.3514 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.2902 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.3674 if c<=0.0 & x2<=2.0\n",
      "   -0.1712 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.3514 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1734 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.6429 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.2234 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0525 if x3-x1<=-1.0 & x4-x2<=-3.0\n",
      "   -0.0869 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1034 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.3600 if x4-x2>=3.0\n",
      "----------------- 3 --------------\n",
      "   -0.0722 if x3-x1<=-1.0\n",
      "   -0.4416 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.0326 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4141 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.3378 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +0.3021 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.2351 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3570 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.0369 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2069 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.8850 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.4378 if x1>=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "   +0.5778 if c>=1.0 & x1>=1.0\n",
      "   -0.0000 if x3-x1<=-3.0\n",
      "   -0.4366 if x1>=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.2965 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "init state [ 2  2  0 -2  0]\n",
      "(13,) (13,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(92,) (79,)\n",
      "init state [0 0 0 2 0]\n",
      "(112,) (20,)\n",
      "init state [0 0 2 2 0]\n",
      "(133,) (21,)\n",
      "init state [1 0 1 1 0]\n",
      "(151,) (18,)\n",
      "init state [0 2 2 1 0]\n",
      "(163,) (12,)\n",
      "init state [1 0 2 0 0]\n",
      "(176,) (13,)\n",
      "init state [2 0 0 2 0]\n",
      "(197,) (21,)\n",
      "init state [ 1  1 -1  0  0]\n",
      "(215,) (18,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(222,) (7,)\n",
      "============ 28 ===========\n",
      "Run episode 28 with rewards 35, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.6338 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.6314 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.1895 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.3264 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.6748 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1285 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.1273 if x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3790 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0849 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.3979 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.9184 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1213 if x4-x2<=-3.0\n",
      "   -0.0731 if x3-x1>=0.0 & x4-x2>=3.0\n",
      "   -0.0886 if x2<=1.0 & x3-x1>=2.0\n",
      "   -0.2344 if x1>=3.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   +0.1364 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.0272 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.5892 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0070 if x2>=2.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.5046 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.3307 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.0961 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.1831 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4856 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.3866 if x2>=3.0\n",
      "   +0.1870 if x4-x2<=-3.0\n",
      "   +0.6341 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.4424 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1039 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.9222 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.3167 if x4-x2>=3.0\n",
      "   -0.5414 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.0880 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1790 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2903 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.1476 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.5024 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0240 if c<=0.0 & x2<=2.0\n",
      "   -0.2642 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.1917 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1997 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.9266 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.5671 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3559 if x3-x1<=-1.0 & x4-x2<=-3.0\n",
      "   +0.2787 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.1791 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.1338 if x4-x2>=3.0\n",
      "   +0.3965 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.1949 if x3-x1<=-1.0\n",
      "   -0.4607 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.2016 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0679 if c>=1.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.2649 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   +0.2669 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.2391 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1221 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.2658 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4607 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.6814 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.4619 if x1>=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "   +0.7684 if c>=1.0 & x1>=1.0\n",
      "   -0.1008 if x1>=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.1591 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.1843 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "init state [ 2  1 -2  1  0]\n",
      "(15,) (15,)\n",
      "init state [1 1 2 0 0]\n",
      "(63,) (48,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(110,) (47,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(125,) (15,)\n",
      "init state [ 0  2  2 -2  0]\n",
      "(142,) (17,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(162,) (20,)\n",
      "init state [ 0  3  0 -2  0]\n",
      "(183,) (21,)\n",
      "init state [ 1  3 -1 -2  0]\n",
      "(194,) (11,)\n",
      "init state [ 1  2 -1  0  0]\n",
      "(211,) (17,)\n",
      "init state [ 3  1 -1 -1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(236,) (25,)\n",
      "============ 29 ===========\n",
      "Run episode 29 with rewards 17, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   +0.1976 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.7733 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.0778 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.3595 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.9768 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3418 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.0662 if x2<=2.0 & x4-x2>=0.0\n",
      "   -0.1363 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.3386 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.4746 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1701 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0004 if x4-x2<=-3.0\n",
      "   -0.2106 if x2<=1.0 & x3-x1>=2.0\n",
      "   +0.0000 if x1>=3.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.7013 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.4713 if x4-x2<=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.0221 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.5198 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.4604 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.1070 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.2701 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.2807 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3282 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.7048 if x2>=3.0\n",
      "   +0.0864 if x4-x2<=-3.0\n",
      "   +0.3456 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0971 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2125 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.1128 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0000 if x4-x2>=3.0\n",
      "   +0.0458 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   +0.8935 if x1>=2.0 & x3-x1>=-2.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.0548 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1748 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5150 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.2344 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.5910 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.0800 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0519 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4744 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.6560 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1072 if x3-x1<=-1.0 & x4-x2<=-3.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.3495 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +0.1226 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4044 if x1<=1.0 & x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   -0.2864 if x3-x1<=-1.0\n",
      "   -0.0611 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.2378 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0013 if c>=1.0 & x1>=3.0 & x4-x2>=0.0\n",
      "   -0.1282 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1502 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1142 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.1443 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0219 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2244 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.3752 if x1>=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "   +0.5905 if c>=1.0 & x1>=1.0\n",
      "   +0.0577 if x1>=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.3561 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.0461 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   +0.6170 if x1>=3.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "init state [ 0  3  3 -1  0]\n",
      "(10,) (10,)\n",
      "init state [ 3  0 -1  1  0]\n",
      "(29,) (19,)\n",
      "init state [2 0 0 1 0]\n",
      "(58,) (29,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(66,) (8,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(92,) (26,)\n",
      "init state [2 0 1 1 0]\n",
      "(97,) (5,)\n",
      "init state [2 0 0 3 0]\n",
      "(111,) (14,)\n",
      "init state [0 2 1 0 0]\n",
      "(127,) (16,)\n",
      "init state [0 2 0 1 0]\n",
      "(138,) (11,)\n",
      "init state [ 2  3  0 -1  0]\n",
      "(145,) (7,)\n",
      "============ 30 ===========\n",
      "Run episode 30 with rewards 35, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   +0.1167 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.5212 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.3630 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0976 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1094 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2635 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.1256 if x2<=2.0 & x4-x2>=0.0\n",
      "   -0.1103 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.5053 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.3898 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.6218 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x4-x2<=-3.0\n",
      "   -0.0434 if x2<=1.0 & x3-x1>=2.0\n",
      "   -0.6433 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.3319 if x4-x2<=-2.0\n",
      "   -0.4751 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.2792 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.2795 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.0001 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.3219 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.3706 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.4017 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1264 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.4319 if x2>=3.0\n",
      "   +0.0000 if x4-x2<=-3.0\n",
      "   +0.5012 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1162 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1603 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.2832 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1763 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   +0.0672 if x1>=2.0 & x3-x1>=-2.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.7384 if c<=0.0 & x2>=2.0 & x3-x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.0090 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2780 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2602 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.1091 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0529 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0991 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.1897 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0584 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.5381 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.5104 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if x3-x1<=-1.0 & x4-x2<=-3.0\n",
      "   -0.0195 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.4382 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.1046 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1186 if x1<=1.0 & x2<=0.0\n",
      "   +0.8317 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   -0.0292 if x3-x1<=-1.0\n",
      "   +0.0645 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.0670 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0640 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.0417 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0256 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   -0.2095 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.7476 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.4051 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0387 if x1>=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "   +0.6474 if c>=1.0 & x1>=1.0\n",
      "   -0.1165 if x1>=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.0586 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.0551 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   +0.5976 if x1>=3.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.3917 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "init state [ 0  3  2 -3  0]\n",
      "(20,) (20,)\n",
      "init state [ 3  0 -2  0  0]\n",
      "(74,) (54,)\n",
      "init state [ 2  2 -1 -1  0]\n",
      "(119,) (45,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(146,) (27,)\n",
      "init state [ 1  0 -1  0  0]\n",
      "(226,) (80,)\n",
      "init state [ 2  1 -1  2  0]\n",
      "(248,) (22,)\n",
      "init state [ 2  2 -1 -2  0]\n",
      "(293,) (45,)\n",
      "init state [ 3  1 -1  2  0]\n",
      "(305,) (12,)\n",
      "init state [1 2 0 1 0]\n",
      "(308,) (3,)\n",
      "init state [1 0 2 2 0]\n",
      "(313,) (5,)\n",
      "============ 31 ===========\n",
      "Run episode 31 with rewards 37, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.2072 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.4530 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.3365 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0703 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.3128 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2056 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.0373 if x2<=2.0 & x4-x2>=0.0\n",
      "   -0.1412 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0667 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.4152 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4558 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0509 if x2<=1.0 & x3-x1>=2.0\n",
      "   -0.5833 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.4522 if x4-x2<=-2.0\n",
      "   -0.4293 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.4435 if x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=2.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   +0.2993 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.6728 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.2375 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0982 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.0677 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.7301 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0623 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.3045 if x2>=3.0\n",
      "   -0.0180 if x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0306 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1611 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.1440 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1920 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   +0.1726 if x1>=2.0 & x3-x1>=-2.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.1830 if c<=0.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   +0.3898 if x3-x1>=2.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.3801 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0356 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0704 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.1043 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.4033 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.0615 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.1206 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1928 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.5305 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.8072 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0503 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0345 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2606 if x1<=1.0 & x2<=0.0\n",
      "   +0.4735 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -1.0592 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.1004 if x3-x1<=-1.0\n",
      "   -0.4114 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.4268 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0469 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1137 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.6904 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3874 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.4844 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2447 if x1>=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "   +0.9217 if c>=1.0 & x1>=1.0\n",
      "   +0.0000 if x1>=2.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.1620 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.1327 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   +0.1608 if x1>=3.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.2794 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.2085 if x4-x2>=3.0\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(20,) (20,)\n",
      "init state [ 1  2  0 -1  0]\n",
      "(28,) (8,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(45,) (17,)\n",
      "init state [ 1  3  0 -3  0]\n",
      "(59,) (14,)\n",
      "init state [1 1 0 1 0]\n",
      "(71,) (12,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(75,) (4,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(96,) (21,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(124,) (28,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(130,) (6,)\n",
      "init state [ 2  0 -1  0  0]\n",
      "(140,) (10,)\n",
      "============ 32 ===========\n",
      "Run episode 32 with rewards 32, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.0399 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3137 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4038 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0454 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.7720 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1495 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.1495 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.2891 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3205 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0139 if x2<=1.0 & x3-x1>=2.0\n",
      "   -0.4004 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.1078 if x4-x2<=-2.0\n",
      "   -0.2933 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0000 if x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   -0.8566 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "----------------- 1 --------------\n",
      "   -0.0425 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.6530 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.3372 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0486 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.2751 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.4346 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0564 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.5113 if x2>=3.0\n",
      "   -0.0895 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2102 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.0895 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1112 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.0780 if x1>=2.0 & x3-x1>=-2.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.1112 if c<=0.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2>=2.0\n",
      "   -0.8540 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.1913 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0262 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0891 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.1932 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.4725 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0294 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   +0.1932 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1390 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.5877 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.3359 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1792 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.0263 if x1<=1.0 & x2<=0.0\n",
      "   +0.2680 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.6483 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +1.0265 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.1410 if x3-x1<=-1.0\n",
      "   -0.2164 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.2137 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1544 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.0811 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2195 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.4003 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0391 if x1>=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "   +0.7663 if c>=1.0 & x1>=1.0\n",
      "   -0.0269 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.0154 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   -0.0700 if x1>=3.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.0154 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   -0.4359 if x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x4-x2<=-2.0\n",
      "init state [ 3  1 -3  1  0]\n",
      "(13,) (13,)\n",
      "init state [ 2  2  0 -1  0]\n",
      "(31,) (18,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(61,) (30,)\n",
      "init state [0 1 0 1 0]\n",
      "(79,) (18,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(118,) (39,)\n",
      "init state [0 1 2 0 0]\n",
      "(133,) (15,)\n",
      "init state [ 3  1 -2  2  0]\n",
      "(161,) (28,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(189,) (28,)\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(200,) (11,)\n",
      "init state [ 3  2 -2 -2  0]\n",
      "(242,) (42,)\n",
      "============ 33 ===========\n",
      "Run episode 33 with rewards 0, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.4156 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.8452 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.2764 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.1239 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.4573 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1487 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.2210 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.5424 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3478 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0106 if x2<=1.0 & x3-x1>=2.0\n",
      "   -0.4937 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.0514 if x4-x2<=-2.0\n",
      "   -0.4302 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0000 if x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.0085 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.6274 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.3234 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.5766 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.2526 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0352 if x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   -0.2299 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.2686 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3660 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.8601 if x2>=3.0\n",
      "   -0.5661 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0885 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.1911 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.1042 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   +0.1648 if x1>=2.0 & x3-x1>=-2.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.0800 if c<=0.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   -0.5681 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.4400 if x1<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   -0.1545 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0723 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0219 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.2094 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.5854 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.3828 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.3625 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.4596 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3423 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.5629 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2471 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.0131 if x1<=1.0 & x2<=0.0\n",
      "   +0.1663 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.7911 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0568 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4951 if x1>=1.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   -0.1088 if x3-x1<=-1.0\n",
      "   -0.1499 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1294 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3123 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.2825 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1661 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0405 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.5159 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2252 if x1>=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "   +0.8501 if c>=1.0 & x1>=1.0\n",
      "   +0.1224 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.2120 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   +0.0378 if x1>=3.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.0797 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   -0.3635 if x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x4-x2<=-2.0\n",
      "   +0.5290 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "init state [0 0 1 2 0]\n",
      "(17,) (17,)\n",
      "init state [ 2  3 -1  0  0]\n",
      "(31,) (14,)\n",
      "init state [ 0  1  0 -1  0]\n",
      "(38,) (7,)\n",
      "init state [ 1  0 -1  0  0]\n",
      "(57,) (19,)\n",
      "init state [ 2  0 -1  1  0]\n",
      "(68,) (11,)\n",
      "init state [ 1  3  1 -3  0]\n",
      "(99,) (31,)\n",
      "init state [ 3  0 -2  3  0]\n",
      "(117,) (18,)\n",
      "init state [ 1  1 -1  2  0]\n",
      "(129,) (12,)\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(147,) (18,)\n",
      "init state [ 2  2  1 -1  0]\n",
      "(174,) (27,)\n",
      "============ 34 ===========\n",
      "Run episode 34 with rewards 15, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.1919 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.5343 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.1986 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.1656 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.7696 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3401 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.0159 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1548 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3254 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x2<=1.0 & x3-x1>=2.0\n",
      "   -0.0925 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.2008 if x4-x2<=-2.0\n",
      "   -0.7612 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1717 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.2599 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3428 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.3683 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.6279 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.1191 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0034 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.4546 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3049 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.9605 if x2>=3.0\n",
      "   -0.0083 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0578 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.5968 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.3688 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   +0.0011 if x1>=2.0 & x3-x1>=-2.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.3811 if c<=0.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   -0.4945 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.3074 if x1<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0299 if c>=1.0 & x1<=0.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.4980 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0283 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2745 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.2214 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.6387 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.4085 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.2825 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3060 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.7340 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.3756 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0200 if x1>=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.1520 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.7400 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1929 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5089 if x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.5133 if x2<=1.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.1366 if x3-x1<=-1.0\n",
      "   +0.0624 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.4371 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.6115 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1643 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0455 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1797 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0204 if x1>=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "   +0.2571 if c>=1.0 & x1>=1.0\n",
      "   +0.2314 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.0372 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   +0.3985 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.0315 if x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x4-x2<=-2.0\n",
      "   +0.0000 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.5409 if x1>=3.0 & x3-x1>=0.0\n",
      "init state [2 0 1 1 0]\n",
      "(8,) (8,)\n",
      "init state [ 1  3  2 -3  0]\n",
      "(32,) (24,)\n",
      "init state [0 0 1 1 0]\n",
      "(44,) (12,)\n",
      "init state [ 0  3  0 -3  0]\n",
      "(76,) (32,)\n",
      "init state [ 2  3  1 -1  0]\n",
      "(86,) (10,)\n",
      "init state [ 0  2  0 -1  0]\n",
      "(96,) (10,)\n",
      "init state [ 3  1 -2 -1  0]\n",
      "(108,) (12,)\n",
      "init state [ 3  0 -2  3  0]\n",
      "(126,) (18,)\n",
      "init state [ 1  2  2 -1  0]\n",
      "(141,) (15,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(148,) (7,)\n",
      "============ 35 ===========\n",
      "Run episode 35 with rewards 35, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.0011 if x1<=2.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.0824 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.1004 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0729 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.5447 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1170 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.2747 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0986 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1267 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0722 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.6335 if x4-x2<=-2.0\n",
      "   -0.7972 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.3187 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.2629 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1274 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.3031 if x3-x1>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.2537 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4040 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0612 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1857 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.3934 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0864 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +1.0730 if x2>=3.0\n",
      "   +0.2835 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3569 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.0000 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.4949 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   +0.0232 if c<=0.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   -0.4145 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.3050 if x1<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0000 if c>=1.0 & x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7286 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.2515 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1108 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2409 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.0148 if x2<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.8651 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.3564 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.1143 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1724 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.5440 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.2760 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2928 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4486 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.6477 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.6130 if x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.4287 if x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3937 if x1>=2.0 & x1>=3.0 & x3-x1>=-2.0 & x4-x2<=-3.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   -0.0694 if x3-x1<=-1.0\n",
      "   +0.7565 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1020 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5279 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.3231 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3669 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1127 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0335 if x1>=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0\n",
      "   +0.4489 if c>=1.0 & x1>=1.0\n",
      "   +0.1043 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.0598 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   +0.0882 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.2973 if x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x4-x2<=-2.0\n",
      "   +0.3089 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2295 if x1>=3.0 & x3-x1>=0.0\n",
      "   -0.7110 if c<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "init state [ 3  0 -1  0  0]\n",
      "(13,) (13,)\n",
      "init state [ 2  0 -1  2  0]\n",
      "(29,) (16,)\n",
      "init state [ 0  2  1 -1  0]\n",
      "(65,) (36,)\n",
      "init state [1 0 1 3 0]\n",
      "(71,) (6,)\n",
      "init state [1 0 0 3 0]\n",
      "(110,) (39,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(132,) (22,)\n",
      "init state [ 2  3 -2  0  0]\n",
      "(139,) (7,)\n",
      "init state [0 2 3 0 0]\n",
      "(186,) (47,)\n",
      "init state [2 1 0 1 0]\n",
      "(189,) (3,)\n",
      "init state [ 3  0 -2  2  0]\n",
      "(222,) (33,)\n",
      "============ 36 ===========\n",
      "Run episode 36 with rewards 9, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.4945 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.3153 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.2078 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.6623 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0358 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.3306 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1356 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1125 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0748 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.0706 if x4-x2<=-2.0\n",
      "   -0.1818 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2493 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.1636 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1785 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.0184 if x3-x1>=3.0\n",
      "   -0.4179 if x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.1857 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.5592 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.1444 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1842 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.4070 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1271 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.7244 if x2>=3.0\n",
      "   +0.4298 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2501 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.0535 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0873 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.4012 if c<=0.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   -0.4152 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.5048 if x1<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.4584 if x2>=3.0 & x3-x1<=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.0201 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1546 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0114 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.5307 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.1742 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   +0.6971 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.9663 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3811 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.1857 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2954 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3477 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.4100 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.1958 if x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.5278 if x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0000 if x1>=2.0 & x1>=3.0 & x3-x1>=-2.0 & x4-x2<=-3.0\n",
      "   -0.1801 if x2<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.2339 if x3-x1<=-1.0\n",
      "   +0.3734 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.3933 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3246 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.3947 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.5022 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3971 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5324 if c>=1.0 & x1>=1.0\n",
      "   -0.3312 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   -0.1299 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   -0.1299 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   -0.2303 if x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x4-x2<=-2.0\n",
      "   +0.2576 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.4037 if x1>=3.0 & x3-x1>=0.0\n",
      "   -0.0908 if c<=0.0 & x2<=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   +0.2184 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "init state [2 1 0 2 0]\n",
      "(11,) (11,)\n",
      "init state [ 3  2 -1 -1  0]\n",
      "(18,) (7,)\n",
      "init state [0 1 0 2 0]\n",
      "(29,) (11,)\n",
      "init state [ 3  2  0 -2  0]\n",
      "(185,) (156,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(192,) (7,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(215,) (23,)\n",
      "init state [ 1  2 -1  1  0]\n",
      "(232,) (17,)\n",
      "init state [0 2 1 0 0]\n",
      "(260,) (28,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(274,) (14,)\n",
      "init state [0 1 3 0 0]\n",
      "(283,) (9,)\n",
      "============ 37 ===========\n",
      "Run episode 37 with rewards 33, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.5737 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4400 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.2593 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.4225 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4020 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.4693 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.9715 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4861 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2509 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.3269 if x4-x2<=-2.0\n",
      "   -0.4313 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.4363 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.4971 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0462 if c<=0.0 & x1<=1.0 & x2<=2.0 & x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.1446 if x4-x2>=3.0\n",
      "   +0.6501 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.2561 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.7132 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.0567 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0644 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.5830 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1219 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.3802 if x2>=3.0\n",
      "   -0.1188 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0633 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.2850 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.4159 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.0409 if c<=0.0 & x2>=2.0 & x3-x1>=1.0\n",
      "   -0.4646 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1738 if x1<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0445 if x2>=3.0 & x3-x1<=-1.0\n",
      "   -0.4680 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.4741 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2100 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.1086 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.4558 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.2927 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   +0.5065 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.5539 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4431 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.6303 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1855 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2028 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.3815 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2195 if x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0873 if x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1882 if x2<=1.0\n",
      "   +0.3696 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.2684 if x3-x1<=-1.0\n",
      "   -0.2063 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.3314 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1889 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.3564 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2964 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3041 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5995 if c>=1.0 & x1>=1.0\n",
      "   -0.1929 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.3545 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   +0.0995 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   -0.0702 if x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x4-x2<=-2.0\n",
      "   +0.2780 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.4292 if x1>=3.0 & x3-x1>=0.0\n",
      "   +0.1689 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.1767 if x3-x1<=-3.0\n",
      "init state [0 0 1 0 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(13,) (13,)\n",
      "init state [ 0  3  2 -2  0]\n",
      "(36,) (23,)\n",
      "init state [ 2  1 -1 -1  0]\n",
      "(60,) (24,)\n",
      "init state [ 1  1  1 -1  0]\n",
      "(82,) (22,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(90,) (8,)\n",
      "init state [0 1 1 0 0]\n",
      "(120,) (30,)\n",
      "init state [ 2  3 -2 -1  0]\n",
      "(131,) (11,)\n",
      "init state [ 0  2  2 -1  0]\n",
      "(155,) (24,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(199,) (44,)\n",
      "init state [ 1  0 -1  3  0]\n",
      "(210,) (11,)\n",
      "============ 38 ===========\n",
      "Run episode 38 with rewards 31, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.3143 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4043 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.2067 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.5858 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1680 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.1385 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.3876 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.3231 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4724 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.5974 if x4-x2<=-2.0\n",
      "   -0.6922 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.4613 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.0441 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0735 if x4-x2>=3.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2680 if c<=0.0 & x3-x1<=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.3199 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4662 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.0733 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2576 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.4920 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2113 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.3521 if x2>=3.0\n",
      "   -0.0304 if c<=0.0 & x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1794 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.0475 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1350 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.5097 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1111 if x1<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2950 if x2>=3.0 & x3-x1<=-1.0\n",
      "   -0.1973 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   -0.4800 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.1965 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1469 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1139 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.6346 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0706 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   +0.1773 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0208 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4994 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.3304 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4949 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5756 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.2401 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.0139 if x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0808 if x2<=1.0\n",
      "   +0.1944 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.1290 if c>=1.0 & x4-x2<=2.0 & x4-x2>=-2.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   -0.1649 if x3-x1<=-1.0\n",
      "   +0.0741 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1864 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4354 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.1062 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2304 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.6192 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7070 if c>=1.0 & x1>=1.0\n",
      "   -0.1008 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.0000 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   +0.3290 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   -0.2816 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1>=3.0 & x3-x1>=0.0\n",
      "   -0.3150 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.0000 if x3-x1<=-3.0\n",
      "   -0.5476 if x2>=3.0 & x4-x2>=-1.0\n",
      "init state [0 1 3 1 0]\n",
      "(18,) (18,)\n",
      "init state [0 1 3 0 0]\n",
      "(48,) (30,)\n",
      "init state [1 3 1 0 0]\n",
      "(59,) (11,)\n",
      "init state [3 0 0 2 0]\n",
      "(65,) (6,)\n",
      "init state [2 1 1 0 0]\n",
      "(71,) (6,)\n",
      "init state [ 3  0 -1  1  0]\n",
      "(79,) (8,)\n",
      "init state [ 3  2 -2 -2  0]\n",
      "(105,) (26,)\n",
      "init state [ 1  2 -1 -1  0]\n",
      "(140,) (35,)\n",
      "init state [ 3  1 -2 -1  0]\n",
      "(164,) (24,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(280,) (116,)\n",
      "============ 39 ===========\n",
      "Run episode 39 with rewards -74, accuracy 0.7\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.4410 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.0621 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.2552 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2369 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.0105 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1344 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1352 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0973 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.4788 if x4-x2<=-2.0\n",
      "   -0.6434 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2360 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.0150 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +0.2156 if c<=0.0 & x3-x1<=-2.0\n",
      "   -0.5411 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.1030 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.6957 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0117 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0049 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.3960 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0285 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.3223 if x2>=3.0\n",
      "   +0.1196 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.0988 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.4143 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.7454 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0205 if x1<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2502 if x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.2731 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.3737 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.2147 if x1<=2.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-3.0\n",
      "----------------- 2 --------------\n",
      "   -0.0148 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1587 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1119 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.5859 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1<=-1.0 & x4-x2>=0.0\n",
      "   -0.0742 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0033 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4225 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.2680 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0276 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4412 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.3397 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.0112 if x2<=1.0\n",
      "   +0.2786 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.0500 if c>=1.0 & x4-x2<=2.0 & x4-x2>=-2.0 & x4-x2>=1.0\n",
      "   -0.8154 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.1004 if x3-x1<=-1.0\n",
      "   -0.4603 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.4234 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4875 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.0412 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0971 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.7462 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7910 if c>=1.0 & x1>=1.0\n",
      "   +0.2173 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.2233 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   +0.0000 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.0539 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.0499 if x1>=3.0 & x3-x1>=0.0\n",
      "   -0.1168 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.0031 if x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.4122 if x1>=1.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "init state [2 1 1 0 0]\n",
      "(21,) (21,)\n",
      "init state [1 1 1 0 0]\n",
      "(29,) (8,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(72,) (43,)\n",
      "init state [ 2  1 -1  1  0]\n",
      "(78,) (6,)\n",
      "init state [ 2  3  1 -1  0]\n",
      "(82,) (4,)\n",
      "init state [2 0 1 2 0]\n",
      "(90,) (8,)\n",
      "init state [ 3  2 -1  1  0]\n",
      "(102,) (12,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(119,) (17,)\n",
      "init state [ 1  2 -1  1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(132,) (13,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(165,) (33,)\n",
      "============ 40 ===========\n",
      "Run episode 40 with rewards 9, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.4337 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.2387 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.3067 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.0195 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0575 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.1162 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.2619 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0326 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3860 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1550 if x4-x2<=-2.0\n",
      "   -0.6084 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.3507 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.1616 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0007 if c<=0.0 & x3-x1<=-2.0\n",
      "   -0.2963 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.3931 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.1393 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1179 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.2166 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.6410 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2728 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.5305 if x2>=3.0\n",
      "   +0.2169 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.1100 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.4489 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.5377 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1042 if x1<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1949 if x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.3178 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.5544 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.3341 if x1<=2.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-3.0\n",
      "   +0.4057 if x2<=1.0 & x3-x1>=3.0\n",
      "----------------- 2 --------------\n",
      "   +0.3199 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0642 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3117 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.3191 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.3372 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.4217 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.8290 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.0742 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3651 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3577 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.5959 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2028 if x2<=1.0\n",
      "   +0.0482 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.0000 if c>=1.0 & x4-x2<=2.0 & x4-x2>=-2.0 & x4-x2>=1.0\n",
      "   -0.0000 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.6375 if x3-x1>=0.0 & x4-x2>=1.0 & x4-x2>=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.2844 if x3-x1<=-1.0\n",
      "   +0.2386 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.3277 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0900 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.2941 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0546 if x2>=3.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.8150 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4752 if c>=1.0 & x1>=1.0\n",
      "   +0.0876 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   -0.4933 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   -0.1045 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2031 if x1>=3.0 & x3-x1>=0.0\n",
      "   +0.0567 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.1735 if x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.1242 if x1>=1.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.4754 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "init state [ 2  1 -1  2  0]\n",
      "(7,) (7,)\n",
      "init state [0 1 0 2 0]\n",
      "(57,) (50,)\n",
      "init state [ 0  3  1 -3  0]\n",
      "(114,) (57,)\n",
      "init state [2 0 0 1 0]\n",
      "(123,) (9,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(130,) (7,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(144,) (14,)\n",
      "init state [2 0 1 1 0]\n",
      "(152,) (8,)\n",
      "init state [2 0 0 3 0]\n",
      "(158,) (6,)\n",
      "init state [0 2 1 0 0]\n",
      "(164,) (6,)\n",
      "init state [0 2 0 1 0]\n",
      "(177,) (13,)\n",
      "============ 41 ===========\n",
      "Run episode 41 with rewards 29, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.6440 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.2616 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.1785 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.7083 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2417 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.0309 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0801 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0779 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.5153 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.3476 if x4-x2<=-2.0\n",
      "   -0.1974 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1309 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.2454 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3274 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.4004 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.3706 if x2<=0.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.3297 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4365 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.0000 if c<=0.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3657 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1624 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.4494 if x2>=3.0\n",
      "   -0.3185 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.2578 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.1865 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.4160 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0196 if x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.0415 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.2843 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.1986 if x1<=2.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-3.0\n",
      "   -0.0000 if x2<=1.0 & x3-x1>=3.0\n",
      "   +1.1125 if x2<=0.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.1788 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.3896 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0106 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.1313 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0662 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.2893 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.8387 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.3099 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4922 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3812 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.4298 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.0741 if x2<=1.0\n",
      "   +0.1573 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0828 if x3-x1>=0.0 & x4-x2>=1.0 & x4-x2>=2.0\n",
      "   +0.4919 if c<=0.0 & x1<=2.0 & x2<=0.0 & x3-x1<=0.0\n",
      "----------------- 3 --------------\n",
      "   -0.0604 if x3-x1<=-1.0\n",
      "   +0.4969 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1539 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2730 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   -0.0247 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.7563 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4605 if c>=1.0 & x1>=1.0\n",
      "   +0.4080 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.1770 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   -0.1340 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0431 if x1>=3.0 & x3-x1>=0.0\n",
      "   +0.3782 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.0902 if x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=1.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.0431 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   -0.5985 if x2<=0.0 & x4-x2>=1.0\n",
      "init state [0 2 2 1 0]\n",
      "(10,) (10,)\n",
      "init state [2 2 0 1 0]\n",
      "(12,) (2,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(31,) (19,)\n",
      "init state [ 1  3  1 -3  0]\n",
      "(54,) (23,)\n",
      "init state [1 2 2 0 0]\n",
      "(77,) (23,)\n",
      "init state [ 2  3 -2 -2  0]\n",
      "(134,) (57,)\n",
      "init state [ 3  1 -2  0  0]\n",
      "(168,) (34,)\n",
      "init state [ 1  3  2 -3  0]\n",
      "(193,) (25,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(208,) (15,)\n",
      "init state [ 2  3  1 -2  0]\n",
      "(217,) (9,)\n",
      "============ 42 ===========\n",
      "Run episode 42 with rewards 33, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.7157 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.1324 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.0031 if c<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.9413 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2953 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.3864 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2383 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4851 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.7240 if x4-x2<=-2.0\n",
      "   -0.4381 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0652 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.0829 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2132 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.2247 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.3343 if x2<=0.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.2308 if x1<=0.0 & x2<=2.0 & x4-x2>=-1.0 & x4-x2>=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   +0.0059 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.5053 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.6593 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0105 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.2931 if x2>=3.0\n",
      "   +0.0442 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.0513 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.4859 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.4732 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.1016 if x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.3479 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.1188 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.0762 if x1<=2.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-3.0\n",
      "   +0.0000 if x2<=1.0 & x3-x1>=3.0\n",
      "   +0.7084 if x2<=0.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.6453 if x2>=1.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.2715 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1251 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1707 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.9404 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.0314 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1768 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.6615 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.2199 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0353 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4040 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1065 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.1933 if x2<=1.0\n",
      "   +0.0768 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.1386 if x3-x1>=0.0 & x4-x2>=1.0 & x4-x2>=2.0\n",
      "   +0.0215 if c<=0.0 & x1<=2.0 & x2<=0.0 & x3-x1<=0.0\n",
      "   -0.5613 if x3-x1>=0.0 & x4-x2>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.0735 if x3-x1<=-1.0\n",
      "   +0.6219 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.4590 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0196 if x1>=1.0 & x2<=2.0 & x3-x1>=-2.0 & x4-x2>=-1.0\n",
      "   +0.1648 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2238 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4812 if c>=1.0 & x1>=1.0\n",
      "   +0.2396 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.3397 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   -0.6129 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1722 if x1>=3.0 & x3-x1>=0.0\n",
      "   +0.0475 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.0959 if x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.2449 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   -0.2041 if x2<=0.0 & x4-x2>=1.0\n",
      "   +0.5173 if x1>=2.0 & x3-x1>=0.0 & x4-x2>=3.0\n",
      "init state [ 3  0 -1  0  0]\n",
      "(9,) (9,)\n",
      "init state [0 0 0 3 0]\n",
      "(40,) (31,)\n",
      "init state [ 0  3  2 -3  0]\n",
      "(78,) (38,)\n",
      "init state [1 1 0 1 0]\n",
      "(84,) (6,)\n",
      "init state [ 2  1 -2  0  0]\n",
      "(98,) (14,)\n",
      "init state [0 0 1 3 0]\n",
      "(114,) (16,)\n",
      "init state [ 1  3 -1 -2  0]\n",
      "(124,) (10,)\n",
      "init state [ 3  0 -2  3  0]\n",
      "(211,) (87,)\n",
      "init state [ 2  1 -2  2  0]\n",
      "(226,) (15,)\n",
      "init state [ 1  2 -1  0  0]\n",
      "(233,) (7,)\n",
      "============ 43 ===========\n",
      "Run episode 43 with rewards 35, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.8215 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.2653 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +1.0062 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0015 if c<=0.0 & x1>=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.0683 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1249 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2458 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.4782 if x4-x2<=-2.0\n",
      "   +0.0139 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0780 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.0994 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3622 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.1074 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.2417 if x2<=0.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.1632 if x1<=0.0 & x2<=2.0 & x4-x2>=-1.0 & x4-x2>=1.0\n",
      "   -0.2116 if x2>=3.0 & x3-x1<=-3.0\n",
      "----------------- 1 --------------\n",
      "   +0.3836 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.2044 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.6715 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0304 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.2934 if x2>=3.0\n",
      "   +0.0176 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.1772 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.1934 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.8132 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.1352 if x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.3492 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.5144 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.0043 if x1<=2.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=-3.0\n",
      "   -0.0954 if x2<=0.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.4690 if x2>=1.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.3844 if c>=1.0 & x1>=3.0 & x3-x1>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.2568 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1379 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3022 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   -0.0871 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.1858 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.2204 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.7727 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.2263 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2891 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4328 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.6198 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.0739 if x2<=1.0\n",
      "   +0.3118 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.3746 if x3-x1>=0.0 & x4-x2>=1.0 & x4-x2>=2.0\n",
      "   -0.0180 if x3-x1>=0.0 & x4-x2>=3.0\n",
      "   +0.3237 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "----------------- 3 --------------\n",
      "   -0.0319 if x3-x1<=-1.0\n",
      "   -0.0674 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.1135 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1139 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.6372 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3893 if c>=1.0 & x1>=1.0\n",
      "   +0.1019 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.2132 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   -0.0000 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.0000 if x1>=3.0 & x3-x1>=0.0\n",
      "   +0.2838 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.0768 if x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.0000 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   +0.0403 if x2<=0.0 & x4-x2>=1.0\n",
      "   -0.0000 if x1>=2.0 & x3-x1>=0.0 & x4-x2>=3.0\n",
      "   +0.6986 if x3-x1<=-3.0 & x4-x2>=0.0\n",
      "init state [ 2  3  1 -2  0]\n",
      "(38,) (38,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(106,) (68,)\n",
      "init state [2 0 1 2 0]\n",
      "(118,) (12,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(135,) (17,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(142,) (7,)\n",
      "init state [ 0  2  1 -1  0]\n",
      "(159,) (17,)\n",
      "init state [ 0  2  0 -1  0]\n",
      "(175,) (16,)\n",
      "init state [ 2  3  1 -3  0]\n",
      "(199,) (24,)\n",
      "init state [ 2  3  1 -2  0]\n",
      "(230,) (31,)\n",
      "init state [ 2  0 -2  0  0]\n",
      "(242,) (12,)\n",
      "============ 44 ===========\n",
      "Run episode 44 with rewards 30, accuracy 0.7\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.8024 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.4361 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0322 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.4304 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1420 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.2152 if x4-x2<=-2.0\n",
      "   +0.1145 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0739 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.2878 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0479 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1220 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x2<=0.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.5436 if x1<=0.0 & x2<=2.0 & x4-x2>=-1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1<=-3.0\n",
      "   +0.6109 if c<=0.0 & x1>=3.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.5943 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1002 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.8268 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2770 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.0729 if x2>=3.0\n",
      "   -0.2143 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.0271 if x2>=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.3146 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.7806 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1871 if x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.2465 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.8028 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.0692 if x2<=0.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.8797 if x2>=1.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.6982 if c>=1.0 & x1>=3.0 & x3-x1>=-2.0\n",
      "   -0.7572 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.0599 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0062 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4097 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.1895 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.2809 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.2552 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2834 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.3403 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0674 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4527 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1677 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2445 if x2<=1.0\n",
      "   +0.0000 if c<=0.0 & x1>=3.0 & x2<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.2588 if x3-x1>=0.0 & x4-x2>=1.0 & x4-x2>=2.0\n",
      "   +0.0000 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.4520 if x2>=3.0 & x3-x1<=0.0 & x4-x2>=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   -0.0345 if x3-x1<=-1.0\n",
      "   -0.4101 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1176 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1228 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1556 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.8504 if c>=1.0 & x1>=1.0\n",
      "   +0.0143 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.3137 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   -0.4238 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.1363 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.3700 if x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.0509 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   +0.2779 if x2<=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1>=2.0 & x3-x1>=0.0 & x4-x2>=3.0\n",
      "   -0.0718 if x3-x1<=-3.0 & x4-x2>=0.0\n",
      "   -0.1984 if x1<=2.0 & x4-x2>=2.0\n",
      "init state [0 0 3 0 0]\n",
      "(31,) (31,)\n",
      "init state [ 1  2  0 -1  0]\n",
      "(49,) (18,)\n",
      "init state [ 2  3 -1 -2  0]\n",
      "(77,) (28,)\n",
      "init state [1 0 1 0 0]\n",
      "(139,) (62,)\n",
      "init state [ 3  1 -1 -1  0]\n",
      "(178,) (39,)\n",
      "init state [ 3  1 -1  1  0]\n",
      "(182,) (4,)\n",
      "init state [ 3  2 -1  0  0]\n",
      "(188,) (6,)\n",
      "init state [ 0  2  0 -1  0]\n",
      "(200,) (12,)\n",
      "init state [2 0 0 2 0]\n",
      "(231,) (31,)\n",
      "init state [0 1 0 2 0]\n",
      "(258,) (27,)\n",
      "============ 45 ===========\n",
      "Run episode 45 with rewards 15, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.8000 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0730 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.9796 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3949 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2978 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.5108 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.0244 if x4-x2<=-2.0\n",
      "   -0.4311 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0771 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.0885 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4503 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.2352 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0571 if x2<=0.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.0472 if x1<=0.0 & x2<=2.0 & x4-x2>=-1.0 & x4-x2>=1.0\n",
      "   +0.5723 if c<=0.0 & x1>=3.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2516 if c<=0.0 & x1<=1.0 & x2>=3.0 & x3-x1<=-1.0\n",
      "----------------- 1 --------------\n",
      "   -0.2021 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.6015 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.3347 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.1398 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.4672 if x2>=3.0\n",
      "   -0.1427 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.5821 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.5889 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.5641 if x2>=3.0 & x3-x1<=-1.0\n",
      "   -0.5785 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   -0.0400 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.3332 if x2<=0.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.0237 if x2>=1.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1517 if c>=1.0 & x1>=3.0 & x3-x1>=-2.0\n",
      "   -0.4404 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +1.1140 if x1<=2.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   -0.0103 if x2<=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0118 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0209 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.4086 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.1528 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1826 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.8262 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.5248 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0393 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5337 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.4040 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2327 if x2<=1.0\n",
      "   -0.2104 if x3-x1>=0.0 & x4-x2>=1.0 & x4-x2>=2.0\n",
      "   +0.1514 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.0966 if x2>=3.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.2566 if x1<=2.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.0157 if x3-x1<=-1.0\n",
      "   +0.2153 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.3005 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4281 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1347 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7850 if c>=1.0 & x1>=1.0\n",
      "   +0.3388 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   -0.2320 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   -0.1502 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.1354 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.1989 if x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.1755 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   -0.1740 if x2<=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if x3-x1<=-3.0 & x4-x2>=0.0\n",
      "   -0.0870 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.0200 if x1>=3.0 & x4-x2>=2.0\n",
      "init state [0 1 1 2 0]\n",
      "(8,) (8,)\n",
      "init state [ 3  0 -2  3  0]\n",
      "(27,) (19,)\n",
      "init state [ 2  3  0 -3  0]\n",
      "(56,) (29,)\n",
      "init state [ 2  3  1 -1  0]\n",
      "(64,) (8,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(85,) (21,)\n",
      "init state [ 2  3 -1  0  0]\n",
      "(90,) (5,)\n",
      "init state [ 0  3  1 -3  0]\n",
      "(106,) (16,)\n",
      "init state [ 2  1 -1  2  0]\n",
      "(122,) (16,)\n",
      "init state [0 1 2 1 0]\n",
      "(142,) (20,)\n",
      "init state [ 3  0 -2  2  0]\n",
      "(149,) (7,)\n",
      "============ 46 ===========\n",
      "Run episode 46 with rewards 35, accuracy 0.8\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.6358 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0014 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.6527 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3595 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2953 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4770 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.7499 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2677 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.0545 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1901 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.5524 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.3600 if x2<=0.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0961 if x1<=0.0 & x2<=2.0 & x4-x2>=-1.0 & x4-x2>=1.0\n",
      "   +0.5120 if c<=0.0 & x1>=3.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x2>=3.0 & x3-x1<=-1.0\n",
      "   -0.3859 if x2>=2.0 & x3-x1<=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.6080 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4857 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.3013 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1602 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.2342 if x2>=3.0\n",
      "   -0.1658 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.5105 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -1.1142 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0995 if x2>=3.0 & x3-x1<=-1.0\n",
      "   -0.4252 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.1398 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.0589 if x2<=0.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0\n",
      "   +0.2813 if c>=1.0 & x1>=3.0 & x3-x1>=-2.0\n",
      "   -0.2356 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.5192 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1412 if x4-x2<=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.0326 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1655 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.3034 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.2251 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0824 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.6377 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -1.1201 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1334 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3420 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1938 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.1728 if x2<=1.0\n",
      "   +0.0028 if x3-x1>=0.0 & x4-x2>=1.0 & x4-x2>=2.0\n",
      "   -0.3470 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.1838 if x2>=3.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.1538 if x1<=2.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.6149 if x2>=3.0 & x3-x1<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.0410 if x3-x1<=-1.0\n",
      "   +0.3652 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.2876 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2493 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4910 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7861 if c>=1.0 & x1>=1.0\n",
      "   +0.2896 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.0406 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   -0.2551 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.1538 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.0459 if x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.2146 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   -0.0051 if x2<=0.0 & x4-x2>=1.0\n",
      "   -0.1934 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.0917 if x1>=3.0 & x4-x2>=2.0\n",
      "   +0.4117 if x1<=0.0 & x2>=1.0 & x4-x2>=2.0\n",
      "init state [1 0 1 0 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(16,) (16,)\n",
      "init state [ 0  2  3 -1  0]\n",
      "(39,) (23,)\n",
      "init state [ 3  2 -3 -2  0]\n",
      "(83,) (44,)\n",
      "init state [2 1 0 2 0]\n",
      "(90,) (7,)\n",
      "init state [ 2  2 -1 -1  0]\n",
      "(132,) (42,)\n",
      "init state [1 2 2 0 0]\n",
      "(150,) (18,)\n",
      "init state [ 3  2 -3 -2  0]\n",
      "(189,) (39,)\n",
      "init state [ 1  3  2 -3  0]\n",
      "(229,) (40,)\n",
      "init state [ 3  2 -2 -1  0]\n",
      "(258,) (29,)\n",
      "init state [ 3  1 -1 -1  0]\n",
      "(281,) (23,)\n",
      "============ 47 ===========\n",
      "Run episode 47 with rewards 19, accuracy 0.8\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.6437 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.1143 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.8999 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5134 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0208 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4830 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.4848 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2133 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.5339 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4760 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.3939 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0000 if x2<=0.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0032 if x1<=0.0 & x2<=2.0 & x4-x2>=-1.0 & x4-x2>=1.0\n",
      "   +0.2362 if c<=0.0 & x1>=3.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0165 if x2>=2.0 & x3-x1<=-2.0\n",
      "   -0.3558 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.5068 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3871 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.6682 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3673 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.1726 if x2>=3.0\n",
      "   -0.0205 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   +0.0107 if x1>=1.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -1.2213 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0838 if x2>=3.0 & x3-x1<=-1.0\n",
      "   -0.0322 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.3613 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.2005 if c>=1.0 & x1>=3.0 & x3-x1>=-2.0\n",
      "   -0.4130 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3692 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0405 if x4-x2<=1.0\n",
      "   +0.6146 if x1>=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.2635 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.6518 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.9369 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0677 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.4103 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3779 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.3789 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0837 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3787 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.2732 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3526 if x2<=1.0\n",
      "   -0.0557 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   -0.0201 if x2>=3.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.2874 if x1<=2.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.1647 if x2>=3.0 & x3-x1<=-2.0\n",
      "   -0.7435 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.0539 if x3-x1<=-1.0\n",
      "   +0.1527 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.0538 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1513 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5667 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.8490 if c>=1.0 & x1>=1.0\n",
      "   +0.1335 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.0028 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   +0.1262 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.2190 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.0539 if x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.2422 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   -0.0755 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.3697 if x1>=3.0 & x4-x2>=2.0\n",
      "   -0.0000 if x1<=0.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.4960 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "init state [ 2  2  1 -2  0]\n",
      "(59,) (59,)\n",
      "init state [ 3  1 -1  1  0]\n",
      "(63,) (4,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(77,) (14,)\n",
      "init state [ 2  1 -1  2  0]\n",
      "(90,) (13,)\n",
      "init state [ 0  3  2 -3  0]\n",
      "(108,) (18,)\n",
      "init state [ 1  3 -1 -3  0]\n",
      "(132,) (24,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(148,) (16,)\n",
      "init state [ 1  2 -1 -2  0]\n",
      "(176,) (28,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(185,) (9,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(199,) (14,)\n",
      "============ 48 ===========\n",
      "Run episode 48 with rewards 28, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.5637 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0878 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.6706 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5653 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0731 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4256 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.7321 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0460 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.3110 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3312 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1389 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x1<=0.0 & x2<=2.0 & x4-x2>=-1.0 & x4-x2>=1.0\n",
      "   +0.2892 if c<=0.0 & x1>=3.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1427 if x2>=2.0 & x3-x1<=-2.0\n",
      "   -0.2864 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.3642 if x3-x1<=-2.0 & x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   -0.1261 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.5729 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.6381 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0278 if c>=1.0 & x1>=2.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.7473 if x2>=3.0\n",
      "   -0.0418 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.8116 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2544 if x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.1617 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   -0.1205 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.2400 if c>=1.0 & x1>=3.0 & x3-x1>=-2.0\n",
      "   -0.4295 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.7460 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2191 if x4-x2<=1.0\n",
      "   +0.2029 if x1>=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0883 if x4-x2<=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.0739 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4418 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.5995 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.2439 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.4216 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1468 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.6675 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0895 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.8757 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0041 if c<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.1463 if x2<=1.0\n",
      "   -0.1583 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.6620 if x1<=2.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   -0.0529 if x2>=3.0 & x3-x1<=-2.0\n",
      "   -0.2665 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.3444 if x1>=3.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.1812 if x3-x1<=-1.0\n",
      "   +0.1620 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.2418 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0769 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.8145 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7838 if c>=1.0 & x1>=1.0\n",
      "   +0.3185 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   -0.3060 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   +0.0000 if x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.5433 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.2000 if x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.3960 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   +0.0342 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.1934 if x1>=3.0 & x4-x2>=2.0\n",
      "   -0.4035 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.1974 if x1<=1.0 & x4-x2>=3.0\n",
      "init state [0 1 1 0 0]\n",
      "(14,) (14,)\n",
      "init state [2 0 1 0 0]\n",
      "(32,) (18,)\n",
      "init state [0 1 1 1 0]\n",
      "(39,) (7,)\n",
      "init state [ 2  2  0 -2  0]\n",
      "(49,) (10,)\n",
      "init state [0 1 2 0 0]\n",
      "(60,) (11,)\n",
      "init state [ 2  3  1 -2  0]\n",
      "(69,) (9,)\n",
      "init state [2 1 0 1 0]\n",
      "(74,) (5,)\n",
      "init state [ 3  2 -2 -2  0]\n",
      "(102,) (28,)\n",
      "init state [ 3  1 -3 -1  0]\n",
      "(117,) (15,)\n",
      "init state [ 1  0 -1  2  0]\n",
      "(136,) (19,)\n",
      "============ 49 ===========\n",
      "Run episode 49 with rewards 23, accuracy 0.8\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.4682 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.0136 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.6447 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.6441 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3137 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2987 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.5242 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0108 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.3656 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4712 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.2263 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0000 if c<=0.0 & x1>=3.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3307 if x2>=2.0 & x3-x1<=-2.0\n",
      "   +0.0895 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.0000 if x3-x1<=-2.0 & x4-x2>=3.0\n",
      "   -0.4815 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   +0.5105 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3267 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.1405 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5960 if x2>=3.0\n",
      "   +0.0830 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.6382 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0805 if x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.3124 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   -0.3738 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.3039 if c>=1.0 & x1>=3.0 & x3-x1>=-2.0\n",
      "   -0.5204 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.4925 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1537 if x4-x2<=1.0\n",
      "   -0.1588 if x1>=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1927 if x4-x2<=2.0\n",
      "   -0.1579 if x4-x2<=-3.0\n",
      "----------------- 2 --------------\n",
      "   -0.1559 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5173 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.4570 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.3176 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.2790 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3104 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.0200 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2818 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.7148 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0589 if x2<=1.0\n",
      "   -0.0353 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.0121 if x1<=2.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.2480 if x2>=3.0 & x3-x1<=-2.0\n",
      "   -0.5100 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.4258 if x1>=3.0 & x4-x2<=-1.0\n",
      "   +0.3541 if x3-x1>=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.2024 if x3-x1<=-1.0\n",
      "   +0.2696 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.3133 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5986 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4836 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4443 if c>=1.0 & x1>=1.0\n",
      "   -0.1387 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.0716 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   -0.0423 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.1889 if x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.0987 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   +0.0336 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.0000 if x1>=3.0 & x4-x2>=2.0\n",
      "   -0.5270 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0000 if x1<=1.0 & x4-x2>=3.0\n",
      "   -0.3081 if x3-x1>=2.0\n",
      "init state [0 0 2 3 0]\n",
      "(16,) (16,)\n",
      "init state [ 0  2  2 -2  0]\n",
      "(56,) (40,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(65,) (9,)\n",
      "init state [1 1 1 2 0]\n",
      "(74,) (9,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(95,) (21,)\n",
      "init state [ 2  3  1 -2  0]\n",
      "(103,) (8,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(125,) (22,)\n",
      "init state [ 2  2  0 -2  0]\n",
      "(131,) (6,)\n",
      "init state [ 1  2  0 -2  0]\n",
      "(141,) (10,)\n",
      "init state [1 1 0 2 0]\n",
      "(149,) (8,)\n",
      "============ 50 ===========\n",
      "Run episode 50 with rewards 34, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.8090 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.1087 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.8730 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1678 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0547 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.6568 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.6220 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1656 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.0836 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3004 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.2963 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.1393 if x2>=2.0 & x3-x1<=-2.0\n",
      "   -0.0183 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.0000 if x3-x1<=-2.0 & x4-x2>=3.0\n",
      "   -0.1549 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1851 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.3160 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4672 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.3239 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0175 if x2>=3.0\n",
      "   -0.2707 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.8610 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2443 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   -0.2104 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.1610 if c>=1.0 & x1>=3.0 & x3-x1>=-2.0\n",
      "   +0.3011 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1711 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0907 if x4-x2<=1.0\n",
      "   +0.4480 if x1>=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2995 if x4-x2<=2.0\n",
      "   +0.0692 if x4-x2<=-3.0\n",
      "   -0.1674 if x1>=1.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.1070 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3678 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.5412 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.1213 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0945 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.6577 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.5652 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1048 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3709 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1805 if x2<=1.0\n",
      "   -0.0801 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1<=-2.0\n",
      "   -0.1957 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   -0.1555 if x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.0141 if x3-x1>=2.0\n",
      "   +1.0761 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   -0.0069 if x3-x1<=-1.0\n",
      "   +0.5363 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.2371 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0137 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0680 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4042 if c>=1.0 & x1>=1.0\n",
      "   -0.1229 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.0000 if x1>=2.0 & x2<=0.0 & x4-x2>=2.0\n",
      "   -0.0191 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.2563 if x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.2718 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   +0.4288 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.0378 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.2354 if x1<=1.0 & x4-x2>=3.0\n",
      "   -0.1562 if x3-x1>=2.0\n",
      "   +0.5404 if c>=1.0 & x1>=3.0\n",
      "init state [ 0  2  1 -2  0]\n",
      "(19,) (19,)\n",
      "init state [ 2  1 -2  1  0]\n",
      "(37,) (18,)\n",
      "init state [1 1 2 1 0]\n",
      "(41,) (4,)\n",
      "init state [1 3 1 0 0]\n",
      "(47,) (6,)\n",
      "init state [2 1 1 0 0]\n",
      "(59,) (12,)\n",
      "init state [ 1  3  1 -1  0]\n",
      "(63,) (4,)\n",
      "init state [0 2 0 1 0]\n",
      "(73,) (10,)\n",
      "init state [ 0  3  3 -1  0]\n",
      "(79,) (6,)\n",
      "init state [ 1  0 -1  0  0]\n",
      "(99,) (20,)\n",
      "init state [ 1  2  1 -2  0]\n",
      "(134,) (35,)\n",
      "============ 51 ===========\n",
      "Run episode 51 with rewards 7, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.5612 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.2166 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.4769 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.6552 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0444 if c<=0.0 & x1>=2.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2182 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.4134 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2740 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.1002 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1855 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.2447 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.2737 if x2>=2.0 & x3-x1<=-2.0\n",
      "   -0.0761 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.0858 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1359 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.2343 if x3-x1<=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.1732 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4735 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.6767 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1460 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.5063 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3430 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   -0.0770 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.0145 if c>=1.0 & x1>=3.0 & x3-x1>=-2.0\n",
      "   +0.1857 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3091 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0175 if x4-x2<=1.0\n",
      "   +0.4603 if x1>=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0444 if x4-x2<=2.0\n",
      "   +0.0574 if x4-x2<=-3.0\n",
      "   +0.2569 if x1>=1.0 & x4-x2>=0.0\n",
      "   +0.5654 if x3-x1>=2.0 & x4-x2>=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.0523 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3229 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.5782 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.1457 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.7275 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3612 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.3352 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.6354 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1909 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0377 if x2<=1.0\n",
      "   -0.0778 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   -0.0076 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2>=-1.0 & x4-x2>=0.0\n",
      "   +0.3040 if x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.1413 if x3-x1>=2.0\n",
      "   +0.4395 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5013 if c<=0.0 & x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.2069 if x3-x1<=-1.0\n",
      "   +0.3405 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.0491 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2206 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2138 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5601 if c>=1.0 & x1>=1.0\n",
      "   -0.1381 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   -0.1868 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.0346 if x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.2591 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   +0.1678 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.0718 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0000 if x1<=1.0 & x4-x2>=3.0\n",
      "   +0.1718 if x3-x1>=2.0\n",
      "   +0.6067 if c>=1.0 & x1>=3.0\n",
      "   +1.1555 if x3-x1<=1.0 & x3-x1>=-1.0 & x3-x1>=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "init state [ 3  1 -2  0  0]\n",
      "(43,) (43,)\n",
      "init state [ 2  0 -1  0  0]\n",
      "(56,) (13,)\n",
      "init state [1 0 1 1 0]\n",
      "(70,) (14,)\n",
      "init state [ 2  3 -2  0  0]\n",
      "(151,) (81,)\n",
      "init state [ 3  0 -2  2  0]\n",
      "(175,) (24,)\n",
      "init state [0 0 2 2 0]\n",
      "(190,) (15,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(193,) (3,)\n",
      "init state [ 3  1 -2 -1  0]\n",
      "(212,) (19,)\n",
      "init state [ 3  1 -1 -1  0]\n",
      "(220,) (8,)\n",
      "init state [ 3  2 -2 -2  0]\n",
      "(248,) (28,)\n",
      "============ 52 ===========\n",
      "Run episode 52 with rewards 14, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.8852 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5087 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.7826 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1213 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.5460 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.2427 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1009 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.2448 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3381 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.2421 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0038 if x2>=2.0 & x3-x1<=-2.0\n",
      "   -0.3177 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.2685 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2415 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.0909 if x3-x1<=0.0\n",
      "   -0.3598 if x1>=3.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.0052 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1796 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.5485 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0702 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.2270 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.1391 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.2028 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.0996 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3804 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2313 if x4-x2<=1.0\n",
      "   +0.0000 if x1>=2.0 & x2>=1.0 & x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2322 if x4-x2<=2.0\n",
      "   +0.1998 if x4-x2<=-3.0\n",
      "   +0.0058 if x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1514 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.7528 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.1745 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4617 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.1485 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0995 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.5579 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.6323 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.1226 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3798 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0007 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1780 if x2<=1.0\n",
      "   +0.5806 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   -0.1888 if x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.0614 if x3-x1>=2.0\n",
      "   +0.3632 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.1751 if c<=0.0 & x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0778 if x4-x2>=3.0\n",
      "----------------- 3 --------------\n",
      "   -0.4989 if x3-x1<=-1.0\n",
      "   +0.2921 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1753 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1810 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0566 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5629 if c>=1.0 & x1>=1.0\n",
      "   -0.1993 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.3710 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.2295 if x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.0755 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   -0.1943 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.1794 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.0405 if x3-x1>=2.0\n",
      "   +1.0789 if c>=1.0 & x1>=3.0\n",
      "   +0.0149 if x3-x1<=1.0 & x3-x1>=-1.0 & x3-x1>=1.0 & x4-x2>=0.0 & x4-x2>=1.0\n",
      "   +0.3482 if x1<=0.0 & x2>=2.0 & x4-x2>=1.0\n",
      "init state [1 1 1 0 0]\n",
      "(12,) (12,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(34,) (22,)\n",
      "init state [ 2  3  1 -2  0]\n",
      "(55,) (21,)\n",
      "init state [0 1 3 0 0]\n",
      "(76,) (21,)\n",
      "init state [1 0 2 0 0]\n",
      "(95,) (19,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(127,) (32,)\n",
      "init state [ 2  2 -2 -1  0]\n",
      "(152,) (25,)\n",
      "init state [2 0 1 0 0]\n",
      "(162,) (10,)\n",
      "init state [ 1  2 -1  1  0]\n",
      "(223,) (61,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(232,) (9,)\n",
      "============ 53 ===========\n",
      "Run episode 53 with rewards 33, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.6888 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.3757 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.6993 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4116 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2279 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1380 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1807 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.0531 if x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2128 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.5674 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.3300 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.1832 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2008 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.2782 if x3-x1<=0.0\n",
      "   -0.1453 if x1>=3.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2517 if x3-x1<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.1221 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3007 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.6040 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1701 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.5564 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0756 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   -0.0465 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.1799 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3736 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5439 if x4-x2<=1.0\n",
      "   +0.2985 if x4-x2<=2.0\n",
      "   +0.0000 if x4-x2<=-3.0\n",
      "   -0.2466 if x1>=1.0 & x4-x2>=0.0\n",
      "   -0.4337 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.4703 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4091 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.3056 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2131 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.1976 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.2154 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.2447 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.7312 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.3950 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0526 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3525 if x2<=1.0\n",
      "   +0.2120 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.6037 if x1>=3.0 & x4-x2<=-1.0\n",
      "   +0.2596 if x3-x1>=2.0\n",
      "   +0.7212 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.1224 if c<=0.0 & x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3087 if x4-x2>=3.0\n",
      "   +0.3688 if x3-x1>=3.0 & x4-x2<=-2.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.2236 if x3-x1<=-1.0\n",
      "   +0.0448 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.0897 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0503 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3699 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5540 if c>=1.0 & x1>=1.0\n",
      "   -0.5342 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   -0.0075 if x1>=1.0 & x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.1543 if x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.2765 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   +0.2584 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.3549 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.5214 if x3-x1>=2.0\n",
      "   +0.5603 if c>=1.0 & x1>=3.0\n",
      "   +0.1040 if x1<=0.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.8833 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "init state [ 3  1 -2 -1  0]\n",
      "(19,) (19,)\n",
      "init state [ 3  0 -1  2  0]\n",
      "(24,) (5,)\n",
      "init state [ 2  3 -1 -1  0]\n",
      "(34,) (10,)\n",
      "init state [ 2  2  1 -1  0]\n",
      "(40,) (6,)\n",
      "init state [1 1 2 0 0]\n",
      "(67,) (27,)\n",
      "init state [ 0  3  0 -3  0]\n",
      "(93,) (26,)\n",
      "init state [1 1 2 1 0]\n",
      "(100,) (7,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(116,) (16,)\n",
      "init state [2 0 1 2 0]\n",
      "(128,) (12,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(140,) (12,)\n",
      "============ 54 ===========\n",
      "Run episode 54 with rewards 30, accuracy 0.1\n",
      "----------------- 0 --------------\n",
      "   -0.5082 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0332 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.4514 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3197 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3345 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.6587 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2006 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.2608 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.2036 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0833 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.1846 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1101 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0174 if x3-x1<=0.0\n",
      "   -0.2299 if x1>=3.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2606 if x3-x1<=1.0\n",
      "   -0.3981 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.0055 if x1<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0347 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.7409 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.2093 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.5325 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1688 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.0947 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.0929 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.5962 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3221 if x4-x2<=1.0\n",
      "   +0.0261 if x4-x2<=2.0\n",
      "   +0.0397 if x1>=1.0 & x4-x2>=0.0\n",
      "   -0.2988 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.3278 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0476 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.6901 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.0599 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0557 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.3218 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0576 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.2192 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3822 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.3728 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.7016 if x2<=1.0\n",
      "   -0.0686 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.1563 if x1>=3.0 & x4-x2<=-1.0\n",
      "   +0.3028 if x3-x1>=2.0\n",
      "   +1.0799 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2255 if c<=0.0 & x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +0.0000 if x3-x1>=3.0 & x4-x2<=-2.0\n",
      "   -0.6599 if x2<=2.0 & x2>=1.0 & x3-x1<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.1860 if x3-x1<=-1.0\n",
      "   +0.4299 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1774 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.6258 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5309 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5275 if c>=1.0 & x1>=1.0\n",
      "   -0.0359 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.1120 if x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.0135 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   +0.1738 if x1<=2.0 & x4-x2>=2.0\n",
      "   +0.1250 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.1764 if x3-x1>=2.0\n",
      "   +0.9332 if c>=1.0 & x1>=3.0\n",
      "   -0.0000 if x1<=0.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.2534 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.4472 if x4-x2>=2.0\n",
      "init state [ 1  3  2 -1  0]\n",
      "(20,) (20,)\n",
      "init state [2 0 1 0 0]\n",
      "(27,) (7,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(39,) (12,)\n",
      "init state [ 2  1 -1 -1  0]\n",
      "(63,) (24,)\n",
      "init state [0 1 1 2 0]\n",
      "(94,) (31,)\n",
      "init state [ 1  3  2 -3  0]\n",
      "(109,) (15,)\n",
      "init state [ 1  1 -1  1  0]\n",
      "(144,) (35,)\n",
      "init state [ 2  3 -2 -1  0]\n",
      "(168,) (24,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(179,) (11,)\n",
      "init state [ 3  2  0 -2  0]\n",
      "(189,) (10,)\n",
      "============ 55 ===========\n",
      "Run episode 55 with rewards 32, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.5217 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.1599 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.3594 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5322 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3155 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.7313 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1383 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.2859 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.3294 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0834 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.1998 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3226 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0937 if x1>=3.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1367 if x3-x1<=1.0\n",
      "   -0.2109 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.2105 if x2<=0.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.3750 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.6977 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0326 if x2>=2.0 & x3-x1<=-2.0 & x4-x2>=-1.0\n",
      "   -0.8077 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.1724 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   -0.1402 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.1514 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1328 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.1105 if x4-x2<=1.0\n",
      "   +0.4565 if x4-x2<=2.0\n",
      "   +0.2612 if x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0714 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.6465 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0938 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.4744 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "   +0.5344 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.0473 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5163 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.1387 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.3081 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0334 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.5129 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.1391 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.3690 if x2<=1.0\n",
      "   -0.0672 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   +0.5598 if x1>=3.0 & x4-x2<=-1.0\n",
      "   +0.4618 if x3-x1>=2.0\n",
      "   +0.6440 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.1147 if c<=0.0 & x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if x3-x1>=3.0 & x4-x2<=-2.0\n",
      "   -0.2507 if x2<=2.0 & x2>=1.0 & x3-x1<=-2.0\n",
      "   +0.5618 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.4956 if x3-x1<=-1.0\n",
      "   +0.7014 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.0691 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.3918 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0738 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3209 if c>=1.0 & x1>=1.0\n",
      "   +0.1017 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.3205 if x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.2083 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   -0.0052 if x1<=2.0 & x4-x2>=2.0\n",
      "   -0.0920 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0857 if x3-x1>=2.0\n",
      "   +0.7804 if c>=1.0 & x1>=3.0\n",
      "   +0.0118 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1669 if x4-x2>=2.0\n",
      "   -0.6331 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "init state [0 0 1 3 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(20,) (20,)\n",
      "init state [ 2  3  1 -3  0]\n",
      "(34,) (14,)\n",
      "init state [1 1 1 0 0]\n",
      "(46,) (12,)\n",
      "init state [ 0  3  3 -2  0]\n",
      "(61,) (15,)\n",
      "init state [ 0  1  0 -1  0]\n",
      "(74,) (13,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(92,) (18,)\n",
      "init state [ 3  1 -2 -1  0]\n",
      "(148,) (56,)\n",
      "init state [2 2 0 1 0]\n",
      "(153,) (5,)\n",
      "init state [1 0 1 1 0]\n",
      "(160,) (7,)\n",
      "init state [ 1  3  1 -1  0]\n",
      "(164,) (4,)\n",
      "============ 56 ===========\n",
      "Run episode 56 with rewards 38, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.3384 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.2065 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.7815 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4326 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1603 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.3365 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1298 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.4723 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.0870 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0360 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.5265 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0603 if x1>=3.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2830 if x3-x1<=1.0\n",
      "   -0.3619 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x2<=0.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=2.0\n",
      "   +0.3198 if c<=0.0 & x2>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.3443 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.3352 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5418 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0649 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   -0.0871 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.0114 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0633 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2524 if x4-x2<=1.0\n",
      "   +0.3791 if x4-x2<=2.0\n",
      "   -0.2246 if x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1694 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3381 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.1637 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "   +0.2295 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.9299 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   -0.2711 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.5267 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.7312 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.3433 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1136 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.8691 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.1848 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2680 if x2<=1.0\n",
      "   -0.0120 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   -0.0018 if x1>=3.0 & x4-x2<=-1.0\n",
      "   -0.1818 if x3-x1>=2.0\n",
      "   +0.5590 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3940 if c<=0.0 & x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1172 if x2<=2.0 & x2>=1.0 & x3-x1<=-2.0\n",
      "   -0.1574 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2078 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3370 if x3-x1<=-1.0\n",
      "   +0.3359 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.3068 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4727 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3106 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5243 if c>=1.0 & x1>=1.0\n",
      "   +0.3911 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.2900 if x2>=3.0 & x4-x2>=-1.0\n",
      "   -0.0555 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   -0.1635 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.0842 if x3-x1>=2.0\n",
      "   +0.5187 if c>=1.0 & x1>=3.0\n",
      "   -0.0889 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0246 if x4-x2>=2.0\n",
      "   -0.3091 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   -0.8604 if c<=0.0 & x1<=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "init state [ 1  3  0 -2  0]\n",
      "(10,) (10,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(25,) (15,)\n",
      "init state [ 3  0 -1  1  0]\n",
      "(30,) (5,)\n",
      "init state [2 1 0 1 0]\n",
      "(39,) (9,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(54,) (15,)\n",
      "init state [0 0 3 1 0]\n",
      "(69,) (15,)\n",
      "init state [ 1  3  1 -1  0]\n",
      "(73,) (4,)\n",
      "init state [2 2 0 1 0]\n",
      "(95,) (22,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(99,) (4,)\n",
      "init state [ 0  1  3 -1  0]\n",
      "(109,) (10,)\n",
      "============ 57 ===========\n",
      "Run episode 57 with rewards 32, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.3143 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.0569 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.5697 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2596 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1718 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.4116 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1350 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.2511 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.0529 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.2505 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2631 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.1255 if x1>=3.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4866 if x3-x1<=1.0\n",
      "   -0.7203 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if c<=0.0 & x2>=1.0 & x3-x1<=-3.0 & x4-x2<=-1.0\n",
      "   -0.0577 if x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.4100 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.6577 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6332 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1230 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   -0.0675 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.3144 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.4895 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3867 if x4-x2<=1.0\n",
      "   +0.2883 if x4-x2<=2.0\n",
      "   -0.4973 if x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1960 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1020 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.2091 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "   -0.4423 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.4126 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   +0.0527 if x2<=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.3083 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3738 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.6900 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.2601 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.4998 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1329 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.7072 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2594 if x2<=1.0\n",
      "   +0.0909 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   -0.4112 if x3-x1>=2.0\n",
      "   +0.2821 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.0402 if c<=0.0 & x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0105 if x2<=2.0 & x2>=1.0 & x3-x1<=-2.0\n",
      "   -0.3696 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1687 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1256 if x2<=1.0 & x3-x1<=-3.0\n",
      "----------------- 3 --------------\n",
      "   +0.4336 if x3-x1<=-1.0\n",
      "   +0.8194 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.2376 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2218 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.8384 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5922 if c>=1.0 & x1>=1.0\n",
      "   -0.3048 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.0726 if x2>=3.0 & x4-x2>=-1.0\n",
      "   +0.1569 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   +0.3018 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.3877 if x3-x1>=2.0\n",
      "   +0.6612 if c>=1.0 & x1>=3.0\n",
      "   -0.1147 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0749 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   -0.3265 if c<=0.0 & x1<=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1187 if x1>=2.0 & x4-x2<=2.0\n",
      "init state [1 0 1 0 0]\n",
      "(6,) (6,)\n",
      "init state [2 2 1 0 0]\n",
      "(8,) (2,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(20,) (12,)\n",
      "init state [1 0 1 3 0]\n",
      "(34,) (14,)\n",
      "init state [ 0  2  3 -1  0]\n",
      "(51,) (17,)\n",
      "init state [ 1  3  2 -3  0]\n",
      "(78,) (27,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(83,) (5,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(116,) (33,)\n",
      "init state [ 0  3  0 -2  0]\n",
      "(130,) (14,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(142,) (12,)\n",
      "============ 58 ===========\n",
      "Run episode 58 with rewards 30, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.4196 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.0304 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.3683 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4727 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.4348 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.2192 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2568 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.2813 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.0931 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0304 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3003 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0680 if x1>=3.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1993 if x3-x1<=1.0\n",
      "   -0.2573 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1154 if x4-x2>=3.0\n",
      "   +0.3788 if x1>=3.0 & x2>=3.0 & x4-x2>=-2.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   +0.2056 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.6475 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5537 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2252 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.0419 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.0221 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2435 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3465 if x4-x2<=1.0\n",
      "   +0.1981 if x4-x2<=2.0\n",
      "   -0.1729 if x1>=1.0 & x4-x2>=0.0\n",
      "   +0.4850 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2939 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.2816 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "   -0.4513 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.5931 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   -0.4100 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.0951 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2464 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.8153 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.4457 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.2777 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1517 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   -0.1403 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.4681 if x2<=1.0\n",
      "   -0.0219 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   -0.2155 if x3-x1>=2.0\n",
      "   +0.0090 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.7302 if c<=0.0 & x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0655 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1315 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x2<=1.0 & x3-x1<=-3.0\n",
      "   +0.1510 if c<=0.0 & x4-x2>=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.1206 if x3-x1<=-1.0\n",
      "   +0.6510 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.0132 if c<=0.0 & x1<=2.0 & x1>=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1286 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5286 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4559 if c>=1.0 & x1>=1.0\n",
      "   -0.0430 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.0215 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   -0.3564 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.1628 if x3-x1>=2.0\n",
      "   +0.3505 if c>=1.0 & x1>=3.0\n",
      "   -0.1584 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2340 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   -0.3754 if c<=0.0 & x1<=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.3098 if x1>=2.0 & x4-x2<=2.0\n",
      "   +0.6639 if x1>=3.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "init state [1 1 2 1 0]\n",
      "(20,) (20,)\n",
      "init state [0 0 2 1 0]\n",
      "(28,) (8,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(45,) (17,)\n",
      "init state [ 2  3  1 -3  0]\n",
      "(59,) (14,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(68,) (9,)\n",
      "init state [ 1  1  1 -1  0]\n",
      "(83,) (15,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(99,) (16,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(117,) (18,)\n",
      "init state [1 1 2 0 0]\n",
      "(131,) (14,)\n",
      "init state [ 2  1 -2  0  0]\n",
      "(219,) (88,)\n",
      "============ 59 ===========\n",
      "Run episode 59 with rewards -46, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.5667 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.0000 if c<=0.0 & x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.6594 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5229 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.6019 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.3000 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.4164 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.4947 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1118 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.3467 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.1726 if x1>=3.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2672 if x3-x1<=1.0\n",
      "   -0.5042 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0000 if x4-x2>=3.0\n",
      "   +0.0851 if x1>=3.0 & x2>=3.0 & x4-x2>=-2.0\n",
      "   -0.2095 if x1>=3.0 & x4-x2<=-3.0\n",
      "----------------- 1 --------------\n",
      "   +0.1135 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.6021 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.9945 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2571 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.0693 if x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.2940 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2001 if x4-x2<=1.0\n",
      "   +0.1636 if x4-x2<=2.0\n",
      "   +0.1370 if x1>=1.0 & x4-x2>=0.0\n",
      "   +0.5553 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3452 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.3053 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "   -0.4063 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.7416 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   -0.1711 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2121 if x1<=0.0 & x4-x2<=-1.0 & x4-x2<=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.0458 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3610 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.8559 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.2598 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3335 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0852 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.0287 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2650 if x2<=1.0\n",
      "   +0.0000 if x3-x1<=-1.0 & x4-x2>=2.0\n",
      "   -0.4710 if x3-x1>=2.0\n",
      "   +0.0042 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.7763 if c<=0.0 & x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2734 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0072 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.0529 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.5366 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2<=-3.0\n",
      "----------------- 3 --------------\n",
      "   -0.6670 if x3-x1<=-1.0\n",
      "   +0.4396 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.0036 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1927 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.6454 if c>=1.0 & x1>=1.0\n",
      "   -0.3141 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.6093 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   -0.5938 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0975 if x3-x1>=2.0\n",
      "   +0.7093 if c>=1.0 & x1>=3.0\n",
      "   -0.4443 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.4112 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   -0.6333 if c<=0.0 & x1<=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1758 if x1>=2.0 & x4-x2<=2.0\n",
      "   -0.1067 if x1>=3.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.3964 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "init state [ 2  0 -1  0  0]\n",
      "(9,) (9,)\n",
      "init state [0 2 3 0 0]\n",
      "(13,) (4,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(42,) (29,)\n",
      "init state [1 3 1 0 0]\n",
      "(44,) (2,)\n",
      "init state [ 1  3  1 -1  0]\n",
      "(49,) (5,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(76,) (27,)\n",
      "init state [ 3  0 -2  3  0]\n",
      "(99,) (23,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(107,) (8,)\n",
      "init state [ 1  0 -1  3  0]\n",
      "(279,) (172,)\n",
      "init state [ 1  0 -1  0  0]\n",
      "(302,) (23,)\n",
      "============ 60 ===========\n",
      "Run episode 60 with rewards 19, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.0079 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.9768 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4460 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.6091 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1291 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.3053 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.3272 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.0038 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1327 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0420 if x1>=3.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.7063 if x3-x1<=1.0\n",
      "   +0.2186 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -1.0904 if x4-x2>=3.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0 & x4-x2>=-2.0\n",
      "   -0.0542 if x1>=3.0 & x4-x2<=-3.0\n",
      "   +0.5577 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.0854 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.7656 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5006 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.1357 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.1398 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2127 if x4-x2<=1.0\n",
      "   -0.0562 if x4-x2<=2.0\n",
      "   +0.4453 if x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1279 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.8069 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.0520 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "   -0.2861 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.2129 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   -0.0946 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1<=0.0 & x4-x2<=-1.0 & x4-x2<=-2.0\n",
      "   -0.4382 if x2>=3.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.0000 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.4995 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.4847 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.3473 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.3891 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.9322 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.8547 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2168 if x2<=1.0\n",
      "   -0.1256 if x3-x1>=2.0\n",
      "   +0.0835 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.9183 if c<=0.0 & x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1062 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0000 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +2.0184 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.0798 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2<=-3.0\n",
      "   +1.1043 if x2<=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +1.0453 if x3-x1<=-1.0\n",
      "   +0.0917 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +2.4081 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0210 if c>=1.0 & x1>=1.0\n",
      "   +0.6814 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.3465 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   -0.4702 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.1499 if x3-x1>=2.0\n",
      "   +0.5410 if c>=1.0 & x1>=3.0\n",
      "   +0.2850 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.4151 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.0226 if c<=0.0 & x1<=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.2973 if x1>=2.0 & x4-x2<=2.0\n",
      "   +0.0143 if x1>=3.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.4302 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -1.0667 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "init state [ 1  3  2 -3  0]\n",
      "(14,) (14,)\n",
      "init state [ 3  1 -1  2  0]\n",
      "(26,) (12,)\n",
      "init state [ 0  3  1 -3  0]\n",
      "(74,) (48,)\n",
      "init state [ 0  3  3 -2  0]\n",
      "(88,) (14,)\n",
      "init state [0 1 1 0 0]\n",
      "(96,) (8,)\n",
      "init state [1 1 1 0 0]\n",
      "(100,) (4,)\n",
      "init state [0 0 2 1 0]\n",
      "(119,) (19,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(146,) (27,)\n",
      "init state [ 3  2 -3  0  0]\n",
      "(193,) (47,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(200,) (7,)\n",
      "============ 61 ===========\n",
      "Run episode 61 with rewards 35, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.5679 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.7181 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3329 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3732 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.4990 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1012 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.2273 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.0920 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0046 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.7141 if x1>=3.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1823 if x3-x1<=1.0\n",
      "   -0.5463 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0075 if x4-x2>=3.0\n",
      "   -0.0779 if x1>=3.0 & x4-x2<=-3.0\n",
      "   -0.2361 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2142 if x3-x1>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.1451 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.3523 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.8419 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.1567 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.5636 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0875 if x4-x2<=1.0\n",
      "   +0.0249 if x4-x2<=2.0\n",
      "   -0.4256 if x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1581 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3512 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.0391 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "   -0.4067 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.3227 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   +0.2957 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1>=1.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.6106 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.1707 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3384 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.6136 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.2684 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.0800 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0596 if x2>=1.0 & x3-x1<=0.0 & x4-x2>=0.0\n",
      "   +0.5610 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4666 if x2<=1.0\n",
      "   -0.2373 if x3-x1>=2.0\n",
      "   +0.0775 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3720 if c<=0.0 & x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1282 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3445 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.0619 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2<=-3.0\n",
      "   +0.3336 if x2<=0.0\n",
      "   -0.6144 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.3317 if x3-x1<=-1.0\n",
      "   +0.6509 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +1.1442 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7938 if c>=1.0 & x1>=1.0\n",
      "   -0.1522 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   -0.0582 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   -0.3868 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.0274 if x3-x1>=2.0\n",
      "   +0.3323 if c>=1.0 & x1>=3.0\n",
      "   -0.1257 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.4820 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.1790 if c<=0.0 & x1<=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.0023 if x1>=2.0 & x4-x2<=2.0\n",
      "   -0.0159 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0891 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +1.0278 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "init state [0 0 3 2 0]\n",
      "(7,) (7,)\n",
      "init state [ 2  2 -1 -2  0]\n",
      "(42,) (35,)\n",
      "init state [0 0 2 1 0]\n",
      "(57,) (15,)\n",
      "init state [0 1 1 2 0]\n",
      "(63,) (6,)\n",
      "init state [0 0 0 3 0]\n",
      "(74,) (11,)\n",
      "init state [ 3  1 -1  0  0]\n",
      "(84,) (10,)\n",
      "init state [ 0  3  3 -2  0]\n",
      "(110,) (26,)\n",
      "init state [0 0 0 3 0]\n",
      "(126,) (16,)\n",
      "init state [3 1 0 1 0]\n",
      "(135,) (9,)\n",
      "init state [ 2  2  0 -1  0]\n",
      "(146,) (11,)\n",
      "============ 62 ===========\n",
      "Run episode 62 with rewards 31, accuracy 0.8\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.2264 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.6848 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0265 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3563 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.5126 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1199 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.4106 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.0942 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0084 if x1>=3.0 & x3-x1<=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0994 if x3-x1<=1.0\n",
      "   -0.8122 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.3823 if x4-x2>=3.0\n",
      "   -0.0511 if x1>=3.0 & x4-x2<=-3.0\n",
      "   -0.0242 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0449 if x3-x1>=3.0\n",
      "   -0.2375 if x2>=2.0 & x3-x1<=-2.0\n",
      "----------------- 1 --------------\n",
      "   +0.4485 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.5795 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3872 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1954 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.5032 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0354 if x4-x2<=1.0\n",
      "   -0.0302 if x4-x2<=2.0\n",
      "   -0.3140 if x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1004 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.8231 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.3580 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "   +0.1119 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.2047 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   +0.2231 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2209 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.4034 if x3-x1>=3.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.0231 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.1475 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.6569 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.2472 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3123 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1885 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3659 if x2<=1.0\n",
      "   -0.2747 if x3-x1>=2.0\n",
      "   +0.6182 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.2864 if c<=0.0 & x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1285 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0015 if c<=0.0 & x4-x2>=2.0\n",
      "   +0.0119 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2<=-3.0\n",
      "   +0.3949 if x2<=0.0\n",
      "   -0.5943 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.9033 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   -0.1631 if x3-x1<=-1.0\n",
      "   +0.4715 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.9200 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4749 if c>=1.0 & x1>=1.0\n",
      "   +0.1944 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.4029 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   -0.3167 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   -0.0667 if x3-x1>=2.0\n",
      "   +0.6385 if c>=1.0 & x1>=3.0\n",
      "   -0.2011 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.4283 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.4505 if c<=0.0 & x1<=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.3536 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.1940 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +1.0232 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +1.0302 if x1<=1.0 & x2<=1.0 & x2>=1.0\n",
      "init state [ 0  3  1 -2  0]\n",
      "(10,) (10,)\n",
      "init state [1 1 2 0 0]\n",
      "(21,) (11,)\n",
      "init state [2 0 0 1 0]\n",
      "(28,) (7,)\n",
      "init state [0 2 1 1 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(36,) (8,)\n",
      "init state [ 1  2 -1  1  0]\n",
      "(60,) (24,)\n",
      "init state [ 1  3  0 -3  0]\n",
      "(138,) (78,)\n",
      "init state [ 1  2 -1 -1  0]\n",
      "(192,) (54,)\n",
      "init state [ 2  0 -2  1  0]\n",
      "(235,) (43,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(251,) (16,)\n",
      "init state [ 2  1 -1 -1  0]\n",
      "(267,) (16,)\n",
      "============ 63 ===========\n",
      "Run episode 63 with rewards 26, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.6769 if c>=1.0 & x3-x1<=1.0\n",
      "   +1.1629 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2830 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1080 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.0075 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.3232 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.0915 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1368 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.2198 if x3-x1<=1.0\n",
      "   -0.4705 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0146 if x4-x2>=3.0\n",
      "   -0.2370 if x1>=3.0 & x4-x2<=-3.0\n",
      "   +0.8254 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0614 if x3-x1>=3.0\n",
      "   -0.7906 if x2>=2.0 & x3-x1<=-2.0\n",
      "   +0.0021 if x3-x1<=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.1907 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.6220 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -1.2265 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0271 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.6618 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0117 if x4-x2<=1.0\n",
      "   -0.2295 if x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0169 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.8131 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.0673 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "   +0.5590 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.1951 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   +0.2086 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2852 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.0000 if x3-x1>=3.0 & x4-x2>=2.0\n",
      "   +0.3244 if x3-x1>=3.0\n",
      "----------------- 2 --------------\n",
      "   -0.2447 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3951 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.4889 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.1050 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.3819 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3243 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0725 if x2<=1.0\n",
      "   +0.0635 if x3-x1>=2.0\n",
      "   +0.5674 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.0347 if c<=0.0 & x2<=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3481 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.6089 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2<=-3.0\n",
      "   +0.2579 if x2<=0.0\n",
      "   -0.1446 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.1799 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.1244 if x3-x1>=3.0\n",
      "----------------- 3 --------------\n",
      "   -0.2350 if x3-x1<=-1.0\n",
      "   -0.4735 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.5125 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.6151 if c>=1.0 & x1>=1.0\n",
      "   +0.2640 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.5203 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   -0.4316 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.8833 if c>=1.0 & x1>=3.0\n",
      "   +0.1561 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1955 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.0902 if c<=0.0 & x1<=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.6882 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.1412 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.2413 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.3719 if x1<=1.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.9441 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "init state [0 0 0 3 0]\n",
      "(8,) (8,)\n",
      "init state [0 0 3 1 0]\n",
      "(30,) (22,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(44,) (14,)\n",
      "init state [1 0 0 3 0]\n",
      "(78,) (34,)\n",
      "init state [ 2  3 -2 -1  0]\n",
      "(119,) (41,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(130,) (11,)\n",
      "init state [1 0 2 0 0]\n",
      "(146,) (16,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(153,) (7,)\n",
      "init state [ 1  2  1 -2  0]\n",
      "(174,) (21,)\n",
      "init state [1 0 0 2 0]\n",
      "(180,) (6,)\n",
      "============ 64 ===========\n",
      "Run episode 64 with rewards 36, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.3315 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.9588 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2448 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2682 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.0761 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.3367 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.0033 if x2<=1.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.4979 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1516 if x3-x1<=1.0\n",
      "   -0.0213 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0554 if x4-x2>=3.0\n",
      "   -0.1764 if x1>=3.0 & x4-x2<=-3.0\n",
      "   +0.0906 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.1825 if x3-x1>=3.0\n",
      "   +0.0733 if x2>=2.0 & x3-x1<=-2.0\n",
      "   -0.4218 if x4-x2<=1.0\n",
      "----------------- 1 --------------\n",
      "   +0.2055 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.9776 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4489 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.1412 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.4103 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4600 if x4-x2<=1.0\n",
      "   -0.0775 if x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1379 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0613 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.1127 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "   +0.4513 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.0101 if x1>=2.0 & x3-x1>=1.0 & x4-x2>=-2.0\n",
      "   +0.6132 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1322 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.5997 if x3-x1>=3.0\n",
      "   -0.1652 if x3-x1<=-2.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.1092 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2710 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.4410 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.5462 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0570 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3143 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0993 if x2<=1.0\n",
      "   +0.0965 if x3-x1>=2.0\n",
      "   +0.4827 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.3143 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0813 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2<=-3.0\n",
      "   +0.0076 if x2<=0.0\n",
      "   -0.1277 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.2119 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.2551 if x3-x1>=3.0\n",
      "   -0.2987 if x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   -0.0281 if x3-x1<=-1.0\n",
      "   -0.3443 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +1.3317 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7395 if c>=1.0 & x1>=1.0\n",
      "   +0.0256 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.2814 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   +0.0057 if x1<=2.0 & x2>=2.0 & x3-x1<=2.0\n",
      "   +0.6451 if c>=1.0 & x1>=3.0\n",
      "   -0.2582 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0471 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.3553 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.3311 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.2827 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.2013 if x1<=1.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.5809 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.6008 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "init state [ 0  2  0 -1  0]\n",
      "(8,) (8,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(47,) (39,)\n",
      "init state [1 1 1 1 0]\n",
      "(70,) (23,)\n",
      "init state [ 0  3  3 -2  0]\n",
      "(93,) (23,)\n",
      "init state [1 0 2 2 0]\n",
      "(106,) (13,)\n",
      "init state [1 1 1 1 0]\n",
      "(118,) (12,)\n",
      "init state [0 2 2 0 0]\n",
      "(140,) (22,)\n",
      "init state [ 3  2 -3 -2  0]\n",
      "(162,) (22,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(171,) (9,)\n",
      "init state [ 3  1 -3  0  0]\n",
      "(192,) (21,)\n",
      "============ 65 ===========\n",
      "Run episode 65 with rewards 21, accuracy 0.9\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.4613 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4848 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0004 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.5902 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.0166 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.3940 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.5844 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.4431 if x3-x1<=1.0\n",
      "   +0.1260 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +0.0379 if x1>=3.0 & x4-x2<=-3.0\n",
      "   -0.1229 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0981 if x3-x1>=3.0\n",
      "   +0.0721 if x2>=2.0 & x3-x1<=-2.0\n",
      "   -0.1025 if x4-x2<=1.0\n",
      "   -0.3625 if x3-x1<=0.0 & x4-x2<=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   +0.0280 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.5975 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.8786 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.1665 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.6842 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2441 if x4-x2<=1.0\n",
      "   -0.2999 if x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0232 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1218 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.0304 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "   -0.2062 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.4606 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2035 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.3007 if x3-x1>=3.0\n",
      "   +0.0000 if x3-x1<=-2.0 & x4-x2>=1.0\n",
      "   +0.9794 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.1366 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3424 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.5853 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.1676 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3463 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1660 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2715 if x2<=1.0\n",
      "   +0.2665 if x3-x1>=2.0\n",
      "   +0.6004 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.1318 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0224 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1<=1.0 & x4-x2<=-1.0 & x4-x2<=-3.0\n",
      "   -0.2470 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.3995 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.1576 if x3-x1>=3.0\n",
      "   -0.2470 if x4-x2>=0.0\n",
      "   -0.4973 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.1993 if x3-x1<=-1.0\n",
      "   +0.2244 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.6488 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5178 if c>=1.0 & x1>=1.0\n",
      "   +0.6851 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.1051 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   +0.4962 if c>=1.0 & x1>=3.0\n",
      "   -0.5085 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1468 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.5582 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.2927 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.2425 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   -0.0213 if x1<=1.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.4441 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0651 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.7908 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "init state [0 1 1 1 0]\n",
      "(14,) (14,)\n",
      "init state [0 0 2 1 0]\n",
      "(47,) (33,)\n",
      "init state [ 2  1 -2  1  0]\n",
      "(72,) (25,)\n",
      "init state [ 0  3  0 -1  0]\n",
      "(81,) (9,)\n",
      "init state [ 2  1 -1  2  0]\n",
      "(92,) (11,)\n",
      "init state [ 3  2  0 -2  0]\n",
      "(122,) (30,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(173,) (51,)\n",
      "init state [ 3  1 -1  0  0]\n",
      "(181,) (8,)\n",
      "init state [0 0 2 0 0]\n",
      "(206,) (25,)\n",
      "init state [ 3  2 -3  0  0]\n",
      "(232,) (26,)\n",
      "============ 66 ===========\n",
      "Run episode 66 with rewards 16, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.9177 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0553 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1967 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3556 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.2657 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0001 if x1<=1.0 & x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.4673 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0358 if x3-x1<=1.0\n",
      "   +0.3556 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0229 if x1>=3.0 & x4-x2<=-3.0\n",
      "   +0.4190 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.0299 if x3-x1>=3.0\n",
      "   +0.1509 if x2>=2.0 & x3-x1<=-2.0\n",
      "   +0.1868 if x4-x2<=1.0\n",
      "   +0.5973 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.7565 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.1891 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.5405 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.7296 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.4306 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.2406 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1584 if x4-x2<=1.0\n",
      "   -0.2109 if x1>=1.0 & x4-x2>=0.0\n",
      "   +0.3544 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0691 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.2108 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "   +0.5960 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.6510 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3459 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.0178 if x3-x1>=3.0\n",
      "   +0.2263 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2966 if c>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   -0.2426 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.3726 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.3149 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0665 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0621 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2502 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.4920 if x2<=1.0\n",
      "   +0.1691 if x3-x1>=2.0\n",
      "   -0.0521 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2310 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.4422 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0240 if x3-x1>=3.0\n",
      "   -0.2815 if x4-x2>=0.0\n",
      "   -0.3438 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3933 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.7565 if x3-x1<=-1.0\n",
      "   +0.1570 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.4085 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4333 if c>=1.0 & x1>=1.0\n",
      "   +0.5217 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.0507 if x1>=3.0 & x2<=2.0 & x3-x1>=0.0\n",
      "   +0.6021 if c>=1.0 & x1>=3.0\n",
      "   -0.1268 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1496 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.3456 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.1190 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.3325 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.4854 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.1783 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1906 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.6442 if x1<=2.0 & x2>=3.0 & x3-x1<=1.0\n",
      "init state [ 3  1 -2  0  0]\n",
      "(7,) (7,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(16,) (9,)\n",
      "init state [0 1 0 1 0]\n",
      "(32,) (16,)\n",
      "init state [ 3  1 -1  0  0]\n",
      "(55,) (23,)\n",
      "init state [ 1  0 -1  2  0]\n",
      "(77,) (22,)\n",
      "init state [ 1  1 -1  2  0]\n",
      "(87,) (10,)\n",
      "init state [ 0  3  3 -1  0]\n",
      "(112,) (25,)\n",
      "init state [0 2 0 1 0]\n",
      "(124,) (12,)\n",
      "init state [ 1  2  2 -2  0]\n",
      "(152,) (28,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(170,) (18,)\n",
      "============ 67 ===========\n",
      "Run episode 67 with rewards 24, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.5346 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.3429 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1171 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.7237 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.4047 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.8544 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0465 if x3-x1<=1.0\n",
      "   +0.1751 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x1>=3.0 & x4-x2<=-3.0\n",
      "   +0.1915 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.3579 if x3-x1>=3.0\n",
      "   -0.2029 if x2>=2.0 & x3-x1<=-2.0\n",
      "   +0.1884 if x4-x2<=1.0\n",
      "   +0.4556 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.6443 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.8704 if c<=0.0 & x2<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.3941 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.6743 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5865 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.3945 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.4021 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1359 if x4-x2<=1.0\n",
      "   +0.0526 if x1>=1.0 & x4-x2>=0.0\n",
      "   +0.6951 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4048 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.0988 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "   +0.3395 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.5732 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2128 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   +0.0617 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4606 if c>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3987 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.1274 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0391 if c>=1.0 & x1>=1.0 & x2<=2.0 & x4-x2<=-1.0\n",
      "   +0.3420 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.3433 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.3212 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2306 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1014 if x2<=1.0\n",
      "   -0.0406 if x3-x1>=2.0\n",
      "   +0.1618 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4434 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.0706 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0605 if x3-x1>=3.0\n",
      "   -0.4434 if x4-x2>=0.0\n",
      "   -0.4549 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1504 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   -0.2088 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.6931 if x3-x1<=-1.0\n",
      "   +0.1293 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.4258 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4870 if c>=1.0 & x1>=1.0\n",
      "   +0.2052 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.8009 if c>=1.0 & x1>=3.0\n",
      "   -0.2124 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3302 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.4369 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.2509 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.5491 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   -0.0467 if c<=0.0 & x2<=1.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.4963 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3181 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.5557 if x1<=2.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.2863 if x2>=2.0 & x3-x1>=3.0\n",
      "init state [0 2 2 1 0]\n",
      "(9,) (9,)\n",
      "init state [ 0  2  0 -1  0]\n",
      "(15,) (6,)\n",
      "init state [2 0 1 2 0]\n",
      "(20,) (5,)\n",
      "init state [ 0  1  0 -1  0]\n",
      "(31,) (11,)\n",
      "init state [ 2  0 -1  1  0]\n",
      "(37,) (6,)\n",
      "init state [ 1  2  0 -2  0]\n",
      "(60,) (23,)\n",
      "init state [ 0  2  3 -1  0]\n",
      "(106,) (46,)\n",
      "init state [1 0 1 1 0]\n",
      "(113,) (7,)\n",
      "init state [ 3  2 -2 -1  0]\n",
      "(123,) (10,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(144,) (21,)\n",
      "============ 68 ===========\n",
      "Run episode 68 with rewards 21, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.3567 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4718 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2209 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.7613 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.2902 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.4443 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0702 if x3-x1<=1.0\n",
      "   +0.2538 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0032 if c<=0.0 & x1>=2.0 & x2<=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0611 if x3-x1>=3.0\n",
      "   -0.1931 if x2>=2.0 & x3-x1<=-2.0\n",
      "   +0.0184 if x4-x2<=1.0\n",
      "   +0.0726 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.4622 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.4209 if c<=0.0 & x2<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.8678 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.0251 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.5044 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6074 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0893 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.6923 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3142 if x4-x2<=1.0\n",
      "   +0.4444 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2995 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.0486 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "   -0.1764 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.5170 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c>=1.0 & x1<=2.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0\n",
      "   -0.3430 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0640 if c>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2887 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.2209 if x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.1857 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.5097 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.4497 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.1316 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0686 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1410 if x2<=1.0\n",
      "   +0.0203 if x3-x1>=2.0\n",
      "   +0.3067 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2977 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +0.0136 if c<=0.0 & x1<=2.0 & x2>=1.0 & x3-x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1960 if x3-x1>=3.0\n",
      "   -0.2977 if x4-x2>=0.0\n",
      "   -0.1366 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1260 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   -0.4959 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.4117 if x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.5435 if x3-x1<=-1.0\n",
      "   -0.1683 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.2169 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3720 if c>=1.0 & x1>=1.0\n",
      "   -0.1480 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.9214 if c>=1.0 & x1>=3.0\n",
      "   -0.4855 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1032 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.7011 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.3010 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.4285 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   -0.2387 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1179 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1534 if x1<=2.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.0856 if x2>=2.0 & x3-x1>=3.0\n",
      "   -0.6860 if x1<=0.0\n",
      "init state [ 0  3  1 -3  0]\n",
      "(32,) (32,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(60,) (28,)\n",
      "init state [ 1  3  2 -3  0]\n",
      "(85,) (25,)\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(127,) (42,)\n",
      "init state [ 1  3  1 -2  0]\n",
      "(139,) (12,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(196,) (57,)\n",
      "init state [ 2  2  0 -1  0]\n",
      "(204,) (8,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(218,) (14,)\n",
      "init state [2 2 0 1 0]\n",
      "(223,) (5,)\n",
      "init state [ 3  1 -2  2  0]\n",
      "(230,) (7,)\n",
      "============ 69 ===========\n",
      "Run episode 69 with rewards 35, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.8266 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.7384 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1195 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.5941 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.4012 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.6444 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.4018 if x3-x1<=1.0\n",
      "   -0.0335 if x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0734 if x3-x1>=3.0\n",
      "   +0.2386 if x2>=2.0 & x3-x1<=-2.0\n",
      "   +0.1036 if x4-x2<=1.0\n",
      "   +0.1884 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.4148 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.1463 if c<=0.0 & x2<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1128 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.6030 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.3105 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.4823 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6554 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.1891 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.2290 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2755 if x4-x2<=1.0\n",
      "   +0.1498 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1322 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.0098 if c<=0.0 & x1>=3.0 & x2<=2.0 & x4-x2>=-1.0\n",
      "   +0.2180 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.3842 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0583 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1237 if c>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0409 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.0317 if x4-x2>=2.0\n",
      "   +0.4172 if c>=1.0 & x3-x1<=-3.0\n",
      "----------------- 2 --------------\n",
      "   -0.0195 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.4701 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.2382 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   +0.2176 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0745 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1764 if x2<=1.0\n",
      "   +0.4808 if x3-x1>=2.0\n",
      "   +0.3159 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3535 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.0073 if x3-x1>=3.0\n",
      "   -0.3535 if x4-x2>=0.0\n",
      "   -0.0587 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2131 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   -0.3445 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.5823 if x4-x2<=-1.0\n",
      "   -0.1622 if x2<=0.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   -0.0303 if x3-x1<=-1.0\n",
      "   +0.8464 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.5541 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.6224 if c>=1.0 & x1>=1.0\n",
      "   -0.6240 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.5435 if c>=1.0 & x1>=3.0\n",
      "   -0.1290 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2388 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.4598 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0807 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.3603 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.0702 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2493 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.3278 if x1<=2.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.3384 if x1<=0.0\n",
      "   -0.0714 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(19,) (19,)\n",
      "init state [ 2  2  1 -1  0]\n",
      "(33,) (14,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(56,) (23,)\n",
      "init state [ 3  1 -1  1  0]\n",
      "(64,) (8,)\n",
      "init state [ 3  1 -3 -1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(87,) (23,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(93,) (6,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(109,) (16,)\n",
      "init state [0 0 1 0 0]\n",
      "(115,) (6,)\n",
      "init state [ 3  0 -2  3  0]\n",
      "(125,) (10,)\n",
      "init state [ 2  3  0 -3  0]\n",
      "(135,) (10,)\n",
      "============ 70 ===========\n",
      "Run episode 70 with rewards 32, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.4501 if c>=1.0 & x3-x1<=1.0\n",
      "   +1.2551 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2175 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2309 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.3451 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.4784 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1086 if x3-x1<=1.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   +0.2497 if x2>=2.0 & x3-x1<=-2.0\n",
      "   -0.1515 if x4-x2<=1.0\n",
      "   +0.2442 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.1700 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.0998 if c<=0.0 & x2<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0609 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.0671 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.0971 if x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.1023 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.3270 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.8379 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.2104 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.6968 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.1249 if x4-x2<=1.0\n",
      "   +0.3620 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2028 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.1235 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.4971 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1523 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0545 if c>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1861 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.0467 if x4-x2>=2.0\n",
      "   -0.1172 if c>=1.0 & x3-x1<=-3.0\n",
      "   +0.2643 if c<=0.0 & x4-x2<=-3.0\n",
      "----------------- 2 --------------\n",
      "   -0.0230 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.3833 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0635 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0344 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3035 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.3410 if x2<=1.0\n",
      "   +0.0000 if x3-x1>=2.0\n",
      "   +0.8210 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3189 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3718 if x4-x2>=0.0\n",
      "   -0.1932 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0085 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   -0.2842 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.6220 if x4-x2<=-1.0\n",
      "   -0.0633 if x2<=0.0 & x4-x2>=1.0\n",
      "   -0.3450 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4865 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.3412 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5670 if c>=1.0 & x1>=1.0\n",
      "   +0.1025 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.9126 if c>=1.0 & x1>=3.0\n",
      "   -0.0473 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0946 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.7538 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.0931 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.2496 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   -0.2437 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3944 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0207 if x1<=2.0 & x2>=3.0 & x3-x1<=1.0\n",
      "   -0.1382 if x1<=0.0\n",
      "   +0.1955 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.3600 if x3-x1<=-2.0 & x4-x2>=2.0\n",
      "init state [ 0  3  3 -2  0]\n",
      "(21,) (21,)\n",
      "init state [ 1  3 -1 -1  0]\n",
      "(32,) (11,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(43,) (11,)\n",
      "init state [2 2 1 0 0]\n",
      "(49,) (6,)\n",
      "init state [ 1  1 -1  0  0]\n",
      "(56,) (7,)\n",
      "init state [ 3  0 -2  1  0]\n",
      "(65,) (9,)\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(78,) (13,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(88,) (10,)\n",
      "init state [ 3  0 -1  3  0]\n",
      "(93,) (5,)\n",
      "init state [ 2  2 -2  1  0]\n",
      "(107,) (14,)\n",
      "============ 71 ===========\n",
      "Run episode 71 with rewards 28, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.5486 if c>=1.0 & x3-x1<=1.0\n",
      "   +1.1853 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4262 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.5201 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.4243 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0559 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.1256 if x3-x1<=1.0\n",
      "   -0.0154 if x2>=2.0 & x3-x1<=-2.0\n",
      "   -0.2473 if x4-x2<=1.0\n",
      "   +0.1789 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.0946 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.2686 if c<=0.0 & x2<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0814 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.0752 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.1677 if x4-x2>=3.0\n",
      "   -0.1610 if x2<=2.0 & x3-x1>=2.0\n",
      "----------------- 1 --------------\n",
      "   +0.1416 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.3701 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2574 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0117 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.3542 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2182 if x4-x2<=1.0\n",
      "   +0.0038 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1922 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.2866 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.4753 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4303 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3087 if c>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2601 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.0848 if c>=1.0 & x3-x1<=-3.0\n",
      "   +0.0000 if c<=0.0 & x4-x2<=-3.0\n",
      "   -0.4961 if x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.0107 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.2737 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.1331 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.1843 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4769 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2139 if x2<=1.0\n",
      "   +0.3945 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2841 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3918 if x4-x2>=0.0\n",
      "   -0.1368 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3171 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   -0.0040 if c>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.6364 if x4-x2<=-1.0\n",
      "   -0.2461 if x2<=0.0 & x4-x2>=1.0\n",
      "   -0.2144 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.7587 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.6576 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.5544 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5662 if c>=1.0 & x1>=1.0\n",
      "   +0.1534 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.6677 if c>=1.0 & x1>=3.0\n",
      "   -0.4094 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0137 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.3831 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.3083 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.1767 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.0371 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1709 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0277 if x1<=0.0\n",
      "   +0.2486 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x3-x1<=-2.0 & x4-x2>=2.0\n",
      "   +0.2594 if x4-x2>=3.0\n",
      "init state [ 1  2  2 -2  0]\n",
      "(22,) (22,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(34,) (12,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(41,) (7,)\n",
      "init state [1 1 1 1 0]\n",
      "(45,) (4,)\n",
      "init state [ 2  2 -1 -2  0]\n",
      "(57,) (12,)\n",
      "init state [0 1 2 2 0]\n",
      "(65,) (8,)\n",
      "init state [ 3  0 -2  0  0]\n",
      "(96,) (31,)\n",
      "init state [1 1 0 2 0]\n",
      "(103,) (7,)\n",
      "init state [0 0 2 0 0]\n",
      "(117,) (14,)\n",
      "init state [ 1  3  1 -1  0]\n",
      "(121,) (4,)\n",
      "============ 72 ===========\n",
      "Run episode 72 with rewards 38, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.4485 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.7181 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.6427 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3123 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1501 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0997 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.2025 if x3-x1<=1.0\n",
      "   -0.1980 if x4-x2<=1.0\n",
      "   +0.3584 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.1344 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.1125 if c<=0.0 & x2<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1225 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.1871 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   -0.1633 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.2962 if x1>=3.0 & x4-x2>=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   +0.1582 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.4678 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4576 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0253 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.6130 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2145 if x4-x2<=1.0\n",
      "   +0.0339 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4847 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.1038 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.0412 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2836 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0177 if c>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1590 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.0000 if c>=1.0 & x3-x1<=-3.0\n",
      "   -0.0524 if x4-x2>=-1.0\n",
      "   -0.3482 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.0138 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.4599 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.1660 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.2798 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2182 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0882 if x2<=1.0\n",
      "   +0.4502 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5798 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.5798 if x4-x2>=0.0\n",
      "   -0.3542 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0277 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   +0.5439 if x4-x2<=-1.0\n",
      "   +0.0000 if x2<=0.0 & x4-x2>=1.0\n",
      "   -0.0764 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.3731 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0871 if x3-x1<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3218 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.1717 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5482 if c>=1.0 & x1>=1.0\n",
      "   -0.0765 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.5866 if c>=1.0 & x1>=3.0\n",
      "   -0.1321 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1729 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.3983 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.1251 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.3772 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.2531 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2152 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0319 if x1<=0.0\n",
      "   +0.0438 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   -0.1931 if x3-x1>=1.0 & x3-x1>=2.0 & x4-x2>=2.0\n",
      "init state [ 1  3 -1 -2  0]\n",
      "(12,) (12,)\n",
      "init state [ 1  2 -1 -1  0]\n",
      "(53,) (41,)\n",
      "init state [ 0  3  1 -3  0]\n",
      "(72,) (19,)\n",
      "init state [ 3  1 -3  2  0]\n",
      "(101,) (29,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(117,) (16,)\n",
      "init state [ 3  1 -2 -1  0]\n",
      "(135,) (18,)\n",
      "init state [0 0 2 2 0]\n",
      "(144,) (9,)\n",
      "init state [ 1  0 -1  1  0]\n",
      "(170,) (26,)\n",
      "init state [ 2  3  1 -2  0]\n",
      "(176,) (6,)\n",
      "init state [0 2 1 0 0]\n",
      "(184,) (8,)\n",
      "============ 73 ===========\n",
      "Run episode 73 with rewards 34, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.5104 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.7334 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1516 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2976 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.2642 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.3024 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.2673 if x3-x1<=1.0\n",
      "   -0.4230 if x4-x2<=1.0\n",
      "   +0.2949 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.4175 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.4313 if c<=0.0 & x2<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2362 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.1441 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.1376 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.0157 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.2804 if x3-x1<=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.2465 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.5996 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.9666 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.4557 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.2987 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.0447 if x4-x2<=1.0\n",
      "   +0.3134 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3099 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.2402 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.4920 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1469 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2309 if c>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3198 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.4440 if x4-x2>=-1.0\n",
      "   -0.0376 if c<=0.0 & x1<=0.0 & x1<=1.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.2600 if x1<=2.0 & x2<=2.0 & x3-x1>=2.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.1262 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.3031 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0699 if c<=0.0 & x2<=0.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.0854 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0964 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2506 if x2<=1.0\n",
      "   +0.7199 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5005 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.5005 if x4-x2>=0.0\n",
      "   -0.4136 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4275 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   +0.3432 if x4-x2<=-1.0\n",
      "   -0.3285 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.4625 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.0816 if x3-x1<=1.0\n",
      "   +0.1386 if x3-x1<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.0000 if x1<=2.0 & x1>=2.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.2073 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3671 if c>=1.0 & x1>=1.0\n",
      "   -0.1437 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.5147 if c>=1.0 & x1>=3.0\n",
      "   -0.1712 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0650 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.4935 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.2116 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.1071 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.7125 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2011 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3699 if x1<=0.0\n",
      "   +0.4608 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1071 if x3-x1>=1.0 & x3-x1>=2.0 & x4-x2>=2.0\n",
      "   +0.0396 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "init state [2 1 1 1 0]\n",
      "(5,) (5,)\n",
      "init state [ 2  3 -1 -1  0]\n",
      "(16,) (11,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(37,) (21,)\n",
      "init state [2 1 0 2 0]\n",
      "(47,) (10,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(58,) (11,)\n",
      "init state [ 3  1  0 -1  0]\n",
      "(71,) (13,)\n",
      "init state [ 1  2  0 -2  0]\n",
      "(86,) (15,)\n",
      "init state [0 0 3 0 0]\n",
      "(103,) (17,)\n",
      "init state [ 3  0 -1  0  0]\n",
      "(110,) (7,)\n",
      "init state [1 3 1 0 0]\n",
      "(127,) (17,)\n",
      "============ 74 ===========\n",
      "Run episode 74 with rewards 25, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.3813 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4126 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4037 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1593 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1126 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1459 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1041 if x3-x1<=1.0\n",
      "   -0.4231 if x4-x2<=1.0\n",
      "   -0.0451 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.3029 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.2714 if c<=0.0 & x2<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3435 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.2028 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.0201 if x2<=2.0 & x3-x1>=2.0\n",
      "   +0.2318 if x3-x1<=0.0\n",
      "   -0.2666 if c<=0.0 & x1>=2.0 & x1>=3.0 & x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.1538 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.6177 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5251 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1442 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.3721 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1370 if x4-x2<=1.0\n",
      "   -0.1542 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2064 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.3224 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.4823 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1727 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0205 if c>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3910 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.1168 if x4-x2>=-1.0\n",
      "   +0.0000 if x1<=2.0 & x2<=2.0 & x3-x1>=2.0 & x4-x2>=2.0\n",
      "   -0.5156 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.2255 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.3622 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.4861 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0963 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.4155 if x2<=1.0\n",
      "   +0.6974 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3275 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3275 if x4-x2>=0.0\n",
      "   -0.2018 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0090 if x2<=2.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=2.0\n",
      "   +0.0727 if x4-x2<=-1.0\n",
      "   -0.0661 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.4474 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0773 if x3-x1<=1.0\n",
      "   -0.0797 if x3-x1<=0.0\n",
      "   +0.3606 if x2>=2.0 & x3-x1<=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.0474 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4078 if c>=1.0 & x1>=1.0\n",
      "   +0.0229 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.8025 if c>=1.0 & x1>=3.0\n",
      "   -0.5201 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1483 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.5113 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.4572 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.1199 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.0950 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2376 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1749 if x1<=0.0\n",
      "   +0.2498 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x3-x1>=1.0 & x3-x1>=2.0 & x4-x2>=2.0\n",
      "   +0.2321 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6174 if x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(42,) (42,)\n",
      "init state [0 1 0 2 0]\n",
      "(49,) (7,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(71,) (22,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(121,) (50,)\n",
      "init state [0 1 2 2 0]\n",
      "(140,) (19,)\n",
      "init state [0 0 1 3 0]\n",
      "(152,) (12,)\n",
      "init state [ 1  1  1 -1  0]\n",
      "(168,) (16,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(190,) (22,)\n",
      "init state [0 1 3 1 0]\n",
      "(205,) (15,)\n",
      "init state [ 2  1 -1  1  0]\n",
      "(212,) (7,)\n",
      "============ 75 ===========\n",
      "Run episode 75 with rewards 35, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.6093 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.9590 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4303 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.5111 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.2133 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.4275 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0405 if x3-x1<=1.0\n",
      "   -0.4407 if x4-x2<=1.0\n",
      "   -0.1568 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.2737 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.0273 if c<=0.0 & x2<=1.0 & x2>=1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1472 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.0321 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.1225 if x3-x1<=0.0\n",
      "   -0.1296 if c<=0.0 & x1>=2.0 & x1>=3.0 & x2>=1.0\n",
      "   -0.4019 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   +0.0050 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.5865 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5709 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.3209 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.1633 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0610 if x4-x2<=1.0\n",
      "   -0.2317 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2655 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.5592 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.5630 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2801 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0585 if c>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.7994 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.1133 if x4-x2>=-1.0\n",
      "   -0.3409 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -1.0650 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.1535 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.1869 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.1475 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1876 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.4416 if x2<=1.0\n",
      "   +0.8842 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5014 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.5449 if x4-x2>=0.0\n",
      "   -0.2543 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2442 if x4-x2<=-1.0\n",
      "   +0.2136 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.7790 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1971 if x3-x1<=1.0\n",
      "   -0.0996 if x3-x1<=0.0\n",
      "   +0.2062 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.3914 if x2>=2.0 & x3-x1>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.3664 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2196 if c>=1.0 & x1>=1.0\n",
      "   +0.0701 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.5147 if c>=1.0 & x1>=3.0\n",
      "   -0.5634 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3932 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.5763 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.3073 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.2886 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.3438 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1471 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3079 if x1<=0.0\n",
      "   +0.5297 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3349 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.7602 if x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1927 if x4-x2>=3.0\n",
      "init state [ 3  0 -1  2  0]\n",
      "(5,) (5,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(11,) (6,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(41,) (30,)\n",
      "init state [2 0 1 1 0]\n",
      "(53,) (12,)\n",
      "init state [0 2 2 0 0]\n",
      "(57,) (4,)\n",
      "init state [ 3  1 -1  1  0]\n",
      "(63,) (6,)\n",
      "init state [1 0 1 3 0]\n",
      "(70,) (7,)\n",
      "init state [0 0 0 1 0]\n",
      "(78,) (8,)\n",
      "init state [2 1 0 1 0]\n",
      "(81,) (3,)\n",
      "init state [ 1  2  0 -2  0]\n",
      "(94,) (13,)\n",
      "============ 76 ===========\n",
      "Run episode 76 with rewards 29, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.4330 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4714 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3576 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.4466 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.4704 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1110 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1192 if x3-x1<=1.0\n",
      "   -0.4612 if x4-x2<=1.0\n",
      "   -0.2794 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   +0.2530 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.1438 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.4419 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.1979 if x3-x1<=0.0\n",
      "   +0.0458 if c<=0.0 & x1>=2.0 & x1>=3.0 & x2>=1.0\n",
      "   +0.1675 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.2392 if x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.9232 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5234 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.3293 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.3545 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1115 if x4-x2<=1.0\n",
      "   -0.2369 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.6271 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.3249 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.3838 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.4834 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1076 if c>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.4567 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.0500 if x4-x2>=-1.0\n",
      "   -0.0613 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.0896 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2<=0.0\n",
      "   +0.8547 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.1649 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.0820 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0487 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1909 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.4381 if x2<=1.0\n",
      "   +0.5303 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4452 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.6026 if x4-x2>=0.0\n",
      "   -0.3724 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3580 if x4-x2<=-1.0\n",
      "   +0.0823 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.7513 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.2169 if x3-x1<=1.0\n",
      "   +0.2213 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.0000 if x2>=2.0 & x3-x1>=3.0\n",
      "   -0.0804 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.8387 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4891 if c>=1.0 & x1>=1.0\n",
      "   +0.5288 if c>=1.0 & x1>=3.0\n",
      "   -0.3189 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0833 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.5078 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.3376 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0244 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.0430 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0418 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0381 if x1<=0.0\n",
      "   +0.2403 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0945 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.5644 if x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2926 if x4-x2>=3.0\n",
      "   -0.2772 if x1>=3.0 & x4-x2>=2.0\n",
      "init state [0 2 2 0 0]\n",
      "(6,) (6,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(28,) (22,)\n",
      "init state [1 0 1 3 0]\n",
      "(34,) (6,)\n",
      "init state [2 0 0 1 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(43,) (9,)\n",
      "init state [ 3  2 -3 -2  0]\n",
      "(120,) (77,)\n",
      "init state [0 0 3 2 0]\n",
      "(126,) (6,)\n",
      "init state [2 0 1 0 0]\n",
      "(136,) (10,)\n",
      "init state [ 2  0 -1  2  0]\n",
      "(144,) (8,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(179,) (35,)\n",
      "init state [1 0 1 0 0]\n",
      "(184,) (5,)\n",
      "============ 77 ===========\n",
      "Run episode 77 with rewards 37, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.6616 if c>=1.0 & x3-x1<=1.0\n",
      "   +1.0773 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0992 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.6558 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1257 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.2694 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0130 if x3-x1<=1.0\n",
      "   +0.0929 if x4-x2<=1.0\n",
      "   +0.0994 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.3071 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.2659 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.0835 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.1134 if x3-x1<=0.0\n",
      "   -0.2519 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1043 if x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0 & x4-x2>=2.0\n",
      "   -0.5565 if c<=0.0 & x2>=3.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.7108 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -1.0293 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.2551 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.4532 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5163 if x4-x2<=1.0\n",
      "   +0.0302 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4070 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.0641 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.0842 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3654 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0067 if c>=1.0 & x3-x1<=-1.0 & x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1054 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.0577 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.3349 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2<=0.0\n",
      "   +0.7735 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.3671 if x3-x1>=3.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.3523 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   -0.2859 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0658 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1062 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.4955 if x2<=1.0\n",
      "   +0.4390 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4528 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.5176 if x4-x2>=0.0\n",
      "   -0.3939 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2527 if x4-x2<=-1.0\n",
      "   -0.2188 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.7780 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1444 if x3-x1<=1.0\n",
      "   +0.2407 if x2>=2.0 & x3-x1<=1.0\n",
      "   -0.0315 if x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.6390 if x3-x1<=-3.0\n",
      "----------------- 3 --------------\n",
      "   +0.9629 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.8999 if c>=1.0 & x1>=1.0\n",
      "   +0.7785 if c>=1.0 & x1>=3.0\n",
      "   -0.1516 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1453 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.3876 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   +0.6998 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0917 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1998 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1089 if x1<=0.0\n",
      "   -0.1987 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0727 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0670 if x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0934 if x4-x2>=3.0\n",
      "   -0.0000 if x1>=3.0 & x4-x2>=2.0\n",
      "   +0.6955 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "init state [0 0 1 2 0]\n",
      "(8,) (8,)\n",
      "init state [2 0 0 1 0]\n",
      "(12,) (4,)\n",
      "init state [2 1 1 1 0]\n",
      "(15,) (3,)\n",
      "init state [0 0 1 2 0]\n",
      "(30,) (15,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(38,) (8,)\n",
      "init state [ 2  3 -1 -2  0]\n",
      "(49,) (11,)\n",
      "init state [ 0  3  0 -2  0]\n",
      "(69,) (20,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(74,) (5,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(106,) (32,)\n",
      "init state [0 0 3 2 0]\n",
      "(114,) (8,)\n",
      "============ 78 ===========\n",
      "Run episode 78 with rewards 34, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.3626 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5932 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0772 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.4440 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1219 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.4560 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.0637 if x4-x2<=1.0\n",
      "   +0.1166 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.0332 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.1677 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.2624 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0456 if x3-x1<=0.0\n",
      "   +0.1722 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1849 if x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0 & x4-x2>=2.0\n",
      "   -0.0109 if c<=0.0 & x2>=3.0 & x4-x2>=0.0\n",
      "   +0.8049 if x1<=2.0 & x1>=2.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.8019 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.7286 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.3236 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.5351 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1498 if x4-x2<=1.0\n",
      "   -0.0708 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5080 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.3420 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.0487 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1166 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0879 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.0000 if x2>=2.0 & x3-x1<=1.0 & x4-x2>=1.0\n",
      "   -0.4206 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2<=0.0\n",
      "   +0.1012 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.1878 if x3-x1>=3.0 & x4-x2>=2.0\n",
      "   +0.3535 if x3-x1>=3.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.1041 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0349 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0946 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0864 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.3677 if x2<=1.0\n",
      "   +0.4878 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4500 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4500 if x4-x2>=0.0\n",
      "   -0.3652 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0455 if x4-x2<=-1.0\n",
      "   -0.1010 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.5474 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.2804 if x3-x1<=1.0\n",
      "   -0.0200 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.0000 if x3-x1<=-3.0\n",
      "   +0.3143 if x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.7170 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7961 if c>=1.0 & x1>=1.0\n",
      "   +0.4733 if c>=1.0 & x1>=3.0\n",
      "   -0.3069 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0245 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.2890 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0199 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.1018 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0532 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0239 if x1<=0.0\n",
      "   +0.3539 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2190 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3128 if x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +0.3263 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.6341 if x3-x1>=3.0 & x4-x2>=1.0\n",
      "init state [0 0 2 3 0]\n",
      "(9,) (9,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(22,) (13,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(38,) (16,)\n",
      "init state [ 1  2  1 -1  0]\n",
      "(53,) (15,)\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(80,) (27,)\n",
      "init state [ 0  2  0 -1  0]\n",
      "(94,) (14,)\n",
      "init state [ 2  0 -2  1  0]\n",
      "(109,) (15,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(126,) (17,)\n",
      "init state [ 0  3  1 -1  0]\n",
      "(135,) (9,)\n",
      "init state [ 1  3 -1 -1  0]\n",
      "(145,) (10,)\n",
      "============ 79 ===========\n",
      "Run episode 79 with rewards 32, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.4451 if c>=1.0 & x3-x1<=1.0\n",
      "   +1.0218 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2520 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0277 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1186 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.3997 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.2785 if x4-x2<=1.0\n",
      "   +0.1202 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.1681 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.0487 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.2167 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0275 if x3-x1<=0.0\n",
      "   +0.3257 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1662 if x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0 & x4-x2>=2.0\n",
      "   -0.0112 if x1<=2.0 & x1>=2.0 & x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   +0.6310 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   -0.3194 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.8999 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.4061 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.2363 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.0339 if x4-x2<=1.0\n",
      "   +0.0159 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.6640 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.4316 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.1442 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1275 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.6184 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.0165 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2<=0.0\n",
      "   -0.1524 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0000 if x3-x1>=3.0 & x4-x2>=2.0\n",
      "   +0.0000 if x3-x1>=3.0 & x4-x2<=0.0\n",
      "   -0.2119 if x3-x1<=0.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.2647 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.1111 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.1414 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1876 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   -0.0207 if x2<=1.0\n",
      "   +0.5835 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4480 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4547 if x4-x2>=0.0\n",
      "   -0.2819 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1888 if x4-x2<=-1.0\n",
      "   -0.0261 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.1330 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0388 if x3-x1<=1.0\n",
      "   -0.2453 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.1797 if x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.2810 if x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.0394 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5194 if c>=1.0 & x1>=1.0\n",
      "   +0.4111 if c>=1.0 & x1>=3.0\n",
      "   -0.2526 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0140 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.4111 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.6965 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1919 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0026 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1083 if x1<=0.0\n",
      "   +0.6235 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0091 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3168 if x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1430 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.0000 if x3-x1>=3.0 & x4-x2>=1.0\n",
      "   +0.6066 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "init state [ 0  2  0 -2  0]\n",
      "(36,) (36,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(47,) (11,)\n",
      "init state [ 1  1 -1  0  0]\n",
      "(53,) (6,)\n",
      "init state [ 2  3 -2 -2  0]\n",
      "(70,) (17,)\n",
      "init state [1 1 0 2 0]\n",
      "(76,) (6,)\n",
      "init state [ 3  1 -2  0  0]\n",
      "(82,) (6,)\n",
      "init state [0 1 2 0 0]\n",
      "(89,) (7,)\n",
      "init state [ 0  2  2 -2  0]\n",
      "(101,) (12,)\n",
      "init state [ 2  2 -1 -1  0]\n",
      "(113,) (12,)\n",
      "init state [0 2 1 0 0]\n",
      "(119,) (6,)\n",
      "============ 80 ===========\n",
      "Run episode 80 with rewards 36, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.5928 if c>=1.0 & x3-x1<=1.0\n",
      "   +1.0277 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1871 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.5158 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.8201 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.2015 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.2006 if x4-x2<=1.0\n",
      "   +0.1368 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.0443 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.1028 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.4592 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0960 if x3-x1<=0.0\n",
      "   +0.3928 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.0407 if x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=1.0 & x4-x2>=2.0\n",
      "   +0.1439 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0867 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.4570 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.7110 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0753 if x1<=2.0 & x2<=2.0 & x2>=2.0 & x3-x1<=-1.0\n",
      "   +0.4735 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3656 if x4-x2<=1.0\n",
      "   -0.4197 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.8806 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.4356 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.2847 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1181 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3496 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.5392 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2<=0.0\n",
      "   +0.1835 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1395 if x3-x1>=3.0 & x4-x2<=0.0\n",
      "   -0.5157 if x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1847 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.2030 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.0821 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.1163 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1828 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.9021 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4424 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4424 if x4-x2>=0.0\n",
      "   -0.4044 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0300 if x4-x2<=-1.0\n",
      "   -0.2656 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.4077 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1656 if x3-x1<=1.0\n",
      "   +0.2696 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.1278 if x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.0200 if x4-x2<=-2.0\n",
      "   -0.2061 if x1<=1.0 & x2<=1.0 & x3-x1>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.3593 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.6956 if c>=1.0 & x1>=1.0\n",
      "   +0.5031 if c>=1.0 & x1>=3.0\n",
      "   -0.4391 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3305 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.2932 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.4949 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0437 if x1>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1964 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1663 if x1<=0.0\n",
      "   +0.1691 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0653 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3060 if x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2747 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.2747 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.4035 if c>=1.0 & x2>=3.0\n",
      "init state [0 0 1 1 0]\n",
      "(19,) (19,)\n",
      "init state [ 1  0 -1  3  0]\n",
      "(44,) (25,)\n",
      "init state [ 3  1 -2  2  0]\n",
      "(57,) (13,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(77,) (20,)\n",
      "init state [ 3  0 -2  0  0]\n",
      "(85,) (8,)\n",
      "init state [0 0 1 1 0]\n",
      "(93,) (8,)\n",
      "init state [ 1  3  1 -2  0]\n",
      "(100,) (7,)\n",
      "init state [ 0  3  1 -1  0]\n",
      "(107,) (7,)\n",
      "init state [ 2  3 -2  0  0]\n",
      "(116,) (9,)\n",
      "init state [2 0 1 1 0]\n",
      "(120,) (4,)\n",
      "============ 81 ===========\n",
      "Run episode 81 with rewards 38, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.1447 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.7143 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4001 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3420 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.4269 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1495 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1862 if x4-x2<=1.0\n",
      "   +0.1377 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.3487 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.0511 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.0164 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.3143 if x3-x1<=0.0\n",
      "   +0.0546 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.3278 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1<=0.0 & x3-x1>=2.0 & x4-x2<=-2.0\n",
      "   +0.1684 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.5709 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3094 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.5114 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2081 if x4-x2<=1.0\n",
      "   -0.0974 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.6884 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.1157 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.1408 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2523 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0005 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.0690 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2<=0.0\n",
      "   +0.4189 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.0000 if x3-x1>=3.0 & x4-x2<=0.0\n",
      "   -0.4463 if x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0952 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.3509 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "----------------- 2 --------------\n",
      "   -0.2187 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.3748 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.2221 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1596 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.6281 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5043 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4772 if x4-x2>=0.0\n",
      "   -0.4067 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2822 if x4-x2<=-1.0\n",
      "   -0.1054 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.6281 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1571 if x3-x1<=1.0\n",
      "   +0.1108 if x2>=2.0 & x3-x1<=1.0\n",
      "   -0.0792 if x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   -0.0224 if x1<=1.0 & x2<=1.0 & x3-x1>=0.0\n",
      "   -0.1601 if x1>=1.0 & x4-x2<=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.3647 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7955 if c>=1.0 & x1>=1.0\n",
      "   +0.5774 if c>=1.0 & x1>=3.0\n",
      "   -0.3054 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0278 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.1845 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.0925 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0048 if x1>=1.0 & x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.2464 if x1<=0.0\n",
      "   -0.1742 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0596 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3736 if x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2045 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.1405 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.2113 if c>=1.0 & x2>=3.0\n",
      "   -0.3068 if x1<=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "init state [ 2  3 -1  0  0]\n",
      "(9,) (9,)\n",
      "init state [ 2  2 -2  0  0]\n",
      "(27,) (18,)\n",
      "init state [1 1 0 2 0]\n",
      "(53,) (26,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(71,) (18,)\n",
      "init state [ 3  0 -1  0  0]\n",
      "(78,) (7,)\n",
      "init state [1 1 2 1 0]\n",
      "(82,) (4,)\n",
      "init state [ 1  3 -1 -3  0]\n",
      "(142,) (60,)\n",
      "init state [ 3  0 -2  3  0]\n",
      "(159,) (17,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(164,) (5,)\n",
      "init state [0 0 2 3 0]\n",
      "(172,) (8,)\n",
      "============ 82 ===========\n",
      "Run episode 82 with rewards 34, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.4974 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5443 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2997 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.5849 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.3740 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.2448 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.1463 if x4-x2<=1.0\n",
      "   +0.2463 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.4187 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.1395 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.2941 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   -0.0650 if x3-x1<=0.0\n",
      "   -0.0547 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.3803 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1065 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.3253 if x3-x1<=-3.0\n",
      "----------------- 1 --------------\n",
      "   -0.7362 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3199 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.4685 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3168 if x4-x2<=1.0\n",
      "   -0.2156 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.7810 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.0193 if x1<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.1744 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1081 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0981 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.3462 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2<=0.0\n",
      "   +0.0975 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.4207 if x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0769 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.4862 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2268 if x3-x1>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.1536 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.4425 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.1743 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.4250 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.6640 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3991 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.2317 if x4-x2>=0.0\n",
      "   -0.1835 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1490 if x4-x2<=-1.0\n",
      "   -0.2942 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.4118 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.4234 if x3-x1<=1.0\n",
      "   +0.1486 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.0670 if x2<=2.0 & x2>=2.0 & x4-x2>=-1.0\n",
      "   +0.1167 if x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.4843 if x2<=1.0 & x3-x1>=2.0 & x4-x2>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.8104 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.6401 if c>=1.0 & x1>=1.0\n",
      "   +0.4127 if c>=1.0 & x1>=3.0\n",
      "   -0.2007 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2942 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.1949 if c>=1.0 & x1>=3.0 & x3-x1<=-1.0 & x4-x2<=0.0\n",
      "   -0.3212 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.3015 if x1<=0.0\n",
      "   +0.6943 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2016 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2671 if x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3955 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.3761 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.3274 if c>=1.0 & x2>=3.0\n",
      "   -0.3483 if x1<=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.3107 if x2>=2.0 & x3-x1>=1.0\n",
      "init state [0 1 2 2 0]\n",
      "(5,) (5,)\n",
      "init state [ 3  0 -1  3  0]\n",
      "(13,) (8,)\n",
      "init state [ 2  3  0 -3  0]\n",
      "(22,) (9,)\n",
      "init state [0 1 1 0 0]\n",
      "(54,) (32,)\n",
      "init state [ 0  3  2 -2  0]\n",
      "(63,) (9,)\n",
      "init state [ 2  2 -1 -1  0]\n",
      "(74,) (11,)\n",
      "init state [ 3  1 -2 -1  0]\n",
      "(98,) (24,)\n",
      "init state [ 2  1  0 -1  0]\n",
      "(105,) (7,)\n",
      "init state [ 2  3 -2 -1  0]\n",
      "(120,) (15,)\n",
      "init state [ 3  0 -1  3  0]\n",
      "(129,) (9,)\n",
      "============ 83 ===========\n",
      "Run episode 83 with rewards 33, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.5694 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0924 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2364 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.4216 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.3305 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1182 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1180 if x4-x2<=1.0\n",
      "   +0.1167 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.4543 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.0491 if c<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.1459 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.4375 if x3-x1<=0.0\n",
      "   -0.2402 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1410 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0792 if x3-x1<=-3.0\n",
      "   -0.7410 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.4545 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.7501 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2564 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1724 if x4-x2<=1.0\n",
      "   +0.0817 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2712 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.2347 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0710 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4637 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.2256 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2<=0.0\n",
      "   +0.3556 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.4187 if x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0549 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.5100 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2096 if x3-x1>=2.0\n",
      "   +0.8886 if x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.0980 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.2767 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0987 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0746 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2150 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.7569 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3008 if x4-x2>=0.0\n",
      "   -0.3990 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3360 if x4-x2<=-1.0\n",
      "   -0.7121 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.1339 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0444 if x3-x1<=1.0\n",
      "   +0.4767 if x2>=2.0 & x3-x1<=1.0\n",
      "   -0.0505 if x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.0000 if x2<=1.0 & x3-x1>=2.0 & x4-x2>=3.0\n",
      "   +0.6867 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.1937 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4855 if c>=1.0 & x1>=1.0\n",
      "   +0.6493 if c>=1.0 & x1>=3.0\n",
      "   -0.2863 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1208 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.6890 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.4403 if x1<=0.0\n",
      "   +0.6079 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1628 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2234 if x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1311 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   -0.2570 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.0900 if c>=1.0 & x2>=3.0\n",
      "   -0.0285 if x1<=1.0 & x2<=0.0 & x3-x1>=0.0\n",
      "   -0.0853 if x2>=2.0 & x3-x1>=1.0\n",
      "   +0.0867 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "init state [ 2  0 -2  3  0]\n",
      "(29,) (29,)\n",
      "init state [ 3  1 -2  0  0]\n",
      "(45,) (16,)\n",
      "init state [3 0 0 1 0]\n",
      "(51,) (6,)\n",
      "init state [ 3  1 -1  1  0]\n",
      "(71,) (20,)\n",
      "init state [0 0 0 3 0]\n",
      "(106,) (35,)\n",
      "init state [ 2  0 -1  1  0]\n",
      "(119,) (13,)\n",
      "init state [0 3 1 0 0]\n",
      "(123,) (4,)\n",
      "init state [0 0 1 1 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(129,) (6,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(142,) (13,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(150,) (8,)\n",
      "============ 84 ===========\n",
      "Run episode 84 with rewards 34, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.2694 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.3507 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1186 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.2169 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1319 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.2312 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   +0.0470 if x4-x2<=1.0\n",
      "   +0.1655 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.2928 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.4361 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.0582 if x3-x1<=0.0\n",
      "   -0.1393 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.5709 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.0185 if x3-x1<=-3.0\n",
      "   -0.2207 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.4862 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "----------------- 1 --------------\n",
      "   -0.5402 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6224 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0184 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0908 if x4-x2<=1.0\n",
      "   +0.2380 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4609 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.2430 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1858 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4714 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   -0.6303 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2<=0.0\n",
      "   +0.3195 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0748 if x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.4773 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0000 if x3-x1>=2.0\n",
      "   -0.3877 if x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.5001 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.2414 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.5013 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.1161 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3471 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3564 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2131 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.2599 if x4-x2>=0.0\n",
      "   -0.3008 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0006 if x4-x2<=-1.0\n",
      "   -0.2613 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.5821 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.2605 if x3-x1<=1.0\n",
      "   +0.2507 if x2>=2.0 & x3-x1<=1.0\n",
      "   -0.0006 if x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.3170 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.1268 if x1<=2.0 & x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.8210 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3656 if c>=1.0 & x1>=1.0\n",
      "   +0.3187 if c>=1.0 & x1>=3.0\n",
      "   -0.2464 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0240 if c<=0.0 & x1>=3.0 & x4-x2<=1.0\n",
      "   +0.1825 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.1219 if x1<=0.0\n",
      "   -0.1147 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1685 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0883 if x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1721 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.2995 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.3030 if c>=1.0 & x2>=3.0\n",
      "   -0.1218 if x2>=2.0 & x3-x1>=1.0\n",
      "   +0.4096 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.6311 if c<=0.0 & x1<=1.0 & x2>=3.0 & x3-x1<=-1.0\n",
      "init state [ 3  1 -2  2  0]\n",
      "(10,) (10,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(24,) (14,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(45,) (21,)\n",
      "init state [ 1  3 -1 -3  0]\n",
      "(73,) (28,)\n",
      "init state [0 0 3 2 0]\n",
      "(85,) (12,)\n",
      "init state [ 0  2  1 -2  0]\n",
      "(99,) (14,)\n",
      "init state [1 2 2 0 0]\n",
      "(107,) (8,)\n",
      "init state [1 0 1 0 0]\n",
      "(116,) (9,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(183,) (67,)\n",
      "init state [ 2  2 -2  1  0]\n",
      "(199,) (16,)\n",
      "============ 85 ===========\n",
      "Run episode 85 with rewards 26, accuracy 0.1\n",
      "----------------- 0 --------------\n",
      "   -0.3523 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5296 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3338 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1954 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.0266 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0025 if c<=0.0 & x1<=2.0 & x1>=1.0 & x3-x1>=-1.0 & x4-x2<=0.0\n",
      "   -0.1087 if x4-x2<=1.0\n",
      "   +0.0546 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.3108 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.1586 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.3012 if x3-x1<=0.0\n",
      "   -0.0227 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1753 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0750 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0807 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.1523 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.4433 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4598 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0154 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1833 if x4-x2<=1.0\n",
      "   +0.2588 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3160 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.2234 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2637 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3657 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.0024 if c<=0.0 & x1>=1.0 & x3-x1<=1.0 & x4-x2<=0.0\n",
      "   +0.2941 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.3040 if x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.3007 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1101 if x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.3580 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.0945 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.0000 if c>=1.0 & x1>=2.0 & x2>=2.0 & x4-x2<=-1.0 & x4-x2>=-1.0\n",
      "   +0.4580 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.2866 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1234 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5980 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3432 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3432 if x4-x2>=0.0\n",
      "   -0.4211 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0927 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.9619 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.3045 if x3-x1<=1.0\n",
      "   +0.0493 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.1211 if x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.2114 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.4107 if x1<=2.0 & x2<=0.0\n",
      "   -0.5800 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.4132 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.9706 if c>=1.0 & x1>=1.0\n",
      "   +0.5584 if c>=1.0 & x1>=3.0\n",
      "   -0.2320 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1433 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.1797 if x1<=0.0\n",
      "   +0.2628 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0448 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0316 if x3-x1>=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3884 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.0548 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.2557 if c>=1.0 & x2>=3.0\n",
      "   -0.2368 if x2>=2.0 & x3-x1>=1.0\n",
      "   +0.0786 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.3705 if c<=0.0 & x1<=1.0 & x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.0328 if x3-x1>=3.0\n",
      "init state [ 3  2 -2  1  0]\n",
      "(6,) (6,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(23,) (17,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(35,) (12,)\n",
      "init state [ 1  1 -1  1  0]\n",
      "(48,) (13,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(61,) (13,)\n",
      "init state [ 1  0 -1  1  0]\n",
      "(106,) (45,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(135,) (29,)\n",
      "init state [ 2  3 -1 -1  0]\n",
      "(151,) (16,)\n",
      "init state [ 2  1 -1  1  0]\n",
      "(169,) (18,)\n",
      "init state [1 1 1 0 0]\n",
      "(173,) (4,)\n",
      "============ 86 ===========\n",
      "Run episode 86 with rewards 38, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.7743 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5618 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1525 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.6490 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.2062 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0145 if x4-x2<=1.0\n",
      "   +0.1133 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.0473 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.1453 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.2756 if x3-x1<=0.0\n",
      "   +0.1514 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3760 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.6359 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.3273 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.1623 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.0194 if x4-x2<=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.6996 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6550 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0851 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0290 if x4-x2<=1.0\n",
      "   +0.2571 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2856 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.1671 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4419 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3825 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2915 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.2564 if x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.4621 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.1717 if x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   -0.0306 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.0290 if x3-x1<=2.0 & x4-x2<=1.0\n",
      "   -0.2700 if x2<=2.0 & x4-x2>=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.2815 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.3571 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0559 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3059 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.1851 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.5334 if x4-x2>=0.0\n",
      "   -0.3474 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2137 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.8013 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1758 if x3-x1<=1.0\n",
      "   -0.0277 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.2046 if x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.5719 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.0078 if x1<=2.0 & x2<=0.0\n",
      "   -0.1710 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.5980 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.6008 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5476 if c>=1.0 & x1>=1.0\n",
      "   +0.7134 if c>=1.0 & x1>=3.0\n",
      "   -0.3096 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0473 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.1781 if x1<=0.0\n",
      "   +0.1470 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0439 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1061 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.1061 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.0381 if c>=1.0 & x2>=3.0\n",
      "   -0.2046 if x2>=2.0 & x3-x1>=1.0\n",
      "   -0.1549 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   -0.4683 if x1>=2.0 & x4-x2>=2.0\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(45,) (45,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(58,) (13,)\n",
      "init state [1 0 0 2 0]\n",
      "(75,) (17,)\n",
      "init state [ 1  3 -1 -3  0]\n",
      "(104,) (29,)\n",
      "init state [0 1 2 2 0]\n",
      "(111,) (7,)\n",
      "init state [ 2  2  0 -1  0]\n",
      "(121,) (10,)\n",
      "init state [ 3  1  0 -1  0]\n",
      "(125,) (4,)\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(144,) (19,)\n",
      "init state [2 1 1 0 0]\n",
      "(151,) (7,)\n",
      "init state [0 2 2 1 0]\n",
      "(161,) (10,)\n",
      "============ 87 ===========\n",
      "Run episode 87 with rewards 32, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.5246 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5969 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1192 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.5981 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.3507 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0063 if x3-x1<=0.0 & x4-x2<=1.0\n",
      "   -0.2480 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.2087 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.1241 if x3-x1<=0.0\n",
      "   +0.4849 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3384 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.6088 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   +0.2917 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.2434 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   -0.3260 if x4-x2<=0.0\n",
      "   +1.0696 if c<=0.0 & x2<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.4841 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.8137 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3624 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.1526 if x4-x2<=1.0\n",
      "   +0.4100 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1745 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.5066 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3596 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1499 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.7409 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0315 if x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.4569 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0274 if x3-x1<=0.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.0999 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.1538 if x2<=2.0 & x4-x2>=0.0\n",
      "   -0.1848 if x4-x2>=3.0\n",
      "----------------- 2 --------------\n",
      "   +0.2393 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0170 if c<=0.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0374 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5277 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2777 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4638 if x4-x2>=0.0\n",
      "   -0.3974 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0700 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.5149 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0863 if x3-x1<=1.0\n",
      "   +0.0695 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.1401 if x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.1835 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.4952 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0483 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   -0.2608 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.2860 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7151 if c>=1.0 & x1>=1.0\n",
      "   +0.6012 if c>=1.0 & x1>=3.0\n",
      "   -0.1847 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0064 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.0434 if x1<=0.0\n",
      "   +0.3534 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0702 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.5061 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   -0.0792 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.1745 if c>=1.0 & x2>=3.0\n",
      "   -0.2821 if x2>=2.0 & x3-x1>=1.0\n",
      "   -0.0105 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0499 if c<=0.0 & x1<=1.0 & x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.2752 if x1>=2.0 & x4-x2>=2.0\n",
      "   +0.2647 if x4-x2>=3.0\n",
      "init state [ 2  3 -2 -2  0]\n",
      "(13,) (13,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(47,) (34,)\n",
      "init state [2 0 1 1 0]\n",
      "(53,) (6,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(61,) (8,)\n",
      "init state [1 1 2 0 0]\n",
      "(65,) (4,)\n",
      "init state [0 3 2 0 0]\n",
      "(68,) (3,)\n",
      "init state [ 3  1 -1 -1  0]\n",
      "(79,) (11,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(93,) (14,)\n",
      "init state [1 0 1 2 0]\n",
      "(101,) (8,)\n",
      "init state [ 1  3 -1 -2  0]\n",
      "(126,) (25,)\n",
      "============ 88 ===========\n",
      "Run episode 88 with rewards 17, accuracy 0.1\n",
      "----------------- 0 --------------\n",
      "   -0.1919 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.8651 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2256 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.4000 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1414 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.1575 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.0000 if c<=0.0 & x1<=2.0 & x1>=2.0 & x2<=2.0 & x3-x1<=-1.0 & x3-x1>=-1.0\n",
      "   +0.1937 if x3-x1<=0.0\n",
      "   +0.4378 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3603 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.3796 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.2141 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.2149 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   -0.2350 if x4-x2<=0.0\n",
      "   +0.6483 if c<=0.0 & x2<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=1.0\n",
      "   +0.0436 if c<=0.0 & x1<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.5639 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4282 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2008 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3169 if x4-x2<=1.0\n",
      "   +0.5667 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3022 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.0266 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4651 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2481 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.5878 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.3375 if x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.4042 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1243 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.0028 if x2<=2.0 & x4-x2>=0.0\n",
      "   +0.0548 if x4-x2>=3.0\n",
      "   +0.3605 if x2<=0.0 & x3-x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.1304 if c<=0.0 & x4-x2>=-2.0\n",
      "   -0.0344 if x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5583 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4487 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.5762 if x4-x2>=0.0\n",
      "   -0.4810 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0715 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.5922 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.3067 if x3-x1<=1.0\n",
      "   +0.2454 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.2100 if x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.2386 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.3782 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0606 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   -0.0674 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.3740 if x1>=2.0 & x2<=0.0 & x3-x1>=0.0 & x4-x2>=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.3384 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7565 if c>=1.0 & x1>=1.0\n",
      "   +1.0359 if c>=1.0 & x1>=3.0\n",
      "   +0.0040 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0187 if x1<=0.0\n",
      "   +0.2525 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.1314 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0609 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   -0.1374 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   +0.0077 if c>=1.0 & x2>=3.0\n",
      "   -0.1440 if x2>=2.0 & x3-x1>=1.0\n",
      "   -0.3076 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0621 if c<=0.0 & x1<=1.0 & x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.3379 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.0040 if x4-x2>=3.0\n",
      "   -0.4656 if x3-x1>=1.0\n",
      "init state [ 1  0 -1  1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(29,) (29,)\n",
      "init state [ 0  3  3 -2  0]\n",
      "(39,) (10,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(91,) (52,)\n",
      "init state [0 0 2 0 0]\n",
      "(97,) (6,)\n",
      "init state [ 1  2 -1  1  0]\n",
      "(117,) (20,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(124,) (7,)\n",
      "init state [ 2  0 -1  1  0]\n",
      "(136,) (12,)\n",
      "init state [2 0 0 2 0]\n",
      "(145,) (9,)\n",
      "init state [ 2  3 -2 -2  0]\n",
      "(161,) (16,)\n",
      "init state [ 0  3  3 -2  0]\n",
      "(170,) (9,)\n",
      "============ 89 ===========\n",
      "Run episode 89 with rewards 33, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.5665 if c>=1.0 & x3-x1<=1.0\n",
      "   +1.0033 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2965 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1020 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.0518 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0317 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.4516 if x3-x1<=0.0\n",
      "   +0.3313 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.6952 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0667 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   +0.0121 if c<=0.0 & x1<=2.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.3346 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   -0.0886 if x4-x2<=0.0\n",
      "   +0.3824 if c<=0.0 & x2<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=1.0\n",
      "   -0.0867 if c<=0.0 & x1<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.2750 if x1<=2.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.3243 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.9170 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3015 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2506 if x4-x2<=1.0\n",
      "   +0.3911 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3801 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.1626 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1895 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4737 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2721 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0639 if x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.2246 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0705 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.0803 if x4-x2>=3.0\n",
      "   -0.1595 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.4078 if x2>=3.0 & x3-x1>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.4002 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.6052 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4023 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4722 if x4-x2>=0.0\n",
      "   -0.5613 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1768 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.3419 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1411 if x3-x1<=1.0\n",
      "   -0.1265 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.0061 if x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.0092 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.1844 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0268 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.2176 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1380 if x1>=2.0 & x2<=0.0 & x3-x1>=0.0 & x4-x2>=2.0\n",
      "   +0.5140 if x2>=3.0 & x3-x1>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.2723 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7761 if c>=1.0 & x1>=1.0\n",
      "   +0.9480 if c>=1.0 & x1>=3.0\n",
      "   -0.3159 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1187 if x1<=0.0\n",
      "   +0.5838 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1390 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1169 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.0409 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   +0.0017 if c>=1.0 & x2>=3.0\n",
      "   -0.2659 if x2>=2.0 & x3-x1>=1.0\n",
      "   -0.2005 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0320 if c<=0.0 & x1<=1.0 & x2>=3.0 & x3-x1<=-1.0\n",
      "   -0.1528 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.3044 if x3-x1>=1.0\n",
      "   +0.3134 if x3-x1>=-2.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "init state [1 1 0 2 0]\n",
      "(13,) (13,)\n",
      "init state [1 1 2 0 0]\n",
      "(21,) (8,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(33,) (12,)\n",
      "init state [1 3 1 0 0]\n",
      "(35,) (2,)\n",
      "init state [0 0 0 3 0]\n",
      "(47,) (12,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(73,) (26,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(92,) (19,)\n",
      "init state [0 2 0 1 0]\n",
      "(100,) (8,)\n",
      "init state [ 3  2 -1  0  0]\n",
      "(104,) (4,)\n",
      "init state [0 1 3 0 0]\n",
      "(111,) (7,)\n",
      "============ 90 ===========\n",
      "Run episode 90 with rewards 35, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.4185 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.8687 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2282 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1131 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.3319 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.4818 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.4204 if x3-x1<=0.0\n",
      "   +0.1098 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1710 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0925 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0394 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   -0.0532 if x4-x2<=0.0\n",
      "   -0.0827 if c<=0.0 & x2<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=1.0\n",
      "   +0.3013 if c<=0.0 & x1<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   -0.0231 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.0027 if c<=0.0 & x2<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.4062 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6503 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3638 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5063 if x4-x2<=1.0\n",
      "   +0.2543 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1395 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.0675 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0229 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2125 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.4897 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.2395 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2723 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.1082 if x4-x2>=3.0\n",
      "   +0.0000 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1>=2.0\n",
      "   -0.4360 if c<=0.0 & x1<=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.0153 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.4680 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5535 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.6304 if x4-x2>=0.0\n",
      "   -0.5053 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0655 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.3931 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.2570 if x3-x1<=1.0\n",
      "   -0.2451 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.4680 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.2597 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0367 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1>=2.0 & x2<=0.0 & x3-x1>=0.0 & x4-x2>=2.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1>=3.0\n",
      "   -0.0553 if c<=0.0 & x1>=2.0 & x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.2549 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7665 if c>=1.0 & x1>=1.0\n",
      "   +0.4541 if c>=1.0 & x1>=3.0\n",
      "   +0.0000 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2356 if x1<=0.0\n",
      "   +0.2062 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.2217 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3862 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.1751 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.0661 if x2>=2.0 & x3-x1>=1.0\n",
      "   -0.3012 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x2>=3.0 & x3-x1<=-1.0\n",
      "   +0.0000 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.4093 if x3-x1>=1.0\n",
      "   +0.0000 if x3-x1>=-2.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.3050 if x1<=0.0 & x4-x2>=2.0\n",
      "init state [ 2  2 -1  0  0]\n",
      "(4,) (4,)\n",
      "init state [ 2  1 -2  2  0]\n",
      "(14,) (10,)\n",
      "init state [ 3  2  0 -2  0]\n",
      "(30,) (16,)\n",
      "init state [ 2  3 -1  0  0]\n",
      "(37,) (7,)\n",
      "init state [2 0 1 0 0]\n",
      "(41,) (4,)\n",
      "init state [ 3  1 -2  1  0]\n",
      "(61,) (20,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(66,) (5,)\n",
      "init state [ 2  1 -2  0  0]\n",
      "(84,) (18,)\n",
      "init state [ 1  3  2 -3  0]\n",
      "(111,) (27,)\n",
      "init state [ 0  3  2 -2  0]\n",
      "(124,) (13,)\n",
      "============ 91 ===========\n",
      "Run episode 91 with rewards 29, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.4640 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.8317 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0337 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.4731 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.2126 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1048 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.0558 if x3-x1<=0.0\n",
      "   +0.2380 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1014 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.2583 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.2284 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   -0.0065 if x4-x2<=0.0\n",
      "   +0.2007 if c<=0.0 & x2<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=1.0\n",
      "   -0.0955 if c<=0.0 & x1<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.0781 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.2644 if x3-x1<=-2.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.3144 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4172 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1439 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5826 if x4-x2<=1.0\n",
      "   +0.1341 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1401 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   -0.0211 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2783 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5093 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.1269 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.4481 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0054 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   -0.0644 if x2>=3.0 & x3-x1>=2.0\n",
      "   +0.0345 if c<=0.0 & x1<=0.0\n",
      "   -0.5544 if x2<=2.0 & x3-x1<=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.3460 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.5957 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3893 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3893 if x4-x2>=0.0\n",
      "   -0.2290 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2175 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.3693 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1439 if x3-x1<=1.0\n",
      "   -0.1160 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.5323 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.1021 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.3085 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   -0.0256 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1>=3.0\n",
      "   +0.0100 if c<=0.0 & x1>=2.0 & x4-x2<=-2.0\n",
      "   -0.2371 if x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.2309 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.9415 if c>=1.0 & x1>=1.0\n",
      "   +0.7160 if c>=1.0 & x1>=3.0\n",
      "   -0.4589 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2372 if x1<=0.0\n",
      "   +0.2544 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0806 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4381 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.0915 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.0784 if x2>=2.0 & x3-x1>=1.0\n",
      "   -0.5521 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0745 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.3622 if x3-x1>=1.0\n",
      "   +0.0000 if x3-x1>=-2.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.0000 if x1<=0.0 & x4-x2>=2.0\n",
      "   -0.0804 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "init state [ 2  0 -2  0  0]\n",
      "(15,) (15,)\n",
      "init state [ 3  0 -2  3  0]\n",
      "(36,) (21,)\n",
      "init state [ 3  0 -2  2  0]\n",
      "(47,) (11,)\n",
      "init state [ 3  1  0 -1  0]\n",
      "(59,) (12,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(65,) (6,)\n",
      "init state [ 2  3  0 -1  0]\n",
      "(72,) (7,)\n",
      "init state [0 1 1 0 0]\n",
      "(77,) (5,)\n",
      "init state [ 0  3  2 -3  0]\n",
      "(87,) (10,)\n",
      "init state [0 0 2 1 0]\n",
      "(101,) (14,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(130,) (29,)\n",
      "============ 92 ===========\n",
      "Run episode 92 with rewards 13, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.3070 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.8772 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0106 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3868 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.5892 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1295 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.0558 if x3-x1<=0.0\n",
      "   +0.5173 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2579 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.4423 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.2167 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.1546 if c<=0.0 & x2<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x2>=2.0 & x3-x1<=0.0\n",
      "   +0.4461 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0821 if x3-x1<=-2.0 & x4-x2>=2.0\n",
      "   -0.0710 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.8689 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4586 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.5207 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2391 if x4-x2<=1.0\n",
      "   +0.2627 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0265 if x1<=2.0 & x2>=2.0 & x3-x1>=-1.0\n",
      "   +0.1269 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2503 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4192 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.1889 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.0745 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.2690 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.1982 if x2>=3.0 & x3-x1>=2.0\n",
      "   +0.0428 if c<=0.0 & x1<=0.0\n",
      "   -0.2760 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2244 if x1>=1.0 & x4-x2<=-3.0\n",
      "----------------- 2 --------------\n",
      "   +0.4172 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.6418 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5612 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.6824 if x4-x2>=0.0\n",
      "   -0.4384 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1044 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.6030 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.0169 if x3-x1<=1.0\n",
      "   +0.7405 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.2667 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.2787 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.2373 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   -0.0837 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0382 if c<=0.0 & x1>=2.0 & x4-x2<=-2.0\n",
      "   +0.0916 if x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.0783 if x1>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.4918 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.9353 if c>=1.0 & x1>=1.0\n",
      "   +1.2785 if c>=1.0 & x1>=3.0\n",
      "   -0.3012 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0713 if x1<=0.0\n",
      "   -0.0874 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1877 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.5037 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.2402 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.2674 if x2>=2.0 & x3-x1>=1.0\n",
      "   -0.4804 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1885 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.5013 if x3-x1>=1.0\n",
      "   +0.2635 if x1<=0.0 & x4-x2>=2.0\n",
      "   -0.1060 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1340 if x1<=0.0 & x3-x1>=2.0\n",
      "init state [ 0  3  1 -1  0]\n",
      "(5,) (5,)\n",
      "init state [1 0 0 1 0]\n",
      "(21,) (16,)\n",
      "init state [ 2  3 -1 -2  0]\n",
      "(34,) (13,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(45,) (11,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(50,) (5,)\n",
      "init state [ 1  3  1 -2  0]\n",
      "(59,) (9,)\n",
      "init state [1 0 1 2 0]\n",
      "(67,) (8,)\n",
      "init state [0 0 0 3 0]\n",
      "(77,) (10,)\n",
      "init state [ 0  1  3 -1  0]\n",
      "(88,) (11,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(112,) (24,)\n",
      "============ 93 ===========\n",
      "Run episode 93 with rewards 18, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.6180 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.7215 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0769 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.0005 if x2<=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.5064 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.3186 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.0945 if x3-x1<=0.0\n",
      "   -0.0264 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0267 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.2463 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.0305 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.3300 if c<=0.0 & x2<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=1.0\n",
      "   -0.2575 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.0637 if x3-x1<=-2.0 & x4-x2>=2.0\n",
      "   -0.0523 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   +0.4156 if x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   -0.7981 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6449 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1163 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5203 if x4-x2<=1.0\n",
      "   -0.0605 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2067 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2552 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.7406 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3325 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.3635 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.1376 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.2131 if x2>=3.0 & x3-x1>=2.0\n",
      "   -0.0144 if c<=0.0 & x1<=0.0\n",
      "   -0.8409 if x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0000 if x1>=1.0 & x4-x2<=-3.0\n",
      "   -0.2794 if x3-x1>=3.0\n",
      "----------------- 2 --------------\n",
      "   +0.4249 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.5081 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2172 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3772 if x4-x2>=0.0\n",
      "   -0.6733 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3015 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.1763 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.0591 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.2545 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.2135 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1259 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   -0.1640 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0185 if c<=0.0 & x1>=2.0 & x4-x2<=-2.0\n",
      "   +0.1053 if x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.2275 if x1>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.4346 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.5186 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7754 if c>=1.0 & x1>=1.0\n",
      "   +0.8045 if c>=1.0 & x1>=3.0\n",
      "   -0.2020 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0036 if c<=0.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2879 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.5088 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   -0.1047 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.1262 if x2>=2.0 & x3-x1>=1.0\n",
      "   -0.1887 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.3890 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.3271 if x3-x1>=1.0\n",
      "   +0.3076 if x1<=0.0 & x4-x2>=2.0\n",
      "   -0.1891 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1138 if x1<=0.0 & x3-x1>=2.0\n",
      "   +0.6358 if x1<=1.0 & x1>=1.0 & x4-x2>=2.0\n",
      "init state [2 0 1 1 0]\n",
      "(26,) (26,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(38,) (12,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(58,) (20,)\n",
      "init state [ 3  0 -1  3  0]\n",
      "(69,) (11,)\n",
      "init state [ 3  1 -2  2  0]\n",
      "(77,) (8,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(85,) (8,)\n",
      "init state [ 3  2 -3  1  0]\n",
      "(93,) (8,)\n",
      "init state [1 1 1 0 0]\n",
      "(105,) (12,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(118,) (13,)\n",
      "init state [ 3  2 -2 -1  0]\n",
      "(151,) (33,)\n",
      "============ 94 ===========\n",
      "Run episode 94 with rewards 9, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.4365 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.7874 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0996 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0433 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.6316 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.0030 if x3-x1<=0.0\n",
      "   +0.0372 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1367 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.1617 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   -0.1979 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   -0.1611 if c<=0.0 & x2<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=1.0\n",
      "   +0.0850 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.1049 if x3-x1<=-2.0 & x4-x2>=2.0\n",
      "   -0.0895 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   -0.0459 if x4-x2>=3.0\n",
      "   +0.2340 if x3-x1<=-3.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   -0.7470 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6455 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.4746 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.0211 if x4-x2<=1.0\n",
      "   -0.1322 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.7162 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1999 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2225 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2561 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.4263 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2186 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1>=2.0\n",
      "   -0.1786 if c<=0.0 & x1<=0.0\n",
      "   -0.6021 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1786 if x3-x1>=3.0\n",
      "   +0.4702 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.4170 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.6082 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4194 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4842 if x4-x2>=0.0\n",
      "   -0.2191 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2759 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.5085 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1285 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.3904 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.2210 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0623 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   -0.2215 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.3940 if x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4374 if x1>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0091 if x1>=2.0 & x3-x1<=-1.0 & x4-x2>=-1.0\n",
      "   -0.6382 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4581 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4048 if c>=1.0 & x1>=1.0\n",
      "   +0.8679 if c>=1.0 & x1>=3.0\n",
      "   -0.1986 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1370 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3488 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.5246 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.2019 if x2>=2.0 & x3-x1>=1.0\n",
      "   +0.1192 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.6977 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.3344 if x3-x1>=1.0\n",
      "   +0.0000 if x1<=0.0 & x4-x2>=2.0\n",
      "   -0.1769 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1495 if x1<=0.0 & x3-x1>=2.0\n",
      "   +0.0000 if x1<=1.0 & x1>=1.0 & x4-x2>=2.0\n",
      "   -0.5592 if x1>=2.0 & x2>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "init state [1 0 2 2 0]\n",
      "(8,) (8,)\n",
      "init state [ 3  0 -1  2  0]\n",
      "(13,) (5,)\n",
      "init state [ 1  3 -1 -2  0]\n",
      "(25,) (12,)\n",
      "init state [ 2  2  1 -1  0]\n",
      "(37,) (12,)\n",
      "init state [ 2  2 -2 -1  0]\n",
      "(77,) (40,)\n",
      "init state [ 2  2 -2  1  0]\n",
      "(85,) (8,)\n",
      "init state [1 1 1 1 0]\n",
      "(91,) (6,)\n",
      "init state [1 1 1 1 0]\n",
      "(97,) (6,)\n",
      "init state [0 1 1 2 0]\n",
      "(108,) (11,)\n",
      "init state [1 0 2 1 0]\n",
      "(118,) (10,)\n",
      "============ 95 ===========\n",
      "Run episode 95 with rewards 32, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.5903 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.7549 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3588 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.4379 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.5391 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.4132 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0966 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0638 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   +0.2279 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.3417 if c<=0.0 & x2<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=1.0\n",
      "   +0.4719 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0000 if x3-x1<=-2.0 & x4-x2>=2.0\n",
      "   +0.1603 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   -0.0000 if x4-x2>=3.0\n",
      "   -0.0954 if x3-x1<=-3.0\n",
      "   +0.7265 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.7781 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.8525 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3398 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3446 if x4-x2<=1.0\n",
      "   -0.2281 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.6395 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1883 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.0792 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.0476 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.6047 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.1457 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.7834 if c<=0.0 & x1<=0.0\n",
      "   -0.3204 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0000 if x3-x1>=3.0\n",
      "   -0.0345 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.2570 if x1>=1.0 & x2>=3.0 & x3-x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.1182 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.5379 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.6073 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.6073 if x4-x2>=0.0\n",
      "   -0.8074 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2494 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.4250 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0034 if x2>=2.0 & x3-x1<=1.0\n",
      "   +0.1230 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.0524 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1097 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   -0.0361 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.3853 if x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.3087 if x1>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2258 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.3919 if x3-x1>=2.0 & x4-x2>=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.2643 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3225 if c>=1.0 & x1>=1.0\n",
      "   +0.5889 if c>=1.0 & x1>=3.0\n",
      "   -0.2567 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1782 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0874 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.0000 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   +0.1108 if x2>=2.0 & x3-x1>=1.0\n",
      "   -0.1812 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1287 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.0421 if x3-x1>=1.0\n",
      "   +0.0703 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x1<=0.0 & x3-x1>=2.0\n",
      "   -0.2291 if x1<=1.0 & x1>=1.0 & x4-x2>=2.0\n",
      "   +0.0000 if x1>=2.0 & x2>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.5034 if x1>=2.0 & x3-x1>=0.0 & x4-x2>=2.0\n",
      "init state [0 0 2 3 0]\n",
      "(14,) (14,)\n",
      "init state [0 0 1 2 0]\n",
      "(22,) (8,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(29,) (7,)\n",
      "init state [0 0 0 1 0]\n",
      "(38,) (9,)\n",
      "init state [2 0 1 0 0]\n",
      "(60,) (22,)\n",
      "init state [ 3  0 -2  2  0]\n",
      "(70,) (10,)\n",
      "init state [ 2  3  0 -1  0]\n",
      "(74,) (4,)\n",
      "init state [2 1 0 2 0]\n",
      "(81,) (7,)\n",
      "init state [ 0  3  0 -2  0]\n",
      "(104,) (23,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(122,) (18,)\n",
      "============ 96 ===========\n",
      "Run episode 96 with rewards 24, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.4305 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.7651 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2120 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1750 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2030 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.3793 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3331 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0686 if c<=0.0 & x1<=2.0 & x3-x1>=0.0\n",
      "   +0.1850 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   +0.3936 if c<=0.0 & x2<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=1.0\n",
      "   +0.0900 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.2453 if x3-x1<=-2.0 & x4-x2>=2.0\n",
      "   +0.3847 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   -0.2035 if x3-x1<=-3.0\n",
      "   -0.3222 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   -0.3986 if x3-x1<=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.4373 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.8266 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2426 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2446 if x4-x2<=1.0\n",
      "   -0.1726 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5023 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1265 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3701 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.0345 if x1<=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.1314 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.4454 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.1056 if c<=0.0 & x1<=0.0\n",
      "   -0.2473 if x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0650 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0436 if x1>=1.0 & x2>=3.0 & x3-x1>=1.0\n",
      "   -0.2160 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.0370 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.6316 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5483 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.6061 if x4-x2>=0.0\n",
      "   -0.3850 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1263 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.6999 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0266 if c<=0.0 & x1<=2.0 & x2<=2.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   -0.2132 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.2271 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   -0.3441 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2442 if x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.0649 if x1>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1191 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.1201 if x3-x1>=2.0 & x4-x2>=2.0\n",
      "   -0.0695 if x3-x1<=1.0 & x4-x2>=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.3911 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.6578 if c>=1.0 & x1>=1.0\n",
      "   +0.6473 if c>=1.0 & x1>=3.0\n",
      "   -0.3635 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1953 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1376 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   +0.3905 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.2475 if x2>=2.0 & x3-x1>=1.0\n",
      "   +0.1747 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3052 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.0052 if x3-x1>=1.0\n",
      "   +0.0635 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2256 if x1<=1.0 & x1>=1.0 & x4-x2>=2.0\n",
      "   -0.3829 if x1>=2.0 & x2>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.1456 if x1>=2.0 & x3-x1>=0.0 & x4-x2>=2.0\n",
      "   +0.6954 if x1<=2.0 & x2<=0.0\n",
      "init state [ 2  0 -2  3  0]\n",
      "(11,) (11,)\n",
      "init state [1 1 1 1 0]\n",
      "(15,) (4,)\n",
      "init state [0 2 1 1 0]\n",
      "(25,) (10,)\n",
      "init state [ 2  0 -1  0  0]\n",
      "(40,) (15,)\n",
      "init state [ 3  0 -2  3  0]\n",
      "(51,) (11,)\n",
      "init state [ 3  1 -3 -1  0]\n",
      "(71,) (20,)\n",
      "init state [ 2  3 -1 -2  0]\n",
      "(83,) (12,)\n",
      "init state [ 3  1 -3 -1  0]\n",
      "(121,) (38,)\n",
      "init state [0 0 3 1 0]\n",
      "(133,) (12,)\n",
      "init state [ 1  2  2 -2  0]\n",
      "(144,) (11,)\n",
      "============ 97 ===========\n",
      "Run episode 97 with rewards 31, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.6024 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5823 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1520 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3377 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.4789 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.0670 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2356 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.0000 if x3-x1>=-1.0 & x4-x2>=2.0\n",
      "   -0.0199 if c<=0.0 & x2<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=1.0\n",
      "   +0.2094 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0955 if x3-x1<=-2.0 & x4-x2>=2.0\n",
      "   +0.0643 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   +0.4216 if x3-x1<=-3.0\n",
      "   +0.2250 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   +0.0410 if x3-x1<=1.0\n",
      "   +0.8310 if c<=0.0 & x1>=1.0 & x2>=3.0 & x4-x2>=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.5379 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.7836 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3267 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1397 if x4-x2<=1.0\n",
      "   +0.0511 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3140 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2866 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3514 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.5145 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.3090 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.3973 if c<=0.0 & x1<=0.0\n",
      "   -0.1126 if x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0106 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0000 if x1>=1.0 & x2>=3.0 & x3-x1>=1.0\n",
      "   +0.0429 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.5882 if x3-x1>=2.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.0285 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.6830 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5929 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.6749 if x4-x2>=0.0\n",
      "   -0.4904 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4391 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.2088 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0808 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0319 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   -0.1615 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2639 if x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3811 if x1>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1025 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2>=2.0\n",
      "   -0.1008 if x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   +0.2377 if c<=0.0 & x4-x2<=-3.0\n",
      "----------------- 3 --------------\n",
      "   +0.4201 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.6918 if c>=1.0 & x1>=1.0\n",
      "   +0.4165 if c>=1.0 & x1>=3.0\n",
      "   -0.5904 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2431 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x3-x1>=-1.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "   -0.0572 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.7181 if x2>=2.0 & x3-x1>=1.0\n",
      "   -0.1308 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2282 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.1655 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x1<=1.0 & x1>=1.0 & x4-x2>=2.0\n",
      "   -0.2204 if x1>=2.0 & x2>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1>=2.0 & x3-x1>=0.0 & x4-x2>=2.0\n",
      "   +0.2309 if x1<=2.0 & x2<=0.0\n",
      "   +0.3237 if x3-x1>=-2.0\n",
      "init state [0 0 1 2 0]\n",
      "(11,) (11,)\n",
      "init state [ 0  3  3 -1  0]\n",
      "(19,) (8,)\n",
      "init state [0 1 2 1 0]\n",
      "(25,) (6,)\n",
      "init state [ 1  2  0 -1  0]\n",
      "(32,) (7,)\n",
      "init state [ 0  2  1 -1  0]\n",
      "(59,) (27,)\n",
      "init state [2 2 0 1 0]\n",
      "(61,) (2,)\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(100,) (39,)\n",
      "init state [ 1  3  2 -1  0]\n",
      "(117,) (17,)\n",
      "init state [0 1 2 0 0]\n",
      "(128,) (11,)\n",
      "init state [ 2  2 -2  0  0]\n",
      "(134,) (6,)\n",
      "============ 98 ===========\n",
      "Run episode 98 with rewards 36, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.5136 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5991 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1350 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.4703 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2693 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.0179 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2709 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.1024 if c<=0.0 & x2<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=1.0\n",
      "   +0.1924 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.0000 if x3-x1<=-2.0 & x4-x2>=2.0\n",
      "   +0.4350 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   +0.5340 if x3-x1<=-3.0\n",
      "   +0.4038 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   +0.0427 if x3-x1<=1.0\n",
      "   +0.0201 if c<=0.0 & x1>=1.0 & x2>=3.0 & x4-x2>=-2.0\n",
      "   +0.3768 if x3-x1>=3.0\n",
      "----------------- 1 --------------\n",
      "   -0.5223 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.7126 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.7482 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2489 if x4-x2<=1.0\n",
      "   +0.1670 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4442 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1902 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.6220 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.4507 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0734 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   -0.2014 if c<=0.0 & x1<=0.0\n",
      "   -0.9440 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.3562 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0620 if c>=1.0 & x1>=1.0 & x2>=3.0 & x3-x1>=-1.0 & x4-x2>=0.0\n",
      "   +0.5814 if x3-x1>=2.0 & x4-x2<=0.0\n",
      "   -0.6328 if c<=0.0 & x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.0454 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.7018 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3528 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3528 if x4-x2>=0.0\n",
      "   -0.3168 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5450 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.3896 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.3303 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x1>=2.0 & x2<=1.0 & x3-x1>=1.0\n",
      "   -0.3823 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0257 if x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2933 if x1>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3255 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.1570 if x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.0489 if c<=0.0 & x4-x2<=-3.0\n",
      "   -0.0490 if x1<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3983 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5996 if c>=1.0 & x1>=1.0\n",
      "   +0.4934 if c>=1.0 & x1>=3.0\n",
      "   -0.2348 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1826 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.3573 if x2>=2.0 & x3-x1>=1.0\n",
      "   +0.1614 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0000 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.5743 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x1<=1.0 & x1>=1.0 & x4-x2>=2.0\n",
      "   +0.1752 if x1>=2.0 & x2>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1>=2.0 & x3-x1>=0.0 & x4-x2>=2.0\n",
      "   -0.2333 if x1<=2.0 & x2<=0.0\n",
      "   +0.4373 if x3-x1>=-2.0\n",
      "   -0.7363 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "init state [ 2  3 -1 -2  0]\n",
      "(12,) (12,)\n",
      "init state [2 1 1 1 0]\n",
      "(23,) (11,)\n",
      "init state [ 1  2  2 -2  0]\n",
      "(33,) (10,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(40,) (7,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(51,) (11,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(66,) (15,)\n",
      "init state [3 1 0 1 0]\n",
      "(68,) (2,)\n",
      "init state [ 2  3  1 -3  0]\n",
      "(82,) (14,)\n",
      "init state [ 1  1  1 -1  0]\n",
      "(90,) (8,)\n",
      "init state [ 3  1 -1  0  0]\n",
      "(96,) (6,)\n",
      "============ 99 ===========\n",
      "Run episode 99 with rewards 36, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.2938 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.3304 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0459 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.5141 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2894 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.0000 if x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0293 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.3304 if c<=0.0 & x2<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=1.0\n",
      "   +0.1963 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0696 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   +0.0000 if x3-x1<=-3.0\n",
      "   -0.1018 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   -0.0989 if x3-x1<=1.0\n",
      "   +0.0965 if c<=0.0 & x1>=1.0 & x2>=3.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   -0.1752 if c<=0.0 & x1>=2.0 & x2<=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   -0.5124 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6314 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.5020 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.0318 if x4-x2<=1.0\n",
      "   +0.2849 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2903 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2825 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3812 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2735 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0000 if x1<=2.0 & x2>=3.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-1.0\n",
      "   +0.3079 if c<=0.0 & x1<=0.0\n",
      "   -0.1116 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.4264 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.3274 if x3-x1>=2.0 & x4-x2<=0.0\n",
      "   -0.4960 if c<=0.0 & x2>=1.0\n",
      "   -0.2064 if x2>=2.0 & x3-x1>=2.0 & x4-x2<=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.2766 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.2305 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3683 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3683 if x4-x2>=0.0\n",
      "   -0.3683 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4446 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.3628 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.3420 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1493 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.1877 if x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.2300 if x1>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0628 if x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0689 if x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   +0.2884 if c<=0.0 & x4-x2<=-3.0\n",
      "   +0.2796 if x1<=1.0\n",
      "   -0.3735 if x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.2084 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.5105 if c>=1.0 & x1>=1.0\n",
      "   +0.6872 if c>=1.0 & x1>=3.0\n",
      "   -0.4975 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2575 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.4898 if x2>=2.0 & x3-x1>=1.0\n",
      "   +0.2266 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0000 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.0295 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x1<=1.0 & x1>=1.0 & x4-x2>=2.0\n",
      "   +0.0000 if x1>=2.0 & x2>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.0628 if x1<=2.0 & x2<=0.0\n",
      "   +0.2266 if x3-x1>=-2.0\n",
      "   -0.6875 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.1315 if x4-x2<=-2.0\n",
      "init state [ 2  2  1 -1  0]\n",
      "(9,) (9,)\n",
      "init state [1 0 2 2 0]\n",
      "(28,) (19,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(54,) (26,)\n",
      "init state [ 0  3  0 -2  0]\n",
      "(72,) (18,)\n",
      "init state [ 1  3  0 -2  0]\n",
      "(82,) (10,)\n",
      "init state [ 1  3  1 -2  0]\n",
      "(88,) (6,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(101,) (13,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(110,) (9,)\n",
      "init state [0 2 3 0 0]\n",
      "(117,) (7,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(125,) (8,)\n",
      "============ 100 ===========\n",
      "Run episode 100 with rewards 34, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.3483 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0000 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2683 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1504 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.1762 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.2718 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.0000 if c<=0.0 & x2<=1.0 & x2<=2.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1<=1.0\n",
      "   +0.1852 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0556 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   +0.2340 if x3-x1<=-3.0\n",
      "   -0.2596 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   -0.2414 if x3-x1<=1.0\n",
      "   -0.0092 if c<=0.0 & x1>=1.0 & x2>=3.0 & x4-x2>=-2.0\n",
      "   -0.3467 if x3-x1>=3.0\n",
      "   +0.0860 if c<=0.0 & x1>=2.0 & x2<=0.0\n",
      "   -0.2854 if x1>=3.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.5290 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4712 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.8848 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.0126 if x4-x2<=1.0\n",
      "   +0.3358 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3005 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3102 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1035 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.1770 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.2944 if c<=0.0 & x1<=0.0\n",
      "   +0.0864 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1079 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.4670 if x3-x1>=2.0 & x4-x2<=0.0\n",
      "   -0.1525 if c<=0.0 & x2>=1.0\n",
      "   +0.0000 if x2>=2.0 & x3-x1>=2.0 & x4-x2<=-2.0\n",
      "   -0.3980 if x2<=2.0 & x3-x1<=0.0\n",
      "----------------- 2 --------------\n",
      "   -0.0671 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.2372 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4672 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4672 if x4-x2>=0.0\n",
      "   -0.3100 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3418 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.1926 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1576 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.2629 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.0504 if x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.0369 if x1>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1023 if x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   +0.0820 if c<=0.0 & x4-x2<=-3.0\n",
      "   +0.6829 if x1<=1.0\n",
      "   -0.2759 if x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.0333 if x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.5626 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.8086 if c>=1.0 & x1>=1.0\n",
      "   +1.0020 if c>=1.0 & x1>=3.0\n",
      "   -0.3041 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2479 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=1.0 & x2>=1.0 & x4-x2>=2.0\n",
      "   -0.3386 if x2>=2.0 & x3-x1>=1.0\n",
      "   +0.1799 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0851 if x1>=2.0 & x4-x2>=2.0\n",
      "   +0.0862 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x1>=2.0 & x2>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   -0.1800 if x1<=2.0 & x2<=0.0\n",
      "   +0.0204 if x3-x1>=-2.0\n",
      "   -0.8170 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.4702 if x4-x2<=-2.0\n",
      "   -0.3340 if x2>=1.0\n",
      "init state [ 1  2  1 -2  0]\n",
      "(12,) (12,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(23,) (11,)\n",
      "init state [ 2  2 -1 -2  0]\n",
      "(40,) (17,)\n",
      "init state [2 1 0 1 0]\n",
      "(46,) (6,)\n",
      "init state [ 3  1 -1 -1  0]\n",
      "(67,) (21,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(81,) (14,)\n",
      "init state [ 0  2  2 -1  0]\n",
      "(89,) (8,)\n",
      "init state [ 2  1 -1 -1  0]\n",
      "(98,) (9,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(105,) (7,)\n",
      "init state [0 2 0 1 0]\n",
      "(109,) (4,)\n",
      "============ 101 ===========\n",
      "Run episode 101 with rewards 38, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.4109 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.1071 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2355 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.6006 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0088 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.1781 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.1931 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0514 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   +0.0000 if x3-x1<=-3.0\n",
      "   -0.1446 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   -0.2674 if x3-x1<=1.0\n",
      "   +0.0000 if c<=0.0 & x1>=1.0 & x2>=3.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   -0.2519 if c<=0.0 & x1>=2.0 & x2<=0.0\n",
      "   -0.0379 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.5961 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "----------------- 1 --------------\n",
      "   -0.6707 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6707 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3594 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4314 if x4-x2<=1.0\n",
      "   -0.2290 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1802 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1001 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3581 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3713 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0350 if c<=0.0 & x1<=0.0\n",
      "   +0.2318 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.3826 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1529 if x3-x1>=2.0 & x4-x2<=0.0\n",
      "   -0.1179 if c<=0.0 & x2>=1.0\n",
      "   -0.3462 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.2331 if x3-x1>=-1.0\n",
      "----------------- 2 --------------\n",
      "   -0.0986 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.5113 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.1868 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.1868 if x4-x2>=0.0\n",
      "   -0.1868 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4699 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.5113 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.3727 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0310 if x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.4975 if x1>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.4391 if x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c<=0.0 & x4-x2<=-3.0\n",
      "   -0.1171 if x1<=1.0\n",
      "   -0.3201 if x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.2673 if c<=0.0 & x1<=0.0 & x2<=1.0 & x4-x2<=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.5813 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4304 if c>=1.0 & x1>=1.0\n",
      "   +0.7622 if c>=1.0 & x1>=3.0\n",
      "   -0.1940 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0411 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1489 if x2>=2.0 & x3-x1>=1.0\n",
      "   +0.1671 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0000 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.1282 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x1>=2.0 & x2>=1.0 & x2>=2.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.1340 if x1<=2.0 & x2<=0.0\n",
      "   +0.1671 if x3-x1>=-2.0\n",
      "   -0.6431 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.1129 if x4-x2<=-2.0\n",
      "   -0.1776 if x2>=1.0\n",
      "   -0.2796 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "init state [ 1  3  1 -2  0]\n",
      "(9,) (9,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(29,) (20,)\n",
      "init state [1 2 1 1 0]\n",
      "(36,) (7,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(76,) (40,)\n",
      "init state [ 3  2 -2 -1  0]\n",
      "(103,) (27,)\n",
      "init state [ 3  2 -2 -2  0]\n",
      "(121,) (18,)\n",
      "init state [ 3  1 -1  0  0]\n",
      "(129,) (8,)\n",
      "init state [2 0 1 2 0]\n",
      "(135,) (6,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(160,) (25,)\n",
      "init state [1 2 1 1 0]\n",
      "(163,) (3,)\n",
      "============ 102 ===========\n",
      "Run episode 102 with rewards 39, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.5625 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4026 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0611 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.0047 if c<=0.0 & x1>=1.0 & x2>=1.0 & x3-x1>=0.0\n",
      "   -0.0062 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.2150 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.2176 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.2467 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   -0.0755 if x3-x1<=-3.0\n",
      "   -0.1588 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   -0.0705 if x3-x1<=1.0\n",
      "   +0.0106 if x3-x1>=3.0\n",
      "   +0.0375 if c<=0.0 & x1>=2.0 & x2<=0.0\n",
      "   -0.0821 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.4050 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.2758 if x2<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.5929 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.7463 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3825 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3683 if x4-x2<=1.0\n",
      "   -0.3320 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1871 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0319 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2882 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.5426 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0113 if x2<=2.0 & x3-x1<=1.0\n",
      "   -0.6567 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1817 if x3-x1>=2.0 & x4-x2<=0.0\n",
      "   -0.1995 if c<=0.0 & x2>=1.0\n",
      "   -0.1368 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.2740 if x3-x1>=-1.0\n",
      "   -0.2784 if x3-x1>=2.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.1829 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.4223 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3479 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3418 if x4-x2>=0.0\n",
      "   -0.3157 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2778 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.3481 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.2883 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1457 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.1101 if x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +0.3175 if x1>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2734 if x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.1241 if x1<=1.0\n",
      "   -0.2147 if x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x2<=1.0 & x4-x2<=-1.0\n",
      "   -0.5115 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.3867 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.3981 if c>=1.0 & x1>=1.0\n",
      "   +0.7401 if c>=1.0 & x1>=3.0\n",
      "   -0.1651 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1739 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1124 if x2>=2.0 & x3-x1>=1.0\n",
      "   -0.1073 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2694 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.1129 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3928 if x1<=2.0 & x2<=0.0\n",
      "   +0.1635 if x3-x1>=-2.0\n",
      "   -0.4016 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.1959 if x4-x2<=-2.0\n",
      "   +0.1137 if x2>=1.0\n",
      "   -0.0610 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3250 if x1<=0.0\n",
      "init state [ 1  1 -1  0  0]\n",
      "(30,) (30,)\n",
      "init state [1 0 0 3 0]\n",
      "(36,) (6,)\n",
      "init state [ 3  2 -2 -2  0]\n",
      "(74,) (38,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(85,) (11,)\n",
      "init state [0 1 2 0 0]\n",
      "(104,) (19,)\n",
      "init state [ 3  1 -2 -1  0]\n",
      "(113,) (9,)\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(133,) (20,)\n",
      "init state [0 0 2 1 0]\n",
      "(139,) (6,)\n",
      "init state [ 1  0 -1  3  0]\n",
      "(153,) (14,)\n",
      "init state [ 2  0 -2  1  0]\n",
      "(166,) (13,)\n",
      "============ 103 ===========\n",
      "Run episode 103 with rewards 29, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.7148 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4014 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2852 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.2524 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.2179 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.3907 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.0044 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   +0.1203 if x3-x1<=-3.0\n",
      "   +0.1920 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   -0.0560 if x3-x1<=1.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   -0.0071 if c<=0.0 & x1>=2.0 & x2<=0.0\n",
      "   -0.0184 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.7703 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.1303 if x2<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1649 if x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   -0.6070 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5850 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.5038 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2422 if x4-x2<=1.0\n",
      "   +0.1409 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.4004 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0664 if x1>=2.0 & x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0708 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3087 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1928 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0693 if x3-x1>=2.0 & x4-x2<=0.0\n",
      "   -0.3644 if c<=0.0 & x2>=1.0\n",
      "   -0.6140 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.2136 if x3-x1>=-1.0\n",
      "   +0.2176 if x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.5594 if x2<=0.0 & x3-x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   -0.0499 if c<=0.0 & x4-x2>=-2.0\n",
      "   +0.2517 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4029 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4779 if x4-x2>=0.0\n",
      "   -0.1874 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0707 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.4122 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1016 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0562 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2034 if x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2175 if x1>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1398 if x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.2100 if x1<=1.0\n",
      "   +0.1072 if x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.1181 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.6938 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.7133 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.6110 if c>=1.0 & x1>=1.0\n",
      "   +0.5541 if c>=1.0 & x1>=3.0\n",
      "   -0.3673 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3320 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0330 if x2>=2.0 & x3-x1>=1.0\n",
      "   -0.0007 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0000 if x1>=2.0 & x4-x2>=2.0\n",
      "   -0.0318 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0016 if x1<=2.0 & x2<=0.0\n",
      "   +0.1155 if x3-x1>=-2.0\n",
      "   -0.4261 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.1128 if x4-x2<=-2.0\n",
      "   +0.2009 if x2>=1.0\n",
      "   -0.2871 if x1<=0.0\n",
      "   +0.3453 if x4-x2>=3.0\n",
      "init state [1 0 2 2 0]\n",
      "(14,) (14,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(24,) (10,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(41,) (17,)\n",
      "init state [ 2  0 -2  2  0]\n",
      "(58,) (17,)\n",
      "init state [2 0 0 2 0]\n",
      "(64,) (6,)\n",
      "init state [ 2  2 -2  1  0]\n",
      "(70,) (6,)\n",
      "init state [1 1 0 1 0]\n",
      "(76,) (6,)\n",
      "init state [ 2  0 -1  2  0]\n",
      "(84,) (8,)\n",
      "init state [ 2  1 -1 -1  0]\n",
      "(95,) (11,)\n",
      "init state [ 2  2 -2 -1  0]\n",
      "(113,) (18,)\n",
      "============ 104 ===========\n",
      "Run episode 104 with rewards 24, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.5956 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.9330 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0029 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3074 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.1582 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.3119 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0163 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   -0.1023 if x3-x1<=-3.0\n",
      "   -0.2598 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   +0.1981 if x3-x1<=1.0\n",
      "   +0.1040 if c<=0.0 & x1>=2.0 & x2<=0.0\n",
      "   +0.8991 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.7300 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.0000 if x2<=0.0 & x3-x1<=-2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +0.7147 if x1>=3.0 & x2>=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   -0.7724 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.8193 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3268 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1908 if x4-x2<=1.0\n",
      "   +0.0420 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1785 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4752 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2068 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.2883 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0292 if x3-x1>=2.0 & x4-x2<=0.0\n",
      "   -0.1212 if c<=0.0 & x2>=1.0\n",
      "   -0.8582 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.2308 if x3-x1>=-1.0\n",
      "   +0.1102 if x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.4747 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.2783 if x3-x1<=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.6089 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4333 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4333 if x4-x2>=0.0\n",
      "   -0.3882 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4315 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.3730 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1266 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.1293 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0310 if x3-x1>=-1.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2097 if x1>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.4308 if x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.1311 if x1<=1.0\n",
      "   -0.4405 if x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.3789 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.2038 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +0.2996 if x1<=1.0 & x3-x1<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.4585 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7107 if c>=1.0 & x1>=1.0\n",
      "   +0.4169 if c>=1.0 & x1>=3.0\n",
      "   -0.5880 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1975 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1318 if x2>=2.0 & x3-x1>=1.0\n",
      "   +0.0623 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.1672 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2278 if x1<=2.0 & x2<=0.0\n",
      "   +0.2228 if x3-x1>=-2.0\n",
      "   -0.4318 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.0133 if x4-x2<=-2.0\n",
      "   -0.0639 if x2>=1.0\n",
      "   +0.0617 if x1<=0.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   -0.4953 if x1>=3.0\n",
      "init state [ 2  0 -2  0  0]\n",
      "(13,) (13,)\n",
      "init state [ 3  1 -2  2  0]\n",
      "(22,) (9,)\n",
      "init state [ 1  3  0 -2  0]\n",
      "(43,) (21,)\n",
      "init state [ 1  2  0 -2  0]\n",
      "(66,) (23,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(72,) (6,)\n",
      "init state [0 0 2 0 0]\n",
      "(84,) (12,)\n",
      "init state [2 0 0 1 0]\n",
      "(103,) (19,)\n",
      "init state [1 1 1 0 0]\n",
      "(115,) (12,)\n",
      "init state [ 2  2  1 -1  0]\n",
      "(136,) (21,)\n",
      "init state [2 0 1 1 0]\n",
      "(141,) (5,)\n",
      "============ 105 ===========\n",
      "Run episode 105 with rewards 37, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.6021 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.3169 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0982 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.1162 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.5163 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.1842 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.1128 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   +0.1533 if x3-x1<=-3.0\n",
      "   +0.0494 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   +0.0621 if x3-x1<=1.0\n",
      "   -0.0309 if c<=0.0 & x1>=2.0 & x2<=0.0\n",
      "   +0.1505 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.6935 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +0.3094 if x1>=3.0 & x2>=1.0\n",
      "   +0.4537 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   -0.7838 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6281 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3074 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0686 if x4-x2<=1.0\n",
      "   +0.1442 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1401 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4227 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3903 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0616 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.1887 if c<=0.0 & x2>=1.0\n",
      "   -0.7177 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3277 if x3-x1>=-1.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.0208 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.0040 if x3-x1<=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0958 if c>=1.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.4586 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4374 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4374 if x4-x2>=0.0\n",
      "   -0.2491 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2452 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.4586 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.2135 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0766 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.0465 if x1>=1.0 & x2>=2.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.6361 if x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.1080 if x1<=1.0\n",
      "   -0.2181 if x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.3254 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1185 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +0.1548 if x1<=1.0 & x3-x1<=0.0\n",
      "   -0.3006 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.2332 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7268 if c>=1.0 & x1>=1.0\n",
      "   +0.5541 if c>=1.0 & x1>=3.0\n",
      "   -0.2870 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3480 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0411 if x2>=2.0 & x3-x1>=1.0\n",
      "   +0.4777 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0594 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2511 if x1<=2.0 & x2<=0.0\n",
      "   +0.1399 if x3-x1>=-2.0\n",
      "   -0.3347 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.0029 if x4-x2<=-2.0\n",
      "   -0.2117 if x2>=1.0\n",
      "   -0.3154 if x1<=0.0\n",
      "   +0.1843 if x1>=3.0\n",
      "   -0.5071 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "init state [ 2  2  1 -1  0]\n",
      "(11,) (11,)\n",
      "init state [0 0 2 1 0]\n",
      "(17,) (6,)\n",
      "init state [0 1 2 0 0]\n",
      "(32,) (15,)\n",
      "init state [ 2  3 -2  0  0]\n",
      "(44,) (12,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(57,) (13,)\n",
      "init state [ 0  2  2 -2  0]\n",
      "(79,) (22,)\n",
      "init state [ 0  2  2 -2  0]\n",
      "(112,) (33,)\n",
      "init state [ 3  1 -3 -1  0]\n",
      "(141,) (29,)\n",
      "init state [ 3  2  0 -2  0]\n",
      "(148,) (7,)\n",
      "init state [0 2 3 0 0]\n",
      "(152,) (4,)\n",
      "============ 106 ===========\n",
      "Run episode 106 with rewards 38, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.3502 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.6949 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0199 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1389 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.4762 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.2910 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.2851 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   +0.0191 if x3-x1<=-3.0\n",
      "   -0.2305 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   +0.0540 if x3-x1<=1.0\n",
      "   +0.1603 if c<=0.0 & x1>=2.0 & x2<=0.0\n",
      "   +0.1764 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.5454 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.2224 if x1>=3.0 & x2>=1.0\n",
      "   +0.3168 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2552 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "----------------- 1 --------------\n",
      "   -0.1906 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5717 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.6691 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4539 if x4-x2<=1.0\n",
      "   +0.2300 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2798 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2234 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2183 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2302 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.3948 if c<=0.0 & x2>=1.0\n",
      "   -0.7697 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.5748 if x3-x1>=-1.0\n",
      "   +0.4129 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.1175 if x3-x1<=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1095 if c>=1.0 & x3-x1<=1.0 & x3-x1>=0.0\n",
      "   -0.3392 if x1>=1.0 & x2<=1.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.8275 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4477 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4477 if x4-x2>=0.0\n",
      "   -0.4477 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1910 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.8085 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.2760 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0335 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.4829 if x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.2484 if x1<=1.0\n",
      "   -0.0654 if x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.3267 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x2<=2.0 & x2>=1.0 & x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.0091 if x1<=1.0 & x3-x1<=0.0\n",
      "   -0.1996 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0919 if x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.2268 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.7715 if c>=1.0 & x1>=1.0\n",
      "   +0.4867 if c>=1.0 & x1>=3.0\n",
      "   -0.0446 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1109 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0394 if x2>=2.0 & x3-x1>=1.0\n",
      "   -0.1916 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.2170 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1025 if x1<=2.0 & x2<=0.0\n",
      "   -0.1916 if x3-x1>=-2.0\n",
      "   -0.3400 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.2499 if x2>=1.0\n",
      "   -0.2979 if x1<=0.0\n",
      "   +0.1162 if x1>=3.0\n",
      "   -0.3148 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.7690 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "init state [0 0 3 2 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(14,) (14,)\n",
      "init state [ 2  1 -2  1  0]\n",
      "(45,) (31,)\n",
      "init state [ 3  2 -3  1  0]\n",
      "(64,) (19,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(84,) (20,)\n",
      "init state [1 0 0 3 0]\n",
      "(105,) (21,)\n",
      "init state [ 2  1 -2  2  0]\n",
      "(113,) (8,)\n",
      "init state [ 3  2 -3  1  0]\n",
      "(127,) (14,)\n",
      "init state [0 0 2 1 0]\n",
      "(137,) (10,)\n",
      "init state [ 2  1 -2  1  0]\n",
      "(150,) (13,)\n",
      "init state [ 1  3 -1 -1  0]\n",
      "(165,) (15,)\n",
      "============ 107 ===========\n",
      "Run episode 107 with rewards 27, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.0388 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.9432 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0301 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   +0.4241 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.7384 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.1706 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.2746 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   -0.2985 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   -0.4539 if x3-x1<=1.0\n",
      "   +0.0000 if c<=0.0 & x1>=2.0 & x2<=0.0\n",
      "   +0.1033 if x1>=3.0 & x4-x2>=1.0\n",
      "   -0.0193 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.0280 if x1>=3.0 & x2>=1.0\n",
      "   +0.0177 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2517 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.4982 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   +0.0675 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5784 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.4317 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0081 if x4-x2<=1.0\n",
      "   +0.0526 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3613 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1000 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.3548 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0603 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.3314 if c<=0.0 & x2>=1.0\n",
      "   -0.7345 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3074 if x3-x1>=-1.0\n",
      "   -0.1223 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.2113 if x3-x1<=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2772 if x1>=1.0 & x2<=1.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.6060 if x3-x1>=3.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.5676 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4699 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4691 if x4-x2>=0.0\n",
      "   -0.2728 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2066 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.7209 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1494 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.2033 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.2941 if x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   +0.1768 if x1<=1.0\n",
      "   +0.1932 if x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.2486 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1395 if x1<=1.0 & x3-x1<=0.0\n",
      "   -0.1994 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2722 if x4-x2>=1.0\n",
      "   -0.3526 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.0089 if c<=0.0 & x3-x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4547 if c>=1.0 & x1>=1.0\n",
      "   +0.4233 if c>=1.0 & x1>=3.0\n",
      "   +0.3366 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3610 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3612 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.1512 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.4410 if x1<=2.0 & x2<=0.0\n",
      "   +0.4958 if x3-x1>=-2.0\n",
      "   -0.1688 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.2686 if x2>=1.0\n",
      "   +0.0994 if x1<=0.0\n",
      "   +0.2386 if x1>=3.0\n",
      "   -0.2963 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.6420 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.2263 if x2<=1.0 & x3-x1>=3.0\n",
      "init state [1 0 2 1 0]\n",
      "(7,) (7,)\n",
      "init state [0 2 2 1 0]\n",
      "(12,) (5,)\n",
      "init state [ 3  0 -2  3  0]\n",
      "(19,) (7,)\n",
      "init state [1 0 1 0 0]\n",
      "(26,) (7,)\n",
      "init state [ 1  3 -1 -1  0]\n",
      "(38,) (12,)\n",
      "init state [ 2  1 -1  2  0]\n",
      "(47,) (9,)\n",
      "init state [ 2  1 -2  0  0]\n",
      "(62,) (15,)\n",
      "init state [ 3  1 -1  2  0]\n",
      "(69,) (7,)\n",
      "init state [ 3  1 -1 -1  0]\n",
      "(78,) (9,)\n",
      "init state [ 3  1 -2  2  0]\n",
      "(86,) (8,)\n",
      "============ 108 ===========\n",
      "Run episode 108 with rewards 34, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.4139 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.9336 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5806 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1949 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.1622 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.1191 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.0826 if x3-x1<=-2.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2<=2.0\n",
      "   -0.3455 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   -0.1654 if x3-x1<=1.0\n",
      "   +0.1192 if x1>=3.0 & x4-x2>=1.0\n",
      "   -0.2036 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.2148 if x1>=3.0 & x2>=1.0\n",
      "   +0.0842 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2008 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.1774 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.3623 if x3-x1<=-2.0 & x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   -0.2821 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0643 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3473 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0163 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.3348 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4101 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.0617 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.0723 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.6954 if c<=0.0 & x2>=1.0\n",
      "   -0.7164 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.6763 if x3-x1>=-1.0\n",
      "   +0.5958 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.0803 if x3-x1<=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1585 if x1>=1.0 & x2<=1.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.0000 if x3-x1>=3.0 & x4-x2>=0.0\n",
      "   +0.9975 if c<=0.0 & x1>=3.0 & x2<=1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.4089 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5655 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.2796 if x4-x2>=0.0\n",
      "   -0.7944 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2578 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.3077 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.5718 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1039 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0125 if x3-x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.1086 if x1<=1.0\n",
      "   -0.0993 if x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.0751 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1278 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0158 if x4-x2>=1.0\n",
      "   -0.0831 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1977 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4089 if c>=1.0 & x1>=1.0\n",
      "   +0.7583 if c>=1.0 & x1>=3.0\n",
      "   -0.1040 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.4329 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.7294 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2973 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0126 if x1<=2.0 & x2<=0.0\n",
      "   +0.2546 if x3-x1>=-2.0\n",
      "   -0.4456 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.4124 if x2>=1.0\n",
      "   +0.4406 if x1<=0.0\n",
      "   -0.0956 if x1>=3.0\n",
      "   -0.4028 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5312 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0000 if x2<=1.0 & x3-x1>=3.0\n",
      "   -0.2565 if x1<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "init state [ 0  2  2 -1  0]\n",
      "(8,) (8,)\n",
      "init state [0 1 1 2 0]\n",
      "(15,) (7,)\n",
      "init state [0 0 2 3 0]\n",
      "(30,) (15,)\n",
      "init state [ 0  2  1 -2  0]\n",
      "(67,) (37,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(107,) (40,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(123,) (16,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(129,) (6,)\n",
      "init state [2 0 1 1 0]\n",
      "(133,) (4,)\n",
      "init state [ 0  2  3 -1  0]\n",
      "(148,) (15,)\n",
      "init state [0 2 3 0 0]\n",
      "(153,) (5,)\n",
      "============ 109 ===========\n",
      "Run episode 109 with rewards 37, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.4620 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.6778 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3226 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3322 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.5286 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.4193 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.1857 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   +0.1670 if x3-x1<=1.0\n",
      "   -0.0839 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.6745 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.0355 if x1>=3.0 & x2>=1.0\n",
      "   +0.0484 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.0590 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0218 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   -0.0000 if x3-x1<=-2.0 & x4-x2>=3.0\n",
      "   -0.0776 if x3-x1<=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.8308 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5105 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.8319 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2804 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.1248 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3025 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2180 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.2523 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.0460 if c<=0.0 & x2>=1.0\n",
      "   -0.8397 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.0792 if x3-x1>=-1.0\n",
      "   +0.2654 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.2295 if x3-x1<=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0653 if x1>=1.0 & x2<=1.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.1527 if c<=0.0 & x1>=3.0 & x2<=1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   -0.4301 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.9696 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3390 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3658 if x4-x2>=0.0\n",
      "   -0.7787 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0637 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   -0.1442 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.2344 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0219 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.2663 if x1<=1.0\n",
      "   +0.2436 if x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.3614 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.6147 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.2420 if x4-x2>=1.0\n",
      "   +0.1032 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3993 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.1720 if x3-x1>=3.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.6098 if c>=1.0 & x1>=1.0\n",
      "   +0.8335 if c>=1.0 & x1>=3.0\n",
      "   +0.2734 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2448 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0895 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2160 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1225 if x1<=2.0 & x2<=0.0\n",
      "   -0.1501 if x3-x1>=-2.0\n",
      "   -0.7438 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.5103 if x2>=1.0\n",
      "   -0.0742 if x1<=0.0\n",
      "   +0.4451 if x1>=3.0\n",
      "   -0.4122 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.6572 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.2610 if x1<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +1.1245 if x1<=1.0 & x1>=1.0 & x4-x2>=1.0\n",
      "init state [1 1 1 0 0]\n",
      "(4,) (4,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(13,) (9,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(19,) (6,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(29,) (10,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(57,) (28,)\n",
      "init state [ 1  1 -1  0  0]\n",
      "(68,) (11,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(80,) (12,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(102,) (22,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(117,) (15,)\n",
      "init state [ 2  2 -2 -1  0]\n",
      "(134,) (17,)\n",
      "============ 110 ===========\n",
      "Run episode 110 with rewards 25, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.4339 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.7105 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0717 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.3414 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.1689 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2605 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.0598 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   +0.0529 if x3-x1<=1.0\n",
      "   -0.0951 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.3734 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.1279 if x1>=3.0 & x2>=1.0\n",
      "   +0.1491 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3370 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0785 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   -0.0357 if x3-x1<=-2.0\n",
      "   -0.3613 if x4-x2<=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.6352 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2862 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2052 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.0330 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5180 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.5282 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.6934 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0219 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.3248 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.0843 if x3-x1>=-1.0\n",
      "   +0.0000 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.3077 if x3-x1<=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3403 if x1>=1.0 & x2<=1.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.0000 if c<=0.0 & x1>=3.0 & x2<=1.0 & x4-x2<=1.0 & x4-x2<=2.0\n",
      "   +0.0000 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.4706 if x3-x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.7279 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.1735 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.2007 if x4-x2>=0.0\n",
      "   -0.5155 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2156 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.6303 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0330 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.6773 if x1<=1.0\n",
      "   -0.0410 if x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.4449 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.4235 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0632 if x4-x2>=1.0\n",
      "   +0.0624 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3036 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.0000 if x3-x1>=3.0 & x4-x2<=-1.0\n",
      "   +0.6662 if x2<=0.0 & x3-x1<=-3.0 & x4-x2<=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.5618 if c>=1.0 & x1>=1.0\n",
      "   +0.5508 if c>=1.0 & x1>=3.0\n",
      "   -0.0958 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0143 if x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.2093 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0624 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3515 if x1<=2.0 & x2<=0.0\n",
      "   -0.0898 if x3-x1>=-2.0\n",
      "   -0.8812 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.2051 if x2>=1.0\n",
      "   +0.1243 if x1>=3.0\n",
      "   +0.2578 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5860 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.0291 if x1<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.8070 if x1<=1.0 & x1>=1.0 & x4-x2>=1.0\n",
      "   -0.3447 if x1<=0.0 & x2>=2.0 & x4-x2>=1.0\n",
      "init state [ 3  2 -2  0  0]\n",
      "(16,) (16,)\n",
      "init state [ 1  2  0 -2  0]\n",
      "(23,) (7,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(45,) (22,)\n",
      "init state [ 2  1 -2  2  0]\n",
      "(63,) (18,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(84,) (21,)\n",
      "init state [0 0 1 3 0]\n",
      "(98,) (14,)\n",
      "init state [ 3  0 -1  3  0]\n",
      "(116,) (18,)\n",
      "init state [ 0  1  3 -1  0]\n",
      "(141,) (25,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(164,) (23,)\n",
      "init state [ 1  1  0 -1  0]\n",
      "(170,) (6,)\n",
      "============ 111 ===========\n",
      "Run episode 111 with rewards 36, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.4643 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.1184 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0206 if x3-x1>=1.0 & x4-x2>=-1.0\n",
      "   -0.1976 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.1407 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.1010 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.4216 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   +0.0872 if x3-x1<=1.0\n",
      "   +0.1352 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.8987 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.1750 if x1>=3.0 & x2>=1.0\n",
      "   +0.0629 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.7541 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0327 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   -0.4385 if x4-x2<=1.0\n",
      "   -0.2863 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1<=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.5536 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3931 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2150 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.0400 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.5703 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2485 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.6259 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0118 if x1>=1.0 & x2>=1.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   -0.7434 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3586 if x3-x1>=-1.0\n",
      "   -0.2753 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.3868 if x3-x1<=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3152 if x1>=1.0 & x2<=1.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.1901 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2039 if x3-x1>=1.0\n",
      "   +0.7322 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2<=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.5560 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.1773 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.2773 if x4-x2>=0.0\n",
      "   +0.1321 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0178 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.6738 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.3014 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.2297 if x1<=1.0\n",
      "   -0.5153 if x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.2532 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.5029 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0454 if x4-x2>=1.0\n",
      "   -0.1378 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3188 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.0133 if x2<=0.0 & x3-x1<=-3.0 & x4-x2<=2.0\n",
      "   -0.4655 if x1<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.8132 if c>=1.0 & x1>=1.0\n",
      "   +0.4179 if c>=1.0 & x1>=3.0\n",
      "   -0.0849 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.4484 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.1696 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.5070 if x1<=2.0 & x2<=0.0\n",
      "   -0.1830 if x3-x1>=-2.0\n",
      "   -0.5297 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.0224 if x2>=1.0\n",
      "   +0.1930 if x1>=3.0\n",
      "   -0.0054 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +0.5950 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0946 if x1<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.1268 if x1<=1.0 & x1>=1.0 & x4-x2>=1.0\n",
      "   -0.2545 if x1<=0.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   +0.6218 if x1>=3.0 & x3-x1<=-2.0\n",
      "init state [0 0 2 1 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(9,) (9,)\n",
      "init state [2 1 0 2 0]\n",
      "(14,) (5,)\n",
      "init state [0 2 1 0 0]\n",
      "(20,) (6,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(29,) (9,)\n",
      "init state [0 1 1 1 0]\n",
      "(42,) (13,)\n",
      "init state [ 1  2 -1  1  0]\n",
      "(80,) (38,)\n",
      "init state [1 2 2 0 0]\n",
      "(91,) (11,)\n",
      "init state [0 0 3 1 0]\n",
      "(109,) (18,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(113,) (4,)\n",
      "init state [0 0 2 1 0]\n",
      "(124,) (11,)\n",
      "============ 112 ===========\n",
      "Run episode 112 with rewards 31, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.0512 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5313 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2911 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.3574 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.1296 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.2577 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   -0.1425 if x3-x1<=1.0\n",
      "   +0.3652 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.3071 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.1117 if x1>=3.0 & x2>=1.0\n",
      "   +0.0325 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1343 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0302 if x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   -0.2996 if x4-x2<=1.0\n",
      "   +0.1357 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1<=0.0\n",
      "   +0.4960 if x1>=2.0 & x2>=1.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.5889 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1947 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2637 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.0023 if x2<=2.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.6324 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2584 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.4608 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0130 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.2241 if x3-x1>=-1.0\n",
      "   +0.0300 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.4221 if x3-x1<=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3179 if x1>=1.0 & x2<=1.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.2076 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.3515 if x3-x1>=1.0\n",
      "   +0.5753 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.6221 if x2<=2.0 & x3-x1<=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.7699 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4055 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4777 if x4-x2>=0.0\n",
      "   -0.0925 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1458 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.7699 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.3077 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.0651 if x1<=1.0\n",
      "   -0.2323 if x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.1030 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.4410 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1818 if x4-x2>=1.0\n",
      "   +0.1174 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2323 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.0000 if x1<=0.0 & x2<=1.0 & x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.3474 if x1<=1.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3249 if c>=1.0 & x1>=1.0\n",
      "   +0.1883 if c>=1.0 & x1>=3.0\n",
      "   -0.2945 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3758 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0723 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2698 if x1<=2.0 & x2<=0.0\n",
      "   +0.3542 if x3-x1>=-2.0\n",
      "   -0.2299 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.0697 if x2>=1.0\n",
      "   -0.1033 if x1>=3.0\n",
      "   +0.7668 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.1314 if x1<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.3249 if x1<=1.0 & x1>=1.0 & x4-x2>=1.0\n",
      "   -0.0756 if x1<=0.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   +0.0558 if x1>=3.0 & x3-x1<=-2.0\n",
      "   -0.5911 if x1<=2.0 & x2>=1.0 & x3-x1<=0.0\n",
      "init state [0 0 3 1 0]\n",
      "(12,) (12,)\n",
      "init state [ 2  2 -2  1  0]\n",
      "(20,) (8,)\n",
      "init state [ 1  3  1 -2  0]\n",
      "(28,) (8,)\n",
      "init state [ 0  3  0 -1  0]\n",
      "(37,) (9,)\n",
      "init state [ 0  2  0 -1  0]\n",
      "(70,) (33,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(78,) (8,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(94,) (16,)\n",
      "init state [2 1 0 1 0]\n",
      "(97,) (3,)\n",
      "init state [0 0 2 1 0]\n",
      "(115,) (18,)\n",
      "init state [0 0 0 3 0]\n",
      "(124,) (9,)\n",
      "============ 113 ===========\n",
      "Run episode 113 with rewards 33, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.3047 if c>=1.0 & x3-x1<=1.0\n",
      "   +1.0755 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1165 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.1940 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.0725 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.1381 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   -0.1752 if x3-x1<=1.0\n",
      "   -0.0236 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.0475 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.4262 if x1>=3.0 & x2>=1.0\n",
      "   +0.0325 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2976 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.2675 if x4-x2<=1.0\n",
      "   -0.1064 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1<=0.0\n",
      "   +0.0000 if x1>=2.0 & x2>=1.0 & x2>=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=1.0\n",
      "   +0.1604 if x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   -0.4632 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4425 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1371 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3185 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.7509 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.4623 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.3649 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.0980 if x3-x1>=-1.0\n",
      "   -0.0677 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.0211 if x3-x1<=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1368 if x1>=1.0 & x2<=1.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.2611 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2480 if x3-x1>=1.0\n",
      "   +0.0363 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.3788 if x2<=2.0 & x3-x1<=2.0\n",
      "   +0.8010 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.6443 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2841 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4283 if x4-x2>=0.0\n",
      "   -0.1996 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0754 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.8080 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0981 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.1619 if x1<=1.0\n",
      "   +0.0330 if x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.4373 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.5220 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0359 if x4-x2>=1.0\n",
      "   +0.1491 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0582 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.1837 if x1<=1.0 & x4-x2>=-1.0\n",
      "   -0.2782 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3299 if c>=1.0 & x1>=1.0\n",
      "   +0.4273 if c>=1.0 & x1>=3.0\n",
      "   -0.0762 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2850 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.3181 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3158 if x1<=2.0 & x2<=0.0\n",
      "   +0.1583 if x3-x1>=-2.0\n",
      "   -0.8044 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.1587 if x2>=1.0\n",
      "   +0.1229 if x1>=3.0\n",
      "   +0.6748 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0000 if x1<=0.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.5910 if x1<=1.0 & x1>=1.0 & x4-x2>=1.0\n",
      "   +0.3906 if x1<=0.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.2498 if x1<=2.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.0751 if x4-x2>=3.0\n",
      "init state [0 0 3 1 0]\n",
      "(16,) (16,)\n",
      "init state [ 0  3  2 -3  0]\n",
      "(36,) (20,)\n",
      "init state [ 2  3  0 -3  0]\n",
      "(46,) (10,)\n",
      "init state [0 0 2 0 0]\n",
      "(58,) (12,)\n",
      "init state [ 3  0 -1  2  0]\n",
      "(77,) (19,)\n",
      "init state [ 2  1  1 -1  0]\n",
      "(82,) (5,)\n",
      "init state [0 0 2 3 0]\n",
      "(90,) (8,)\n",
      "init state [1 0 1 2 0]\n",
      "(112,) (22,)\n",
      "init state [ 3  2 -1 -1  0]\n",
      "(117,) (5,)\n",
      "init state [1 0 2 0 0]\n",
      "(139,) (22,)\n",
      "============ 114 ===========\n",
      "Run episode 114 with rewards 20, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.3064 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5764 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1068 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.1922 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0963 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.2512 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   -0.3021 if x3-x1<=1.0\n",
      "   +0.0897 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.6321 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.0125 if x1>=3.0 & x2>=1.0\n",
      "   +0.0141 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.3567 if x4-x2<=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x2<=1.0 & x3-x1<=0.0\n",
      "   -0.1064 if x4-x2>=3.0\n",
      "   +0.1844 if x4-x2<=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.2662 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.2997 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.6314 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3678 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3594 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.0030 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1809 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.1903 if x3-x1>=-1.0\n",
      "   +0.2245 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.0034 if x1>=1.0 & x2<=1.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.2710 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.1720 if x3-x1>=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.3341 if x2<=2.0 & x3-x1<=2.0\n",
      "   -0.0310 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   +0.2715 if x1>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.4820 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3899 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4395 if x4-x2>=0.0\n",
      "   -0.2302 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2475 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.6429 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.2001 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.0387 if x1<=1.0\n",
      "   +0.3490 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.6269 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.5078 if x4-x2>=1.0\n",
      "   +0.2037 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1271 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.0004 if x1<=1.0 & x4-x2>=-1.0\n",
      "   +0.1436 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.4847 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.6431 if c>=1.0 & x1>=1.0\n",
      "   +0.6522 if c>=1.0 & x1>=3.0\n",
      "   -0.5316 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2395 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.3442 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3457 if x1<=2.0 & x2<=0.0\n",
      "   +0.2455 if x3-x1>=-2.0\n",
      "   -0.3847 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.1468 if x2>=1.0\n",
      "   +0.1857 if x1>=3.0\n",
      "   +0.0787 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.0750 if x1<=1.0 & x1>=1.0 & x4-x2>=1.0\n",
      "   +0.3776 if x1<=0.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.3796 if x1<=2.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.2792 if x4-x2>=3.0\n",
      "   -0.0431 if x1<=0.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "init state [ 2  1 -1  1  0]\n",
      "(9,) (9,)\n",
      "init state [1 2 1 1 0]\n",
      "(13,) (4,)\n",
      "init state [ 2  3  1 -3  0]\n",
      "(21,) (8,)\n",
      "init state [ 0  2  2 -1  0]\n",
      "(32,) (11,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(49,) (17,)\n",
      "init state [0 0 3 0 0]\n",
      "(63,) (14,)\n",
      "init state [ 1  3 -1 -1  0]\n",
      "(103,) (40,)\n",
      "init state [1 1 1 0 0]\n",
      "(110,) (7,)\n",
      "init state [ 3  2 -3  0  0]\n",
      "(147,) (37,)\n",
      "init state [2 0 0 1 0]\n",
      "(154,) (7,)\n",
      "============ 115 ===========\n",
      "Run episode 115 with rewards 35, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.3829 if c>=1.0 & x3-x1<=1.0\n",
      "   +1.3159 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0041 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.0903 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0210 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.1501 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   -0.1035 if x3-x1<=1.0\n",
      "   -0.4301 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.2409 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.4463 if x1>=3.0 & x2>=1.0\n",
      "   +0.0422 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6102 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.2749 if x4-x2<=1.0\n",
      "   -0.0000 if x4-x2>=3.0\n",
      "   -0.5305 if x4-x2<=2.0\n",
      "   +0.8594 if x3-x1<=-3.0\n",
      "----------------- 1 --------------\n",
      "   -0.7603 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3302 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.5909 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3700 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0878 if x3-x1<=2.0 & x4-x2<=0.0\n",
      "   +0.2299 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.4942 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.2300 if x3-x1>=-1.0\n",
      "   +0.2822 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.3309 if x1>=1.0 & x2<=1.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   +0.4040 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0912 if x3-x1>=1.0\n",
      "   +0.2633 if x2<=2.0 & x3-x1<=2.0\n",
      "   -0.1345 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.1620 if x1>=2.0\n",
      "   -0.4806 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.7088 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4540 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4540 if x4-x2>=0.0\n",
      "   -0.3614 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3559 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.2307 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.2081 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1369 if x1<=1.0\n",
      "   +0.3530 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.4696 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0098 if x4-x2>=1.0\n",
      "   +0.4010 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3860 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.5402 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +0.1640 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.0855 if c<=0.0 & x3-x1<=-3.0\n",
      "----------------- 3 --------------\n",
      "   +0.9717 if c>=1.0 & x1>=1.0\n",
      "   +0.9124 if c>=1.0 & x1>=3.0\n",
      "   +0.2682 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.2633 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.1464 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2209 if x1<=2.0 & x2<=0.0\n",
      "   +0.7784 if x3-x1>=-2.0\n",
      "   -0.3326 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.5723 if x2>=1.0\n",
      "   -0.1075 if x1>=3.0\n",
      "   -0.6893 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.3049 if x1<=1.0 & x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1<=0.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.3764 if x1<=2.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +0.3336 if x2<=1.0 & x3-x1>=2.0\n",
      "init state [ 1  3 -1 -1  0]\n",
      "(10,) (10,)\n",
      "init state [ 2  0 -1  1  0]\n",
      "(18,) (8,)\n",
      "init state [0 0 3 1 0]\n",
      "(29,) (11,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(34,) (5,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(40,) (6,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(49,) (9,)\n",
      "init state [ 1  3  2 -1  0]\n",
      "(53,) (4,)\n",
      "init state [ 1  2  1 -1  0]\n",
      "(58,) (5,)\n",
      "init state [ 3  2 -3 -2  0]\n",
      "(90,) (32,)\n",
      "init state [1 2 0 1 0]\n",
      "(119,) (29,)\n",
      "============ 116 ===========\n",
      "Run episode 116 with rewards 13, accuracy 0.3\n",
      "----------------- 0 --------------\n",
      "   -0.6753 if c>=1.0 & x3-x1<=1.0\n",
      "   +1.3291 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3008 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.3489 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.5439 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.0093 if c<=0.0 & x1<=0.0 & x2>=2.0\n",
      "   -0.0384 if x3-x1<=1.0\n",
      "   -0.3342 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.2085 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.1629 if x1>=3.0 & x2>=1.0\n",
      "   -0.1461 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2129 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.1123 if x4-x2<=1.0\n",
      "   -0.2840 if x4-x2<=2.0\n",
      "   -0.0969 if x3-x1<=-3.0\n",
      "   +0.1864 if x1>=3.0 & x2<=0.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.5611 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5367 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.5251 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1026 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3466 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.3680 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3650 if x3-x1>=-1.0\n",
      "   +0.3828 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.0261 if x1>=1.0 & x2<=1.0 & x3-x1<=1.0 & x4-x2>=0.0\n",
      "   -0.2414 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.2866 if x3-x1>=1.0\n",
      "   +0.0625 if x2<=2.0 & x3-x1<=2.0\n",
      "   +0.1447 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.0570 if x1>=2.0\n",
      "   -0.0740 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.2950 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.3288 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5222 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.5222 if x4-x2>=0.0\n",
      "   -0.3787 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1687 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.1201 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.3401 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.3641 if x1<=1.0\n",
      "   +0.3198 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3345 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.2824 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0507 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.3220 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +0.2281 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.0067 if c<=0.0 & x3-x1<=-3.0\n",
      "   +0.0592 if x2<=0.0\n",
      "----------------- 3 --------------\n",
      "   +1.0332 if c>=1.0 & x1>=1.0\n",
      "   +0.6960 if c>=1.0 & x1>=3.0\n",
      "   -0.1051 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0048 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0444 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2652 if x1<=2.0 & x2<=0.0\n",
      "   +0.0034 if x3-x1>=-2.0\n",
      "   -0.6204 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.1739 if x2>=1.0\n",
      "   +0.5430 if x1>=3.0\n",
      "   -0.4483 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0565 if x1<=1.0 & x1>=1.0 & x4-x2>=1.0\n",
      "   -0.0240 if x1<=0.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.2285 if x1<=2.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.1116 if x2<=1.0 & x3-x1>=2.0\n",
      "   -0.3258 if x4-x2<=0.0\n",
      "init state [ 3  2 -2 -1  0]\n",
      "(7,) (7,)\n",
      "init state [ 1  3  2 -1  0]\n",
      "(17,) (10,)\n",
      "init state [0 1 1 0 0]\n",
      "(25,) (8,)\n",
      "init state [1 1 0 1 0]\n",
      "(38,) (13,)\n",
      "init state [ 2  3  1 -2  0]\n",
      "(49,) (11,)\n",
      "init state [ 2  3 -2  0  0]\n",
      "(54,) (5,)\n",
      "init state [ 2  2 -1  1  0]\n",
      "(69,) (15,)\n",
      "init state [ 3  2  0 -1  0]\n",
      "(73,) (4,)\n",
      "init state [1 1 1 2 0]\n",
      "(90,) (17,)\n",
      "init state [ 2  3 -2 -3  0]\n",
      "(105,) (15,)\n",
      "============ 117 ===========\n",
      "Run episode 117 with rewards 27, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.6733 if c>=1.0 & x3-x1<=1.0\n",
      "   +1.0368 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4921 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.1051 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.3804 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.0070 if x3-x1<=1.0\n",
      "   +0.0255 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.9595 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.1307 if x1>=3.0 & x2>=1.0\n",
      "   -0.1686 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1023 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0219 if x4-x2<=1.0\n",
      "   +0.0523 if x4-x2<=2.0\n",
      "   -0.0254 if x3-x1<=-3.0\n",
      "   +0.0413 if x1>=3.0 & x2<=0.0 & x4-x2>=1.0\n",
      "   -0.2656 if x1>=3.0 & x2<=2.0 & x2>=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   -0.8395 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5388 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2974 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3622 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4819 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2784 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.1770 if x3-x1>=-1.0\n",
      "   +0.0726 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.0368 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.6191 if x3-x1>=1.0\n",
      "   +0.1436 if x2<=2.0 & x3-x1<=2.0\n",
      "   +0.0000 if x2<=1.0 & x3-x1>=2.0 & x4-x2<=0.0 & x4-x2>=0.0\n",
      "   -0.4186 if x1>=2.0\n",
      "   +0.1947 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.3516 if x3-x1>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.3431 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2995 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.2660 if x4-x2>=0.0\n",
      "   -0.4974 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0963 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.0608 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.2232 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0436 if x1<=1.0\n",
      "   -0.1443 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.2336 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.4731 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1658 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.4344 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.3083 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.0626 if x2<=0.0\n",
      "   -0.2334 if x1>=3.0 & x2>=3.0\n",
      "----------------- 3 --------------\n",
      "   +0.8285 if c>=1.0 & x1>=1.0\n",
      "   +0.7989 if c>=1.0 & x1>=3.0\n",
      "   -0.2592 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1898 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1119 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2049 if x1<=2.0 & x2<=0.0\n",
      "   -0.4853 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.0521 if x2>=1.0\n",
      "   +0.0365 if x1>=3.0\n",
      "   -0.3032 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.0978 if x1<=1.0 & x1>=1.0 & x4-x2>=1.0\n",
      "   -0.0995 if x1<=0.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.0571 if x1<=2.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.0000 if x2<=1.0 & x3-x1>=2.0\n",
      "   -0.2211 if x4-x2<=0.0\n",
      "   +0.6257 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "init state [1 0 2 0 0]\n",
      "(21,) (21,)\n",
      "init state [1 0 1 0 0]\n",
      "(44,) (23,)\n",
      "init state [0 0 1 0 0]\n",
      "(53,) (9,)\n",
      "init state [2 1 1 1 0]\n",
      "(62,) (9,)\n",
      "init state [ 0  3  0 -2  0]\n",
      "(78,) (16,)\n",
      "init state [ 3  0 -2  2  0]\n",
      "(96,) (18,)\n",
      "init state [ 2  1 -2  1  0]\n",
      "(115,) (19,)\n",
      "init state [ 3  1 -2  1  0]\n",
      "(135,) (20,)\n",
      "init state [ 2  2  0 -2  0]\n",
      "(143,) (8,)\n",
      "init state [ 1  0 -1  2  0]\n",
      "(154,) (11,)\n",
      "============ 118 ===========\n",
      "Run episode 118 with rewards 31, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.4571 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.3463 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4209 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.1774 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2495 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.1811 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.3130 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.3227 if x1>=3.0 & x2>=1.0\n",
      "   +0.2186 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4677 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.2535 if x4-x2<=1.0\n",
      "   +0.0576 if x4-x2<=2.0\n",
      "   -0.0987 if x3-x1<=-3.0\n",
      "   +0.1854 if x1>=3.0 & x2<=0.0 & x4-x2>=1.0\n",
      "   -0.3227 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   +0.4697 if x1<=0.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.7556 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.9220 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3849 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2361 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4876 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.3466 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.2844 if x3-x1>=-1.0\n",
      "   -0.2078 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.0000 if x1<=1.0 & x1>=1.0 & x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.5425 if x3-x1>=1.0\n",
      "   +0.1958 if x2<=2.0 & x3-x1<=2.0\n",
      "   +0.0265 if x1>=2.0\n",
      "   +0.5828 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0841 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.0841 if x3-x1>=2.0\n",
      "   -0.2498 if c<=0.0 & x1<=0.0 & x2<=0.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.4791 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4425 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4425 if x4-x2>=0.0\n",
      "   -0.0889 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3170 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.4753 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1089 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.0918 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.5321 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0794 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1760 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.1213 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +0.3337 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.4711 if x2<=0.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0\n",
      "   +0.0550 if x1>=1.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.1515 if c>=1.0 & x1>=1.0\n",
      "   +0.6092 if c>=1.0 & x1>=3.0\n",
      "   -0.2914 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0318 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1907 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1600 if x1<=2.0 & x2<=0.0\n",
      "   -0.5779 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.0521 if x2>=1.0\n",
      "   +0.6271 if x1>=3.0\n",
      "   -0.1784 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.0999 if x1<=1.0 & x1>=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1<=0.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   -0.1671 if x1<=2.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.0851 if x4-x2<=0.0\n",
      "   +0.2379 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.4445 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "init state [ 1  3  2 -3  0]\n",
      "(11,) (11,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(18,) (7,)\n",
      "init state [0 1 3 1 0]\n",
      "(24,) (6,)\n",
      "init state [ 2  3 -1 -2  0]\n",
      "(67,) (43,)\n",
      "init state [ 0  2  1 -2  0]\n",
      "(80,) (13,)\n",
      "init state [ 2  1  0 -1  0]\n",
      "(88,) (8,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(98,) (10,)\n",
      "init state [ 3  0 -1  3  0]\n",
      "(111,) (13,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(121,) (10,)\n",
      "init state [ 1  1  1 -1  0]\n",
      "(127,) (6,)\n",
      "============ 119 ===========\n",
      "Run episode 119 with rewards 36, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.3550 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.7347 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3103 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.4981 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.1259 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.3611 if x1>=3.0 & x4-x2>=1.0\n",
      "   +1.0200 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.0769 if x1>=3.0 & x2>=1.0\n",
      "   -0.0943 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3504 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0112 if x4-x2<=1.0\n",
      "   -0.0000 if x3-x1<=-3.0\n",
      "   +0.3028 if x1>=3.0 & x2<=0.0 & x4-x2>=1.0\n",
      "   +0.1856 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.0000 if x1<=0.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.3196 if x3-x1>=3.0\n",
      "----------------- 1 --------------\n",
      "   -0.7160 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6784 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3491 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0378 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4215 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.4363 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.5145 if x3-x1>=-1.0\n",
      "   +0.2101 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.7655 if x3-x1>=1.0\n",
      "   +0.1652 if x2<=2.0 & x3-x1<=2.0\n",
      "   -0.1257 if x1>=2.0\n",
      "   +0.1648 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0039 if x3-x1>=2.0 & x4-x2>=0.0\n",
      "   +0.1425 if x3-x1>=2.0\n",
      "   +0.1165 if c<=0.0 & x1<=0.0 & x2<=0.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   -0.4144 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.6317 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4536 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.6674 if x4-x2>=0.0\n",
      "   -0.4996 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3285 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.8331 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1538 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.0854 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1746 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.2119 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2243 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.0406 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +0.2588 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.2726 if x2<=0.0\n",
      "   -0.0090 if x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.2709 if x2>=1.0 & x3-x1>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.7129 if c>=1.0 & x1>=1.0\n",
      "   +0.7494 if c>=1.0 & x1>=3.0\n",
      "   -0.4329 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0261 if x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0932 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0825 if x1<=2.0 & x2<=0.0\n",
      "   -0.2897 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.1471 if x2>=1.0\n",
      "   +0.1092 if x1>=3.0\n",
      "   +0.0969 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.1247 if x1<=1.0 & x1>=1.0 & x4-x2>=1.0\n",
      "   +0.1361 if x1<=2.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   -0.2054 if x4-x2<=0.0\n",
      "   +0.5099 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.3930 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.6071 if x1<=2.0 & x4-x2<=2.0\n",
      "init state [ 0  1  2 -1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10,) (10,)\n",
      "init state [0 0 0 1 0]\n",
      "(27,) (17,)\n",
      "init state [2 0 1 0 0]\n",
      "(39,) (12,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(46,) (7,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(59,) (13,)\n",
      "init state [ 3  2  0 -2  0]\n",
      "(65,) (6,)\n",
      "init state [ 0  3  1 -2  0]\n",
      "(79,) (14,)\n",
      "init state [ 1  0 -1  2  0]\n",
      "(94,) (15,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(111,) (17,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(124,) (13,)\n",
      "============ 120 ===========\n",
      "Run episode 120 with rewards 29, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.3382 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.3915 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0745 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.3128 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.3912 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.1264 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.8965 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.1740 if x1>=3.0 & x2>=1.0\n",
      "   -0.1690 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0556 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.5472 if x4-x2<=1.0\n",
      "   -0.0145 if x1>=3.0 & x2<=0.0 & x4-x2>=1.0\n",
      "   -0.1088 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.1215 if x1<=0.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   -0.1587 if x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   -0.5926 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4374 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3867 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3475 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6049 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.3338 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.1336 if x3-x1>=-1.0\n",
      "   +0.3441 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.3757 if x3-x1>=1.0\n",
      "   +0.1248 if x2<=2.0 & x3-x1<=2.0\n",
      "   -0.1826 if x1>=2.0\n",
      "   +0.4195 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0788 if x3-x1>=2.0\n",
      "   +0.1337 if c<=0.0 & x1<=0.0 & x2<=0.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.4222 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.2205 if x2>=3.0 & x3-x1>=2.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.6228 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.7380 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.5825 if x4-x2>=0.0\n",
      "   -0.4227 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2486 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.5065 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.1598 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.5738 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.4967 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.4651 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2436 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.2301 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +0.4565 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.1202 if x2<=0.0\n",
      "   +0.1736 if x2>=1.0 & x3-x1>=0.0\n",
      "   +0.0055 if x2<=2.0 & x3-x1<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4179 if c>=1.0 & x1>=1.0\n",
      "   +0.4592 if c>=1.0 & x1>=3.0\n",
      "   -0.3142 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0816 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0870 if x1<=2.0 & x2<=0.0\n",
      "   +0.0365 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.0092 if x2>=1.0\n",
      "   +0.2605 if x1>=3.0\n",
      "   +0.0786 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.2996 if x1<=1.0 & x1>=1.0 & x4-x2>=1.0\n",
      "   +0.1319 if x1<=2.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.1384 if x4-x2<=0.0\n",
      "   +0.4433 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.1205 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1178 if x1<=2.0 & x4-x2<=2.0\n",
      "   -0.5780 if x1<=2.0 & x2>=1.0 & x4-x2>=-2.0\n",
      "init state [ 1  0 -1  0  0]\n",
      "(15,) (15,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(39,) (24,)\n",
      "init state [0 2 2 0 0]\n",
      "(47,) (8,)\n",
      "init state [3 1 0 1 0]\n",
      "(49,) (2,)\n",
      "init state [ 0  2  3 -1  0]\n",
      "(57,) (8,)\n",
      "init state [ 1  3  1 -1  0]\n",
      "(63,) (6,)\n",
      "init state [ 2  2 -1 -1  0]\n",
      "(73,) (10,)\n",
      "init state [ 2  1 -1  0  0]\n",
      "(85,) (12,)\n",
      "init state [ 0  2  1 -2  0]\n",
      "(98,) (13,)\n",
      "init state [ 3  0 -2  2  0]\n",
      "(109,) (11,)\n",
      "============ 121 ===========\n",
      "Run episode 121 with rewards 31, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.2293 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5694 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3866 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.2422 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.1299 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.0094 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.6418 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.0782 if x1>=3.0 & x2>=1.0\n",
      "   +0.0653 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1629 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.1186 if x4-x2<=1.0\n",
      "   +0.1241 if x1>=3.0 & x2<=0.0 & x4-x2>=1.0\n",
      "   -0.0782 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.0000 if x1<=0.0 & x3-x1>=1.0 & x4-x2>=2.0\n",
      "   -0.1310 if x4-x2>=3.0\n",
      "   -0.5386 if c<=0.0 & x3-x1>=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.2128 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.7344 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.4519 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2315 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.6122 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2097 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.1605 if x3-x1>=-1.0\n",
      "   +0.0000 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.4174 if x3-x1>=1.0\n",
      "   +0.5305 if x2<=2.0 & x3-x1<=2.0\n",
      "   -0.4413 if x1>=2.0\n",
      "   +0.2499 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x2<=0.0 & x3-x1>=1.0 & x4-x2<=0.0\n",
      "   +0.1449 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.4291 if x2>=3.0 & x3-x1>=2.0 & x4-x2>=-2.0\n",
      "   -0.7352 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.5947 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.7190 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.7110 if x4-x2>=0.0\n",
      "   -0.6120 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1432 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.3866 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0407 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.3734 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.2680 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.4679 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2793 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.2193 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.1130 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.1365 if x2<=0.0\n",
      "   +0.0315 if x2>=1.0 & x3-x1>=0.0\n",
      "   -0.2774 if \n",
      "----------------- 3 --------------\n",
      "   +0.2396 if c>=1.0 & x1>=1.0\n",
      "   +0.3710 if c>=1.0 & x1>=3.0\n",
      "   -0.1642 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1446 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2018 if x1<=2.0 & x2<=0.0\n",
      "   -0.1306 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.3168 if x1>=3.0\n",
      "   +0.2757 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0730 if x1<=1.0 & x1>=1.0 & x4-x2>=1.0\n",
      "   -0.0520 if x1<=2.0 & x2>=1.0 & x3-x1<=0.0\n",
      "   +0.0646 if x4-x2<=0.0\n",
      "   +0.2868 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0554 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.1941 if x1<=2.0 & x4-x2<=2.0\n",
      "   -0.3453 if x1<=2.0 & x2>=1.0 & x4-x2>=-2.0\n",
      "   +0.4286 if x2<=2.0 & x3-x1>=3.0\n",
      "init state [ 0  3  0 -2  0]\n",
      "(23,) (23,)\n",
      "init state [0 0 1 2 0]\n",
      "(31,) (8,)\n",
      "init state [ 3  1 -3  2  0]\n",
      "(44,) (13,)\n",
      "init state [0 1 0 1 0]\n",
      "(49,) (5,)\n",
      "init state [ 2  3 -2 -1  0]\n",
      "(58,) (9,)\n",
      "init state [1 1 0 2 0]\n",
      "(86,) (28,)\n",
      "init state [ 2  2  0 -1  0]\n",
      "(95,) (9,)\n",
      "init state [ 0  2  3 -1  0]\n",
      "(106,) (11,)\n",
      "init state [ 0  1  2 -1  0]\n",
      "(115,) (9,)\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(142,) (27,)\n",
      "============ 122 ===========\n",
      "Run episode 122 with rewards 15, accuracy 0.6\n",
      "----------------- 0 --------------\n",
      "   -0.4187 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.6098 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4218 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.4111 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.5943 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.1997 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.5062 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.0809 if x1>=3.0 & x2>=1.0\n",
      "   -0.3484 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2199 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0462 if x4-x2<=1.0\n",
      "   +0.0000 if x1>=3.0 & x2<=0.0 & x4-x2>=1.0\n",
      "   +0.1087 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   -0.2648 if c<=0.0 & x3-x1>=1.0\n",
      "   -0.3766 if x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.4190 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4126 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.7671 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.0090 if c>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4493 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0491 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.1813 if x3-x1>=-1.0\n",
      "   -0.2962 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.4107 if x3-x1>=1.0\n",
      "   +0.0863 if x2<=2.0 & x3-x1<=2.0\n",
      "   -0.4366 if x1>=2.0\n",
      "   +0.2801 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0693 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.2502 if x2>=3.0 & x3-x1>=2.0 & x4-x2>=-2.0\n",
      "   -0.1992 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.1552 if x2<=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.5691 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3689 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3689 if x4-x2>=0.0\n",
      "   -0.3686 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3228 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.5295 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0448 if x1>=2.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0664 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1996 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.3678 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0584 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.0691 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.1232 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.0923 if x2<=0.0\n",
      "   -0.2812 if \n",
      "   -0.1260 if c>=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.6730 if c>=1.0 & x1>=1.0\n",
      "   +0.5687 if c>=1.0 & x1>=3.0\n",
      "   +0.3479 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1314 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3899 if x1<=2.0 & x2<=0.0\n",
      "   -0.8892 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.3704 if x1>=3.0\n",
      "   +0.2745 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0090 if x1<=1.0 & x1>=1.0 & x4-x2>=1.0\n",
      "   -0.0937 if x4-x2<=0.0\n",
      "   +0.5293 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1705 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   +0.1811 if x1<=2.0 & x4-x2<=2.0\n",
      "   -0.2236 if x1<=2.0 & x2>=1.0 & x4-x2>=-2.0\n",
      "   +0.3327 if x2<=2.0 & x3-x1>=3.0\n",
      "   +0.2844 if x3-x1>=1.0 & x4-x2>=2.0\n",
      "init state [ 0  1  2 -1  0]\n",
      "(7,) (7,)\n",
      "init state [ 1  1 -1  0  0]\n",
      "(19,) (12,)\n",
      "init state [2 1 1 0 0]\n",
      "(24,) (5,)\n",
      "init state [ 2  3  1 -3  0]\n",
      "(45,) (21,)\n",
      "init state [ 2  1 -2  0  0]\n",
      "(57,) (12,)\n",
      "init state [ 3  0 -1  2  0]\n",
      "(62,) (5,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(84,) (22,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(95,) (11,)\n",
      "init state [ 1  1  1 -1  0]\n",
      "(107,) (12,)\n",
      "init state [ 0  1  3 -1  0]\n",
      "(125,) (18,)\n",
      "============ 123 ===========\n",
      "Run episode 123 with rewards 24, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.6240 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.8991 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3539 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.2623 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0561 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.0286 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.5687 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.3167 if x1>=3.0 & x2>=1.0\n",
      "   +0.0279 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2020 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0401 if x4-x2<=1.0\n",
      "   +0.1268 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   -0.2281 if c<=0.0 & x3-x1>=1.0\n",
      "   -0.3425 if x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.7508 if c<=0.0 & x3-x1>=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.6400 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.6614 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3504 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5183 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.3642 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.2223 if x3-x1>=-1.0\n",
      "   -0.0896 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.3899 if x3-x1>=1.0\n",
      "   -0.1264 if x2<=2.0 & x3-x1<=2.0\n",
      "   +0.2313 if x1>=2.0\n",
      "   +0.2905 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.2523 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1>=2.0 & x4-x2>=-2.0\n",
      "   +0.0200 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.0783 if x2<=2.0\n",
      "   -0.5726 if x1>=3.0\n",
      "----------------- 2 --------------\n",
      "   +0.8600 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3490 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3490 if x4-x2>=0.0\n",
      "   -0.2987 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2738 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.8310 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0954 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1110 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.3214 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0836 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.0278 if x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.1789 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.2016 if x2<=0.0\n",
      "   -0.2032 if \n",
      "   -0.2540 if c>=1.0\n",
      "   -0.0548 if x1<=2.0 & x3-x1<=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.5445 if c>=1.0 & x1>=1.0\n",
      "   +0.6159 if c>=1.0 & x1>=3.0\n",
      "   +0.0310 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0429 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1051 if x1<=2.0 & x2<=0.0\n",
      "   -0.4362 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.3602 if x1>=3.0\n",
      "   +0.2162 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.0441 if x4-x2<=0.0\n",
      "   +0.2658 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2>=1.0\n",
      "   -0.0653 if x1<=2.0 & x4-x2<=2.0\n",
      "   +0.0704 if x1<=2.0 & x2>=1.0 & x4-x2>=-2.0\n",
      "   -0.0136 if x2<=2.0 & x3-x1>=3.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.2770 if x4-x2>=2.0\n",
      "init state [ 2  2  1 -1  0]\n",
      "(17,) (17,)\n",
      "init state [0 0 3 1 0]\n",
      "(26,) (9,)\n",
      "init state [ 3  0 -3  3  0]\n",
      "(41,) (15,)\n",
      "init state [2 1 1 0 0]\n",
      "(44,) (3,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(54,) (10,)\n",
      "init state [ 2  2 -2  0  0]\n",
      "(68,) (14,)\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(91,) (23,)\n",
      "init state [0 0 0 3 0]\n",
      "(117,) (26,)\n",
      "init state [1 2 1 0 0]\n",
      "(120,) (3,)\n",
      "init state [ 3  1 -1 -1  0]\n",
      "(136,) (16,)\n",
      "============ 124 ===========\n",
      "Run episode 124 with rewards 26, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.7797 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.3407 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5262 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   +0.0837 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.1115 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.0933 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.2700 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.0646 if x1>=3.0 & x2>=1.0\n",
      "   -0.3144 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0430 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.1942 if x4-x2<=1.0\n",
      "   +0.1457 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.0287 if c<=0.0 & x3-x1>=1.0\n",
      "   -0.0583 if x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.3422 if c<=0.0 & x3-x1>=0.0\n",
      "   +0.5984 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.1331 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.0967 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.1921 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.7295 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.4438 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.5011 if x3-x1>=-1.0\n",
      "   -0.1401 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.2854 if x3-x1>=1.0\n",
      "   -0.4701 if x2<=2.0 & x3-x1<=2.0\n",
      "   +0.4849 if x1>=2.0\n",
      "   +0.4157 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.1300 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.0258 if x1>=2.0 & x2<=1.0 & x3-x1>=-2.0 & x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3152 if x2<=2.0\n",
      "   -0.0422 if x1>=3.0\n",
      "   +0.3176 if x2>=2.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.2502 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.0917 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3865 if x4-x2>=0.0\n",
      "   -0.6184 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1179 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.3296 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.1877 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.0349 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0219 if x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0736 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.2650 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.6103 if x2<=0.0\n",
      "   -0.0683 if \n",
      "   -0.3087 if c>=1.0\n",
      "   +0.3668 if x1<=2.0 & x3-x1<=2.0\n",
      "   +0.3795 if x3-x1>=2.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.5636 if c>=1.0 & x1>=1.0\n",
      "   +0.5079 if c>=1.0 & x1>=3.0\n",
      "   +0.3258 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1844 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2385 if x1<=2.0 & x2<=0.0\n",
      "   -0.2561 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.3737 if x1>=3.0\n",
      "   +0.5443 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0205 if x4-x2<=0.0\n",
      "   +0.3608 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.2209 if x1<=2.0 & x4-x2<=2.0\n",
      "   -0.0077 if x1<=2.0 & x2>=1.0 & x4-x2>=-2.0\n",
      "   -0.3082 if x2<=2.0 & x3-x1>=3.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.2279 if x4-x2>=2.0\n",
      "   -0.5301 if c<=0.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "init state [ 1  1  0 -1  0]\n",
      "(16,) (16,)\n",
      "init state [ 2  0 -1  1  0]\n",
      "(28,) (12,)\n",
      "init state [ 1  3 -1 -3  0]\n",
      "(38,) (10,)\n",
      "init state [ 1  1  1 -1  0]\n",
      "(59,) (21,)\n",
      "init state [ 1  1 -1  0  0]\n",
      "(101,) (42,)\n",
      "init state [2 0 1 1 0]\n",
      "(108,) (7,)\n",
      "init state [ 3  2 -2 -2  0]\n",
      "(132,) (24,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(146,) (14,)\n",
      "init state [ 1  0 -1  2  0]\n",
      "(189,) (43,)\n",
      "init state [1 1 0 1 0]\n",
      "(193,) (4,)\n",
      "============ 125 ===========\n",
      "Run episode 125 with rewards 38, accuracy 0.5\n",
      "----------------- 0 --------------\n",
      "   -0.4393 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.6963 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0986 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.0637 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2649 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.1551 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.7783 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.0942 if x1>=3.0 & x2>=1.0\n",
      "   -0.1140 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2706 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0034 if x4-x2<=1.0\n",
      "   +0.0815 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.1628 if x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.2742 if c<=0.0 & x3-x1>=0.0\n",
      "   +0.4362 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   -0.4286 if x3-x1>=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   -0.0172 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3232 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2113 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4891 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1176 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3146 if x3-x1>=-1.0\n",
      "   +0.0311 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.0636 if x3-x1>=1.0\n",
      "   -0.1397 if x2<=2.0 & x3-x1<=2.0\n",
      "   +0.2517 if x1>=2.0\n",
      "   -0.3847 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.2346 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.1397 if x2<=2.0\n",
      "   +0.0784 if x1>=3.0\n",
      "   +0.0000 if x2>=2.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   -0.6406 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.4964 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.7639 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.7639 if x4-x2>=0.0\n",
      "   -0.7754 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1016 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.4751 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.3248 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.2914 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.3620 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.2578 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.1208 if x2<=0.0\n",
      "   +0.1174 if \n",
      "   -0.4484 if c>=1.0\n",
      "   -0.0026 if x1<=2.0 & x3-x1<=2.0\n",
      "   +0.2788 if x3-x1>=2.0 & x4-x2<=-1.0\n",
      "   -0.1346 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.7416 if c>=1.0 & x1>=1.0\n",
      "   +0.4929 if c>=1.0 & x1>=3.0\n",
      "   -0.6000 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0329 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0487 if x1<=2.0 & x2<=0.0\n",
      "   +0.2071 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.0083 if x1>=3.0\n",
      "   -0.0059 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.0968 if x4-x2<=0.0\n",
      "   +0.5860 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0180 if x1<=2.0 & x4-x2<=2.0\n",
      "   +0.0618 if x1<=2.0 & x2>=1.0 & x4-x2>=-2.0\n",
      "   -0.0000 if x2<=2.0 & x3-x1>=3.0\n",
      "   +0.0218 if x4-x2>=2.0\n",
      "   -0.2297 if c<=0.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.1613 if x1<=0.0 & x4-x2>=1.0\n",
      "init state [ 3  1 -2  1  0]\n",
      "(10,) (10,)\n",
      "init state [ 0  2  0 -1  0]\n",
      "(21,) (11,)\n",
      "init state [0 2 1 1 0]\n",
      "(46,) (25,)\n",
      "init state [ 1  3  0 -3  0]\n",
      "(57,) (11,)\n",
      "init state [ 0  3  3 -1  0]\n",
      "(63,) (6,)\n",
      "init state [ 3  0 -2  3  0]\n",
      "(73,) (10,)\n",
      "init state [0 1 2 0 0]\n",
      "(82,) (9,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(101,) (19,)\n",
      "init state [0 0 1 0 0]\n",
      "(111,) (10,)\n",
      "init state [ 3  1 -3  2  0]\n",
      "(132,) (21,)\n",
      "============ 126 ===========\n",
      "Run episode 126 with rewards 21, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.4635 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5676 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.5207 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.0841 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2034 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.3408 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.8065 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.1606 if x1>=3.0 & x2>=1.0\n",
      "   +0.1361 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.1811 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.1606 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.0035 if x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.7588 if c<=0.0 & x3-x1>=0.0\n",
      "   +0.0000 if c<=0.0 & x2<=0.0 & x3-x1<=-1.0 & x4-x2<=2.0\n",
      "   -0.2985 if x3-x1>=-1.0\n",
      "   +0.5905 if c<=0.0 & x2<=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.4408 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4138 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3049 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.9368 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.0562 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3458 if x3-x1>=-1.0\n",
      "   -0.1541 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.0932 if x3-x1>=1.0\n",
      "   -0.1472 if x2<=2.0 & x3-x1<=2.0\n",
      "   -0.1758 if x1>=2.0\n",
      "   -0.4906 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0803 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.1472 if x2<=2.0\n",
      "   -0.0543 if x1>=3.0\n",
      "   -0.1263 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.6539 if x2>=3.0 & x3-x1>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.7801 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5609 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.5098 if x4-x2>=0.0\n",
      "   -0.6657 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2218 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.7029 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   +0.3755 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1825 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.0940 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.0280 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.0098 if x2<=0.0\n",
      "   -0.0776 if \n",
      "   -0.3508 if c>=1.0\n",
      "   -0.3467 if x3-x1>=2.0 & x4-x2<=-1.0\n",
      "   -0.2255 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.5683 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.3516 if c>=1.0 & x1>=1.0\n",
      "   +0.2747 if c>=1.0 & x1>=3.0\n",
      "   -0.3505 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.6079 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.1872 if x1<=2.0 & x2<=0.0\n",
      "   -0.0890 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.0376 if x1>=3.0\n",
      "   +0.1539 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.1032 if x4-x2<=0.0\n",
      "   +0.4701 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.1354 if x1<=2.0 & x4-x2<=2.0\n",
      "   +0.0755 if x1<=2.0 & x2>=1.0 & x4-x2>=-2.0\n",
      "   -0.0472 if x4-x2>=2.0\n",
      "   -0.2233 if c<=0.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   +0.3834 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.4793 if x1<=2.0 & x3-x1<=-2.0 & x4-x2>=0.0\n",
      "init state [2 0 1 1 0]\n",
      "(10,) (10,)\n",
      "init state [ 2  0 -2  1  0]\n",
      "(22,) (12,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(40,) (18,)\n",
      "init state [ 1  3 -1  0  0]\n",
      "(44,) (4,)\n",
      "init state [ 3  2 -1  1  0]\n",
      "(49,) (5,)\n",
      "init state [ 2  2 -1 -1  0]\n",
      "(55,) (6,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(66,) (11,)\n",
      "init state [1 2 0 1 0]\n",
      "(69,) (3,)\n",
      "init state [0 0 1 2 0]\n",
      "(81,) (12,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(92,) (11,)\n",
      "============ 127 ===========\n",
      "Run episode 127 with rewards 31, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.3280 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.8426 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0103 if x1>=1.0 & x2<=2.0 & x3-x1>=-1.0\n",
      "   -0.1628 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.6410 if x1<=2.0 & x4-x2>=1.0\n",
      "   -0.2619 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.8186 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.0895 if x1>=3.0 & x2>=1.0\n",
      "   -0.1007 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.2997 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.1914 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.2166 if x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.6896 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.0264 if x3-x1>=-1.0\n",
      "   +0.2379 if c<=0.0 & x2<=0.0\n",
      "   -0.4781 if x1<=1.0 & x1<=2.0 & x2<=0.0 & x4-x2<=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.2573 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5174 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.7830 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.8193 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.1716 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.0579 if x3-x1>=-1.0\n",
      "   +0.3338 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.0944 if x3-x1>=1.0\n",
      "   -0.3016 if x2<=2.0 & x3-x1<=2.0\n",
      "   -0.0474 if x1>=2.0\n",
      "   -0.4968 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.1241 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.1848 if x2<=2.0\n",
      "   -0.3139 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.0000 if x2>=3.0 & x3-x1>=2.0\n",
      "   +0.5527 if x3-x1>=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.3267 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.7578 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3902 if x4-x2>=0.0\n",
      "   -0.5012 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0226 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.3267 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.0740 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3029 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1761 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.5795 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.0079 if \n",
      "   -0.4445 if c>=1.0\n",
      "   -0.1973 if x3-x1>=2.0 & x4-x2<=-1.0\n",
      "   -0.1129 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x2>=3.0 & x3-x1<=1.0 & x4-x2<=-1.0\n",
      "   +0.0111 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4754 if c>=1.0 & x1>=1.0\n",
      "   +0.5961 if c>=1.0 & x1>=3.0\n",
      "   -0.2428 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.1973 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.6043 if x1<=2.0 & x2<=0.0\n",
      "   -0.4437 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.4210 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.1911 if x4-x2<=0.0\n",
      "   +0.4578 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.2230 if x1<=2.0 & x4-x2<=2.0\n",
      "   -0.0144 if x1<=2.0 & x2>=1.0 & x4-x2>=-2.0\n",
      "   -0.2137 if x4-x2>=2.0\n",
      "   -0.0432 if c<=0.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   +0.5173 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0025 if x1<=2.0 & x3-x1<=-2.0 & x4-x2>=0.0\n",
      "   +0.5622 if x1>=1.0 & x2>=2.0 & x4-x2>=1.0\n",
      "init state [0 0 2 0 0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10,) (10,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(22,) (12,)\n",
      "init state [1 0 0 1 0]\n",
      "(28,) (6,)\n",
      "init state [ 2  2  1 -1  0]\n",
      "(40,) (12,)\n",
      "init state [0 2 2 1 0]\n",
      "(50,) (10,)\n",
      "init state [ 3  2 -2 -2  0]\n",
      "(79,) (29,)\n",
      "init state [ 3  0 -1  1  0]\n",
      "(84,) (5,)\n",
      "init state [0 1 0 2 0]\n",
      "(104,) (20,)\n",
      "init state [ 1  1  1 -1  0]\n",
      "(112,) (8,)\n",
      "init state [1 1 2 0 0]\n",
      "(120,) (8,)\n",
      "============ 128 ===========\n",
      "Run episode 128 with rewards 34, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.2152 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5016 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3195 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.0918 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.1676 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.6938 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.1441 if x1>=3.0 & x2>=1.0\n",
      "   -0.3148 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1356 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.1441 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   +0.1150 if x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.2727 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.1639 if x3-x1>=-1.0\n",
      "   -0.0552 if c<=0.0 & x2<=0.0\n",
      "   -0.4456 if x1<=1.0 & x1<=2.0 & x2<=0.0 & x4-x2<=2.0\n",
      "   -0.3667 if x2>=1.0 & x3-x1>=2.0\n",
      "----------------- 1 --------------\n",
      "   -0.6251 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4229 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3910 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.6869 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.3842 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.0982 if x3-x1>=-1.0\n",
      "   +0.5838 if x2<=0.0 & x3-x1>=1.0\n",
      "   -0.2491 if x3-x1>=1.0\n",
      "   -0.0803 if x2<=2.0 & x3-x1<=2.0\n",
      "   -0.2288 if x1>=2.0\n",
      "   -0.4548 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.1213 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.0803 if x2<=2.0\n",
      "   -0.0000 if c<=0.0 & x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-1.0 & x3-x1>=-2.0 & x4-x2<=0.0 & x4-x2<=1.0\n",
      "   +0.9131 if x3-x1>=2.0\n",
      "   +0.0197 if x4-x2<=-3.0\n",
      "----------------- 2 --------------\n",
      "   +0.2256 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3291 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.6231 if x4-x2>=0.0\n",
      "   -0.2679 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0062 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.0000 if c<=0.0 & x1>=1.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2<=-1.0\n",
      "   -0.2814 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3219 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2007 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.1558 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.1654 if \n",
      "   -0.4043 if c>=1.0\n",
      "   +0.3025 if x3-x1>=2.0 & x4-x2<=-1.0\n",
      "   -0.1148 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0788 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.2808 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.4671 if c>=1.0 & x1>=1.0\n",
      "   +0.7160 if c>=1.0 & x1>=3.0\n",
      "   -0.3118 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2586 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2185 if x1<=2.0 & x2<=0.0\n",
      "   -0.3496 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.4848 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.2125 if x4-x2<=0.0\n",
      "   +0.7644 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.4020 if x1<=2.0 & x4-x2<=2.0\n",
      "   +0.0370 if x1<=2.0 & x2>=1.0 & x4-x2>=-2.0\n",
      "   +0.3248 if x4-x2>=2.0\n",
      "   +0.0608 if c<=0.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.0949 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1446 if x1>=1.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   +0.7306 if c<=0.0 & x2>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "init state [ 1  2  1 -2  0]\n",
      "(11,) (11,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(27,) (16,)\n",
      "init state [1 1 1 0 0]\n",
      "(56,) (29,)\n",
      "init state [ 2  1 -2 -1  0]\n",
      "(81,) (25,)\n",
      "init state [ 3  2 -2  0  0]\n",
      "(91,) (10,)\n",
      "init state [ 1  0 -1  0  0]\n",
      "(104,) (13,)\n",
      "init state [ 2  1 -1  1  0]\n",
      "(128,) (24,)\n",
      "init state [0 1 3 0 0]\n",
      "(142,) (14,)\n",
      "init state [ 2  1 -1  1  0]\n",
      "(153,) (11,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(164,) (11,)\n",
      "============ 129 ===========\n",
      "Run episode 129 with rewards 31, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.5796 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.6589 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5423 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.1309 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.2826 if x1>=3.0 & x4-x2>=1.0\n",
      "   -0.0650 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.0803 if x1>=3.0 & x2>=1.0\n",
      "   -0.2317 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0938 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.0803 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   +0.0257 if x4-x2<=-2.0 & x4-x2>=-2.0\n",
      "   -0.3897 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.2937 if x3-x1>=-1.0\n",
      "   +0.1894 if x1<=1.0 & x1<=2.0 & x2<=0.0 & x4-x2<=2.0\n",
      "   +0.0373 if x2>=1.0 & x3-x1>=2.0\n",
      "   -0.2831 if c>=1.0 & x1>=3.0\n",
      "----------------- 1 --------------\n",
      "   -0.6397 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.8192 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2622 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.7752 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.2265 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.1745 if x3-x1>=-1.0\n",
      "   +0.4596 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.2943 if x3-x1>=1.0\n",
      "   -0.0245 if x2<=2.0 & x3-x1<=2.0\n",
      "   -0.4019 if x1>=2.0\n",
      "   -0.6009 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0357 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.0377 if x2<=2.0\n",
      "   +0.2712 if x3-x1>=2.0\n",
      "   -0.1321 if x4-x2<=-3.0\n",
      "   +0.1937 if x3-x1>=3.0 & x4-x2<=-3.0\n",
      "----------------- 2 --------------\n",
      "   +0.3043 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.1755 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.1755 if x4-x2>=0.0\n",
      "   -0.1755 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2341 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.4537 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.2173 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   +0.0821 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.5072 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.0756 if \n",
      "   -0.3969 if c>=1.0\n",
      "   -0.0850 if x3-x1>=2.0 & x4-x2<=-1.0\n",
      "   -0.1185 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.1353 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.1380 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.3207 if x2<=2.0 & x3-x1>=3.0 & x4-x2<=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.4185 if c>=1.0 & x1>=1.0\n",
      "   +0.6896 if c>=1.0 & x1>=3.0\n",
      "   -0.0401 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1954 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.5349 if x1<=2.0 & x2<=0.0\n",
      "   -0.2128 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.3373 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.1061 if x4-x2<=0.0\n",
      "   -0.2186 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.1819 if x1<=2.0 & x4-x2<=2.0\n",
      "   +0.0000 if x4-x2>=2.0\n",
      "   +0.0636 if c<=0.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.0374 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1>=1.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   +0.4289 if c<=0.0 & x2>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.2301 if x1>=1.0 & x2>=2.0\n",
      "init state [ 0  2  0 -1  0]\n",
      "(7,) (7,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(14,) (7,)\n",
      "init state [0 0 1 0 0]\n",
      "(54,) (40,)\n",
      "init state [2 1 0 2 0]\n",
      "(59,) (5,)\n",
      "init state [ 2  0 -1  1  0]\n",
      "(80,) (21,)\n",
      "init state [ 3  1  0 -1  0]\n",
      "(84,) (4,)\n",
      "init state [0 3 2 0 0]\n",
      "(88,) (4,)\n",
      "init state [ 1  3  0 -2  0]\n",
      "(98,) (10,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(145,) (47,)\n",
      "init state [1 1 1 0 0]\n",
      "(156,) (11,)\n",
      "============ 130 ===========\n",
      "Run episode 130 with rewards 31, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.5430 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.3386 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1490 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.0886 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.1327 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.5027 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.0727 if x1>=3.0 & x2>=1.0\n",
      "   -0.1869 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.4586 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.1665 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.5377 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.5813 if x3-x1>=-1.0\n",
      "   +0.3792 if x1<=1.0 & x1<=2.0 & x2<=0.0 & x4-x2<=2.0\n",
      "   -0.0500 if x2>=1.0 & x3-x1>=2.0\n",
      "   -0.2175 if c>=1.0 & x1>=3.0\n",
      "   +0.2231 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "----------------- 1 --------------\n",
      "   -0.7285 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.8947 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.5730 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4094 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.4859 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3421 if x3-x1>=-1.0\n",
      "   +0.3546 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.6525 if x3-x1>=1.0\n",
      "   -0.3949 if x1>=2.0\n",
      "   -0.2412 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0132 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.2044 if x2<=2.0\n",
      "   +0.1537 if x3-x1>=2.0\n",
      "   +0.1011 if x4-x2<=-3.0\n",
      "   +0.0000 if x3-x1>=3.0 & x4-x2<=-3.0\n",
      "   +0.1196 if x3-x1>=1.0 & x4-x2<=-1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.7938 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.6408 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.6408 if x4-x2>=0.0\n",
      "   -0.0212 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.5900 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.2833 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.0279 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.3908 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.1828 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.1817 if c>=1.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2<=-1.0\n",
      "   -0.3447 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.3596 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.2568 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x2<=2.0 & x3-x1>=3.0 & x4-x2<=-2.0\n",
      "   +0.3027 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.5778 if c>=1.0 & x1>=1.0\n",
      "   +0.6946 if c>=1.0 & x1>=3.0\n",
      "   -0.4325 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2093 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2446 if x1<=2.0 & x2<=0.0\n",
      "   -0.3201 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.2313 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.1569 if x4-x2<=0.0\n",
      "   +0.2819 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.2527 if x1<=2.0 & x4-x2<=2.0\n",
      "   +0.9055 if x4-x2>=2.0\n",
      "   -0.0273 if c<=0.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   +0.0100 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.2868 if c<=0.0 & x2>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.0845 if x1>=1.0 & x2>=2.0\n",
      "   -0.3771 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "init state [2 1 0 1 0]\n",
      "(7,) (7,)\n",
      "init state [ 0  3  0 -3  0]\n",
      "(24,) (17,)\n",
      "init state [ 2  2 -1 -1  0]\n",
      "(39,) (15,)\n",
      "init state [ 3  0 -1  1  0]\n",
      "(46,) (7,)\n",
      "init state [ 0  2  3 -2  0]\n",
      "(77,) (31,)\n",
      "init state [0 0 1 0 0]\n",
      "(85,) (8,)\n",
      "init state [0 0 1 2 0]\n",
      "(93,) (8,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(112,) (19,)\n",
      "init state [ 2  3  1 -3  0]\n",
      "(119,) (7,)\n",
      "init state [2 1 1 0 0]\n",
      "(122,) (3,)\n",
      "============ 131 ===========\n",
      "Run episode 131 with rewards 39, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.4214 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5095 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3511 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0077 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.2606 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.5095 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.3108 if x1>=3.0 & x2>=1.0\n",
      "   -0.0667 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0582 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.1473 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.7036 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.4609 if x3-x1>=-1.0\n",
      "   +0.1209 if x1<=1.0 & x1<=2.0 & x2<=0.0 & x4-x2<=2.0\n",
      "   -0.2199 if c>=1.0 & x1>=3.0\n",
      "   +0.0000 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.0065 if x3-x1<=-3.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.5064 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.7244 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3133 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.2826 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.3299 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.0978 if x3-x1>=-1.0\n",
      "   +0.0822 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.5897 if x3-x1>=1.0\n",
      "   -0.1709 if x1>=2.0\n",
      "   +0.2264 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0200 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.0277 if x2<=2.0\n",
      "   -0.0113 if x3-x1>=2.0\n",
      "   -0.0737 if x4-x2<=-3.0\n",
      "   +0.2811 if x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.0161 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.4307 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.2332 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.2332 if x4-x2>=0.0\n",
      "   -0.5721 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4228 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.2796 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1295 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2978 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.0771 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.1834 if c>=1.0\n",
      "   -0.0937 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.6160 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.0214 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0056 if x2<=2.0 & x3-x1>=3.0 & x4-x2<=-2.0\n",
      "   -0.3050 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1996 if x1>=2.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4579 if c>=1.0 & x1>=1.0\n",
      "   +0.4763 if c>=1.0 & x1>=3.0\n",
      "   -0.0806 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1730 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.3304 if x1<=2.0 & x2<=0.0\n",
      "   -0.0634 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.4467 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0284 if x4-x2<=0.0\n",
      "   +0.4966 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0781 if x1<=2.0 & x4-x2<=2.0\n",
      "   +0.0844 if x4-x2>=2.0\n",
      "   -0.0436 if c<=0.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   -0.1327 if c<=0.0 & x2>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   +0.0792 if x1>=1.0 & x2>=2.0\n",
      "   +0.1810 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.2255 if x1<=0.0 & x4-x2>=1.0\n",
      "init state [ 2  3 -1 -2  0]\n",
      "(15,) (15,)\n",
      "init state [ 1  0 -1  2  0]\n",
      "(32,) (17,)\n",
      "init state [0 0 1 1 0]\n",
      "(41,) (9,)\n",
      "init state [0 1 2 1 0]\n",
      "(51,) (10,)\n",
      "init state [ 2  3 -2 -1  0]\n",
      "(75,) (24,)\n",
      "init state [ 3  1 -1  0  0]\n",
      "(114,) (39,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(124,) (10,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(142,) (18,)\n",
      "init state [0 0 0 3 0]\n",
      "(163,) (21,)\n",
      "init state [ 3  1 -2  1  0]\n",
      "(169,) (6,)\n",
      "============ 132 ===========\n",
      "Run episode 132 with rewards 36, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.7148 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.7675 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2694 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0498 if x1<=2.0 & x4-x2>=1.0\n",
      "   +0.1673 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.7813 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.0693 if x1>=3.0 & x2>=1.0\n",
      "   +0.0898 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.1663 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.1588 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.5665 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.1671 if x3-x1>=-1.0\n",
      "   -0.0854 if x1<=1.0 & x1<=2.0 & x2<=0.0 & x4-x2<=2.0\n",
      "   -0.2122 if c>=1.0 & x1>=3.0\n",
      "   +0.0752 if x3-x1<=-3.0 & x4-x2>=1.0\n",
      "   -0.1957 if x1<=1.0 & x3-x1<=-1.0 & x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   -0.8387 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4391 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.4809 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3026 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.3992 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.0190 if x3-x1>=-1.0\n",
      "   -0.2196 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.3773 if x3-x1>=1.0\n",
      "   -0.1742 if x1>=2.0\n",
      "   +0.0211 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.2882 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.0219 if x2<=2.0\n",
      "   +0.2504 if x4-x2<=-3.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.3936 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1570 if x1<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.4830 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4318 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4671 if x4-x2>=0.0\n",
      "   -0.3538 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.0166 if x2>=1.0 & x3-x1<=-1.0 & x4-x2<=1.0\n",
      "   +0.2837 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.2058 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.1983 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.1632 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.2571 if c>=1.0\n",
      "   +0.0461 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.3927 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.0571 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0277 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.0358 if x1>=2.0 & x4-x2>=1.0\n",
      "   +0.3289 if x2>=2.0 & x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.7553 if c>=1.0 & x1>=1.0\n",
      "   +0.4503 if c>=1.0 & x1>=3.0\n",
      "   +0.2506 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1431 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3222 if x1<=2.0 & x2<=0.0\n",
      "   -0.2768 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.0701 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.6396 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0608 if x1<=2.0 & x4-x2<=2.0\n",
      "   -0.0970 if x4-x2>=2.0\n",
      "   -0.0466 if c<=0.0 & x2<=2.0 & x2>=2.0 & x3-x1>=0.0\n",
      "   +0.2543 if c<=0.0 & x2>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.1879 if x1>=1.0 & x2>=2.0\n",
      "   +0.1300 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1194 if x1<=0.0 & x4-x2>=1.0\n",
      "   -0.1299 if c<=0.0 & x1<=0.0 & x2<=0.0 & x3-x1<=0.0\n",
      "init state [ 0  3  2 -2  0]\n",
      "(21,) (21,)\n",
      "init state [ 2  3 -1 -2  0]\n",
      "(33,) (12,)\n",
      "init state [ 2  3  0 -1  0]\n",
      "(38,) (5,)\n",
      "init state [ 3  0 -1  1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(60,) (22,)\n",
      "init state [0 0 0 2 0]\n",
      "(66,) (6,)\n",
      "init state [ 1  2 -1 -1  0]\n",
      "(75,) (9,)\n",
      "init state [ 1  3  1 -2  0]\n",
      "(106,) (31,)\n",
      "init state [ 2  3 -2 -1  0]\n",
      "(117,) (11,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(125,) (8,)\n",
      "init state [1 1 1 2 0]\n",
      "(140,) (15,)\n",
      "============ 133 ===========\n",
      "Run episode 133 with rewards 27, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.6299 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5276 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.3610 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.5304 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.3604 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.3256 if x1>=3.0 & x2>=1.0\n",
      "   +0.2276 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.0350 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.3724 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.3508 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.1842 if x3-x1>=-1.0\n",
      "   -0.0242 if x1<=1.0 & x1<=2.0 & x2<=0.0 & x4-x2<=2.0\n",
      "   +0.0844 if c>=1.0 & x1>=3.0\n",
      "   +0.0000 if x3-x1<=-3.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1<=1.0 & x3-x1<=-1.0 & x4-x2>=3.0\n",
      "   -0.6193 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.4082 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5899 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.6379 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4923 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.3331 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.0819 if x3-x1>=-1.0\n",
      "   -0.0638 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.1814 if x3-x1>=1.0\n",
      "   +0.2016 if x1>=2.0\n",
      "   -0.0135 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.3646 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.1055 if x2<=2.0\n",
      "   +0.0000 if x4-x2<=-3.0\n",
      "   -0.3705 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.2412 if x1<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.4327 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.4006 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3595 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4172 if x4-x2>=0.0\n",
      "   -0.3960 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.4840 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.3025 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2556 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.1116 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.5050 if c>=1.0\n",
      "   -0.1259 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.2132 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.2459 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.0491 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.0641 if x1>=2.0 & x4-x2>=1.0\n",
      "   +0.0282 if x2>=2.0 & x4-x2>=1.0\n",
      "   +0.8545 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4715 if c>=1.0 & x1>=1.0\n",
      "   +0.3592 if c>=1.0 & x1>=3.0\n",
      "   -0.0294 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1305 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3692 if x1<=2.0 & x2<=0.0\n",
      "   -0.1851 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.2219 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.3388 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0108 if x1<=2.0 & x4-x2<=2.0\n",
      "   -0.1536 if x4-x2>=2.0\n",
      "   -0.0717 if c<=0.0 & x2>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.3576 if x1>=1.0 & x2>=2.0\n",
      "   +0.3685 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1739 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.1648 if c<=0.0 & x1<=0.0 & x2<=0.0 & x3-x1<=0.0\n",
      "   -0.4305 if c<=0.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "init state [1 0 2 2 0]\n",
      "(5,) (5,)\n",
      "init state [0 0 2 2 0]\n",
      "(13,) (8,)\n",
      "init state [ 3  2 -1  1  0]\n",
      "(17,) (4,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(48,) (31,)\n",
      "init state [0 1 0 2 0]\n",
      "(60,) (12,)\n",
      "init state [ 1  1 -1  0  0]\n",
      "(75,) (15,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(87,) (12,)\n",
      "init state [ 3  1 -3  2  0]\n",
      "(106,) (19,)\n",
      "init state [ 3  2 -3 -2  0]\n",
      "(131,) (25,)\n",
      "init state [0 0 1 0 0]\n",
      "(151,) (20,)\n",
      "============ 134 ===========\n",
      "Run episode 134 with rewards 22, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.4685 if c>=1.0 & x3-x1<=1.0\n",
      "   +1.1297 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1329 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2198 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.1275 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.3130 if x1>=3.0 & x2>=1.0\n",
      "   -0.0262 if c<=0.0 & x1<=1.0 & x2<=2.0 & x2>=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +0.3916 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.3130 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.5123 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.5282 if x3-x1>=-1.0\n",
      "   +0.0985 if x1<=1.0 & x1<=2.0 & x2<=0.0 & x4-x2<=2.0\n",
      "   -0.2051 if c>=1.0 & x1>=3.0\n",
      "   +0.1128 if x1<=1.0 & x3-x1<=-1.0 & x4-x2>=3.0\n",
      "   -0.5516 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.5566 if x3-x1<=-1.0 & x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.0305 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.7180 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.7642 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4791 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.6357 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3521 if x3-x1>=-1.0\n",
      "   +0.2542 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.3337 if x3-x1>=1.0\n",
      "   -0.0857 if x1>=2.0\n",
      "   -0.0504 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.1956 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   -0.3020 if x2<=2.0\n",
      "   -0.6787 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.0029 if x1<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2879 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.2396 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "----------------- 2 --------------\n",
      "   +0.4968 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4385 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.5903 if x4-x2>=0.0\n",
      "   -0.0595 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1900 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.0559 if c>=1.0 & x2<=2.0 & x3-x1<=1.0\n",
      "   -0.2927 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.1639 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.4535 if c>=1.0\n",
      "   -0.4154 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.1787 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.1685 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.1206 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.3127 if x1>=2.0 & x4-x2>=1.0\n",
      "   +0.2772 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.3143 if x3-x1<=0.0 & x4-x2<=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.7156 if c>=1.0 & x1>=1.0\n",
      "   +0.3565 if c>=1.0 & x1>=3.0\n",
      "   -0.2184 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1366 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2039 if x1<=2.0 & x2<=0.0\n",
      "   -0.4789 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.4573 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.5626 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0898 if x4-x2>=2.0\n",
      "   +0.0000 if c<=0.0 & x2>=1.0 & x2>=3.0 & x3-x1<=1.0 & x3-x1>=0.0 & x4-x2<=1.0\n",
      "   -0.3228 if x1>=1.0 & x2>=2.0\n",
      "   +0.1446 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1484 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2171 if c<=0.0 & x1<=0.0 & x2<=0.0 & x3-x1<=0.0\n",
      "   -0.3454 if c<=0.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.5087 if x1<=0.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "init state [ 1  2  1 -1  0]\n",
      "(24,) (24,)\n",
      "init state [ 2  0 -1  2  0]\n",
      "(31,) (7,)\n",
      "init state [1 0 1 2 0]\n",
      "(37,) (6,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(46,) (9,)\n",
      "init state [ 1  2  1 -2  0]\n",
      "(66,) (20,)\n",
      "init state [ 2  2  1 -1  0]\n",
      "(75,) (9,)\n",
      "init state [0 0 2 2 0]\n",
      "(81,) (6,)\n",
      "init state [0 2 2 1 0]\n",
      "(85,) (4,)\n",
      "init state [2 1 0 2 0]\n",
      "(89,) (4,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(98,) (9,)\n",
      "============ 135 ===========\n",
      "Run episode 135 with rewards 33, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.4853 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4729 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4013 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.3619 if x1>=3.0 & x4-x2>=1.0\n",
      "   -0.0471 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.1477 if x1>=3.0 & x2>=1.0\n",
      "   +0.2529 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0784 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.9088 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.2672 if x3-x1>=-1.0\n",
      "   -0.1441 if x1<=1.0 & x1<=2.0 & x2<=0.0 & x4-x2<=2.0\n",
      "   -0.0496 if c>=1.0 & x1>=3.0\n",
      "   +0.0000 if x1<=1.0 & x3-x1<=-1.0 & x4-x2>=3.0\n",
      "   -0.3915 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if x3-x1<=-1.0 & x4-x2>=3.0\n",
      "   +0.3567 if x1<=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.4566 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1651 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.4392 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4857 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.5135 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.2418 if x3-x1>=-1.0\n",
      "   +0.7875 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.4155 if x3-x1>=1.0\n",
      "   -0.3138 if x1>=2.0\n",
      "   -0.0668 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0000 if x1<=0.0 & x2<=1.0 & x2>=1.0\n",
      "   +0.0447 if x2<=2.0\n",
      "   -0.5081 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.3571 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.5157 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   -0.2238 if x1<=1.0 & x1>=1.0 & x2>=2.0 & x4-x2>=1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.0729 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.7731 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.7731 if x4-x2>=0.0\n",
      "   -0.5650 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1226 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.1290 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.3440 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.4607 if c>=1.0\n",
      "   -0.0426 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.2106 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +0.1341 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +0.2936 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1744 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.0280 if c<=0.0 & x1<=1.0 & x2>=2.0 & x3-x1>=-1.0 & x3-x1>=0.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   -0.5434 if x3-x1<=0.0 & x4-x2<=2.0\n",
      "   +0.2024 if x1<=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4817 if c>=1.0 & x1>=1.0\n",
      "   +0.0621 if c>=1.0 & x1>=3.0\n",
      "   -0.7066 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0799 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.2539 if x1<=2.0 & x2<=0.0\n",
      "   -0.5269 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.1384 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.5052 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0584 if x4-x2>=2.0\n",
      "   +0.2312 if x1>=1.0 & x2>=2.0\n",
      "   -0.0381 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.3476 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=0.0 & x2<=0.0 & x3-x1<=0.0\n",
      "   -0.1274 if c<=0.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.3476 if x1<=0.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.6054 if \n",
      "init state [ 1  2  2 -1  0]\n",
      "(9,) (9,)\n",
      "init state [0 1 2 0 0]\n",
      "(18,) (9,)\n",
      "init state [ 1  1 -1  1  0]\n",
      "(30,) (12,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(39,) (9,)\n",
      "init state [0 1 0 2 0]\n",
      "(44,) (5,)\n",
      "init state [1 0 0 2 0]\n",
      "(51,) (7,)\n",
      "init state [ 2  3 -1  0  0]\n",
      "(58,) (7,)\n",
      "init state [3 0 0 1 0]\n",
      "(63,) (5,)\n",
      "init state [ 2  3 -1 -3  0]\n",
      "(100,) (37,)\n",
      "init state [ 1  3 -1 -2  0]\n",
      "(110,) (10,)\n",
      "============ 136 ===========\n",
      "Run episode 136 with rewards 32, accuracy 0.2\n",
      "----------------- 0 --------------\n",
      "   -0.4985 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5168 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2856 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.0262 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.2453 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.0240 if x1>=3.0 & x2>=1.0\n",
      "   -0.1819 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.1051 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.8735 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.4762 if x3-x1>=-1.0\n",
      "   -0.0754 if x1<=1.0 & x1<=2.0 & x2<=0.0 & x4-x2<=2.0\n",
      "   -0.1409 if c>=1.0 & x1>=3.0\n",
      "   -0.1505 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if x3-x1<=-1.0 & x4-x2>=3.0\n",
      "   -0.0801 if x1<=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.2880 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x3-x1<=0.0 & x4-x2<=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.6738 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4416 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.0980 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.8218 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.5987 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.0158 if x3-x1>=-1.0\n",
      "   -0.2138 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.4254 if x3-x1>=1.0\n",
      "   +0.5297 if x1>=2.0\n",
      "   -0.0600 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0396 if x2<=2.0\n",
      "   +0.1209 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.2467 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.0000 if x1<=1.0 & x1>=1.0 & x2>=2.0 & x4-x2>=1.0\n",
      "   +0.3444 if x1<=0.0 & x2>=1.0 & x3-x1>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.5155 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5417 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.5417 if x4-x2>=0.0\n",
      "   -0.4566 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3161 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.2839 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   +0.2362 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.5114 if c>=1.0\n",
      "   -0.0103 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.4528 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.3453 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1621 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0205 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.0006 if x3-x1<=0.0 & x4-x2<=2.0\n",
      "   -0.0672 if x1<=1.0\n",
      "   +0.1709 if x1<=0.0 & x2<=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.5374 if c>=1.0 & x1>=1.0\n",
      "   +0.2707 if c>=1.0 & x1>=3.0\n",
      "   -0.8386 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.3410 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.4001 if x1<=2.0 & x2<=0.0\n",
      "   -0.1637 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.2816 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.4699 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2456 if x4-x2>=2.0\n",
      "   -0.1345 if x1>=1.0 & x2>=2.0\n",
      "   +0.1479 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2456 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.0843 if c<=0.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.0000 if x1<=0.0 & x3-x1>=2.0 & x4-x2>=1.0\n",
      "   +0.0261 if \n",
      "   +0.5195 if c<=0.0 & x1<=1.0 & x4-x2<=1.0\n",
      "init state [ 2  1 -1  0  0]\n",
      "(15,) (15,)\n",
      "init state [3 1 0 1 0]\n",
      "(18,) (3,)\n",
      "init state [ 1  0 -1  2  0]\n",
      "(35,) (17,)\n",
      "init state [1 1 1 0 0]\n",
      "(43,) (8,)\n",
      "init state [0 2 2 0 0]\n",
      "(56,) (13,)\n",
      "init state [ 2  2 -1 -1  0]\n",
      "(73,) (17,)\n",
      "init state [ 3  0 -1  2  0]\n",
      "(93,) (20,)\n",
      "init state [1 0 1 1 0]\n",
      "(114,) (21,)\n",
      "init state [ 2  3 -1 -2  0]\n",
      "(129,) (15,)\n",
      "init state [ 3  1 -2  1  0]\n",
      "(140,) (11,)\n",
      "============ 137 ===========\n",
      "Run episode 137 with rewards 31, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -0.4782 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.5806 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2617 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.1818 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.0929 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.0681 if x1>=3.0 & x2>=1.0\n",
      "   -0.0797 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.2811 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.6225 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.3852 if x3-x1>=-1.0\n",
      "   -0.0288 if x1<=1.0 & x1<=2.0 & x2<=0.0 & x4-x2<=2.0\n",
      "   -0.0268 if c>=1.0 & x1>=3.0\n",
      "   -0.0854 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1574 if x1<=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x3-x1<=-1.0 & x3-x1<=0.0 & x4-x2<=-2.0\n",
      "   +0.3362 if x1>=1.0 & x2<=2.0 & x3-x1<=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.4274 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3310 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.0931 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4498 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.3026 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3327 if x3-x1>=-1.0\n",
      "   +0.0007 if x2<=0.0 & x3-x1>=1.0\n",
      "   +0.4840 if x3-x1>=1.0\n",
      "   -0.0296 if x1>=2.0\n",
      "   +0.2872 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.3635 if x2<=2.0\n",
      "   +0.0953 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0923 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.2712 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.0423 if x1<=0.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   +0.2289 if x3-x1<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.4427 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4866 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4866 if x4-x2>=0.0\n",
      "   -0.4730 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.1546 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.0091 if c>=1.0 & x3-x1<=-1.0 & x4-x2<=-1.0\n",
      "   -0.1775 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.2154 if c>=1.0\n",
      "   -0.0635 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.4249 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.2116 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2623 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0883 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.2864 if x1<=1.0\n",
      "   -0.0232 if x1<=0.0 & x2<=2.0\n",
      "   -0.3082 if x3-x1<=-3.0\n",
      "----------------- 3 --------------\n",
      "   +0.5991 if c>=1.0 & x1>=1.0\n",
      "   +0.0363 if c>=1.0 & x1>=3.0\n",
      "   -0.3308 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0737 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0540 if x1<=2.0 & x2<=0.0\n",
      "   +0.0357 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.4645 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.2631 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0753 if x4-x2>=2.0\n",
      "   -0.0547 if x1>=1.0 & x2>=2.0\n",
      "   -0.0024 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1<=0.0 & x4-x2>=1.0\n",
      "   +0.2425 if c<=0.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1390 if \n",
      "   -0.2188 if c<=0.0 & x1<=1.0 & x4-x2<=1.0\n",
      "   +0.1598 if x3-x1<=-3.0\n",
      "init state [ 2  3  0 -3  0]\n",
      "(48,) (48,)\n",
      "init state [0 1 3 1 0]\n",
      "(56,) (8,)\n",
      "init state [0 2 1 0 0]\n",
      "(65,) (9,)\n",
      "init state [ 1  3 -1 -3  0]\n",
      "(78,) (13,)\n",
      "init state [ 2  1  0 -1  0]\n",
      "(87,) (9,)\n",
      "init state [ 0  3  0 -1  0]\n",
      "(109,) (22,)\n",
      "init state [0 1 1 2 0]\n",
      "(122,) (13,)\n",
      "init state [2 1 0 2 0]\n",
      "(127,) (5,)\n",
      "init state [ 1  1 -1  1  0]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(133,) (6,)\n",
      "init state [1 0 0 1 0]\n",
      "(138,) (5,)\n",
      "============ 138 ===========\n",
      "Run episode 138 with rewards 37, accuracy 0.4\n",
      "----------------- 0 --------------\n",
      "   -0.6908 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.6206 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2873 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.0000 if x1>=3.0 & x4-x2>=1.0\n",
      "   +0.5082 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.0253 if x1>=3.0 & x2>=1.0\n",
      "   +0.1333 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0404 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.4881 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.4383 if x3-x1>=-1.0\n",
      "   +0.1100 if x1<=1.0 & x1<=2.0 & x2<=0.0 & x4-x2<=2.0\n",
      "   -0.2563 if c>=1.0 & x1>=3.0\n",
      "   -0.0995 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0157 if x1<=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.3617 if x1>=1.0 & x2<=2.0 & x3-x1<=-2.0\n",
      "   -0.1233 if c<=0.0 & x1>=3.0 & x2<=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.4451 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4303 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.6953 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.6069 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.4987 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.0775 if x3-x1>=-1.0\n",
      "   +0.2589 if x3-x1>=1.0\n",
      "   +0.0251 if x1>=2.0\n",
      "   +0.4578 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.4176 if x2<=2.0\n",
      "   -0.4314 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.2371 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.1551 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.1389 if x1<=0.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   +0.1738 if x3-x1<=0.0\n",
      "   +0.2304 if x3-x1>=3.0\n",
      "----------------- 2 --------------\n",
      "   +0.9353 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.5875 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.5875 if x4-x2>=0.0\n",
      "   -0.4066 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.0747 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.2021 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.5943 if c>=1.0\n",
      "   -0.0524 if x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.5265 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.3012 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.3868 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1460 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.1869 if x1<=1.0\n",
      "   -0.2815 if x1<=0.0 & x2<=2.0\n",
      "   -0.0936 if x3-x1<=-3.0\n",
      "   -0.0677 if x2<=0.0 & x3-x1>=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.5057 if c>=1.0 & x1>=1.0\n",
      "   +0.5954 if c>=1.0 & x1>=3.0\n",
      "   -0.3436 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1525 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0676 if x1<=2.0 & x2<=0.0\n",
      "   -0.3180 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.1822 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.1366 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.3102 if x4-x2>=2.0\n",
      "   +0.3724 if x1>=1.0 & x2>=2.0\n",
      "   +0.2016 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.6426 if c<=0.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.1225 if \n",
      "   +0.0587 if c<=0.0 & x1<=1.0 & x4-x2<=1.0\n",
      "   +0.2418 if x3-x1<=-3.0\n",
      "   -0.2883 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=1.0\n",
      "init state [1 3 1 0 0]\n",
      "(12,) (12,)\n",
      "init state [0 0 2 2 0]\n",
      "(37,) (25,)\n",
      "init state [ 1  2 -1 -1  0]\n",
      "(48,) (11,)\n",
      "init state [ 2  1 -2  1  0]\n",
      "(57,) (9,)\n",
      "init state [ 2  2 -1 -2  0]\n",
      "(73,) (16,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(102,) (29,)\n",
      "init state [0 1 2 1 0]\n",
      "(115,) (13,)\n",
      "init state [ 1  1 -1  1  0]\n",
      "(124,) (9,)\n",
      "init state [ 3  0 -3  2  0]\n",
      "(160,) (36,)\n",
      "init state [ 1  2  2 -1  0]\n",
      "(165,) (5,)\n",
      "============ 139 ===========\n",
      "Run episode 139 with rewards 37, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.2974 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.7374 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4214 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.2399 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.2272 if x1>=3.0 & x2>=1.0\n",
      "   +0.6430 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.2102 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.5650 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.2547 if x3-x1>=-1.0\n",
      "   -0.0070 if x1<=1.0 & x1<=2.0 & x2<=0.0 & x4-x2<=2.0\n",
      "   +0.1681 if c>=1.0 & x1>=3.0\n",
      "   +0.0693 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1959 if x1<=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.1309 if x1>=1.0 & x2<=2.0 & x3-x1<=-2.0\n",
      "   +0.1571 if c<=0.0 & x1>=3.0 & x2<=0.0\n",
      "   +0.5705 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.4071 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.1311 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.9857 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3850 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.4067 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.3071 if x3-x1>=-1.0\n",
      "   +0.0135 if x3-x1>=1.0\n",
      "   -0.1153 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.5382 if x2<=2.0\n",
      "   -0.2386 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.0108 if x2>=2.0 & x3-x1>=2.0 & x4-x2>=0.0\n",
      "   -0.0540 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   -0.0961 if x1<=0.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   +0.1678 if x3-x1<=0.0\n",
      "   +0.0275 if x3-x1>=3.0\n",
      "   +0.0699 if x3-x1>=2.0 & x4-x2>=-1.0\n",
      "----------------- 2 --------------\n",
      "   +0.8619 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4411 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4411 if x4-x2>=0.0\n",
      "   -0.4579 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2295 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.1171 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.4466 if c>=1.0\n",
      "   +0.6219 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.1451 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.3949 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0315 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.3920 if x1<=1.0\n",
      "   -0.0282 if x1<=0.0 & x2<=2.0\n",
      "   +0.1398 if x3-x1<=-3.0\n",
      "   -0.0684 if x2<=0.0 & x3-x1>=-1.0\n",
      "   -0.0972 if x1<=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.4828 if c>=1.0 & x1>=1.0\n",
      "   +0.3500 if c>=1.0 & x1>=3.0\n",
      "   -0.5512 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0642 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0038 if x1<=2.0 & x2<=0.0\n",
      "   -0.2720 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.2870 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.4917 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0972 if x4-x2>=2.0\n",
      "   +0.2853 if x1>=1.0 & x2>=2.0\n",
      "   -0.0248 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.5880 if c<=0.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   -0.1790 if \n",
      "   -0.0628 if x3-x1<=-3.0\n",
      "   -0.1364 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=1.0\n",
      "   +0.4076 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "init state [ 0  3  0 -2  0]\n",
      "(12,) (12,)\n",
      "init state [ 2  2 -1  1  0]\n",
      "(17,) (5,)\n",
      "init state [ 3  2 -3 -1  0]\n",
      "(48,) (31,)\n",
      "init state [2 2 0 1 0]\n",
      "(50,) (2,)\n",
      "init state [ 3  1 -2  2  0]\n",
      "(86,) (36,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(127,) (41,)\n",
      "init state [ 3  2 -1  0  0]\n",
      "(132,) (5,)\n",
      "init state [ 0  2  2 -2  0]\n",
      "(151,) (19,)\n",
      "init state [ 2  2  0 -2  0]\n",
      "(164,) (13,)\n",
      "init state [2 0 1 2 0]\n",
      "(168,) (4,)\n",
      "============ 140 ===========\n",
      "Run episode 140 with rewards 38, accuracy 0.9\n",
      "----------------- 0 --------------\n",
      "   -0.5697 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4953 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1255 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.1707 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.2048 if x1>=3.0 & x2>=1.0\n",
      "   +0.3380 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.1151 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.5016 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.1495 if x3-x1>=-1.0\n",
      "   +0.0209 if c>=1.0 & x1>=3.0\n",
      "   -0.5300 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.5289 if x1<=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0439 if x1>=1.0 & x2<=2.0 & x3-x1<=-2.0\n",
      "   +0.0315 if c<=0.0 & x1>=3.0 & x2<=0.0\n",
      "   -0.1944 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.3229 if x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "----------------- 1 --------------\n",
      "   -0.3228 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.3475 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.2713 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.6114 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.4618 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.3907 if x3-x1>=-1.0\n",
      "   +0.2811 if x3-x1>=1.0\n",
      "   -0.2522 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.3391 if x2<=2.0\n",
      "   -0.1912 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.2510 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   -0.0474 if x1<=0.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   +0.1893 if x3-x1<=0.0\n",
      "   +0.0000 if x3-x1>=3.0\n",
      "   -0.1659 if x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.3994 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.7521 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3652 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3652 if x4-x2>=0.0\n",
      "   -0.3507 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3289 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.2415 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.6398 if c>=1.0\n",
      "   +0.1888 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.0877 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.1401 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.2372 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.3399 if x1<=1.0\n",
      "   +0.1351 if x3-x1<=-3.0\n",
      "   -0.2017 if x2<=0.0 & x3-x1>=-1.0\n",
      "   -0.2321 if x1<=0.0\n",
      "   +0.0384 if x2>=2.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   +0.5084 if c>=1.0 & x1>=1.0\n",
      "   +0.2547 if c>=1.0 & x1>=3.0\n",
      "   -0.3372 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   +0.0516 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.5538 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.1823 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.9140 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2841 if x4-x2>=2.0\n",
      "   -0.2538 if x1>=1.0 & x2>=2.0\n",
      "   +0.0925 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.3697 if c<=0.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.0127 if \n",
      "   +0.0767 if x3-x1<=-3.0\n",
      "   -0.1773 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.4339 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.8509 if c>=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "init state [ 3  2 -2 -2  0]\n",
      "(15,) (15,)\n",
      "init state [ 3  1 -2  1  0]\n",
      "(23,) (8,)\n",
      "init state [ 2  1 -2  1  0]\n",
      "(36,) (13,)\n",
      "init state [0 1 0 1 0]\n",
      "(48,) (12,)\n",
      "init state [ 1  0 -1  2  0]\n",
      "(63,) (15,)\n",
      "init state [ 2  3  0 -2  0]\n",
      "(70,) (7,)\n",
      "init state [ 0  3  2 -3  0]\n",
      "(84,) (14,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(95,) (11,)\n",
      "init state [ 1  3  1 -3  0]\n",
      "(116,) (21,)\n",
      "init state [ 3  1 -3 -1  0]\n",
      "(150,) (34,)\n",
      "============ 141 ===========\n",
      "Run episode 141 with rewards 8, accuracy 0.8\n",
      "----------------- 0 --------------\n",
      "   -0.6124 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.7344 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1109 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.7697 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.0624 if x1>=3.0 & x2>=1.0\n",
      "   -0.2433 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.2595 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.3280 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.2387 if x3-x1>=-1.0\n",
      "   -0.2516 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.3608 if x1<=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.2464 if x1>=1.0 & x2<=2.0 & x3-x1<=-2.0\n",
      "   -0.0375 if c<=0.0 & x1>=3.0 & x2<=0.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1>=1.0 & x4-x2>=0.0\n",
      "   +0.2635 if x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.2521 if c<=0.0 & x1<=2.0 & x3-x1<=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.2782 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4595 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3316 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4600 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.4388 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.2648 if x3-x1>=-1.0\n",
      "   +0.0989 if x3-x1>=1.0\n",
      "   +0.0175 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0281 if x2<=2.0\n",
      "   -0.0391 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1663 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   -0.2050 if x1<=0.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.0130 if x3-x1<=0.0\n",
      "   +0.1055 if x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.1038 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=1.0\n",
      "   +0.3860 if x1<=1.0 & x4-x2>=1.0\n",
      "----------------- 2 --------------\n",
      "   +0.7162 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3610 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3610 if x4-x2>=0.0\n",
      "   -0.2915 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.3829 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.3152 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.6979 if c>=1.0\n",
      "   +0.2697 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.2469 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2030 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0842 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.1553 if x1<=1.0\n",
      "   -0.0768 if x3-x1<=-3.0\n",
      "   -0.3515 if x2<=0.0 & x3-x1>=-1.0\n",
      "   +0.3270 if x1<=0.0\n",
      "   +0.0215 if x1<=2.0 & x3-x1<=2.0 & x3-x1>=0.0\n",
      "----------------- 3 --------------\n",
      "   +0.6153 if c>=1.0 & x1>=1.0\n",
      "   +0.3218 if c>=1.0 & x1>=3.0\n",
      "   -0.6571 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.2126 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.4742 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.2039 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.2528 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1396 if x4-x2>=2.0\n",
      "   +0.0911 if x1>=1.0 & x2>=2.0\n",
      "   -0.0605 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x2>=2.0 & x3-x1>=0.0 & x4-x2>=0.0\n",
      "   +0.3394 if x3-x1<=-3.0\n",
      "   +0.0045 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.4245 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.3892 if c>=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -0.5579 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=1.0\n",
      "init state [ 0  3  0 -3  0]\n",
      "(23,) (23,)\n",
      "init state [ 0  3  2 -1  0]\n",
      "(32,) (9,)\n",
      "init state [0 1 2 2 0]\n",
      "(38,) (6,)\n",
      "init state [ 3  2 -3  0  0]\n",
      "(66,) (28,)\n",
      "init state [3 0 0 1 0]\n",
      "(69,) (3,)\n",
      "init state [ 3  2 -2  1  0]\n",
      "(79,) (10,)\n",
      "init state [ 3  2 -3  0  0]\n",
      "(105,) (26,)\n",
      "init state [2 1 1 0 0]\n",
      "(111,) (6,)\n",
      "init state [1 2 2 0 0]\n",
      "(114,) (3,)\n",
      "init state [ 2  2 -2 -2  0]\n",
      "(132,) (18,)\n",
      "============ 142 ===========\n",
      "Run episode 142 with rewards 24, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.6500 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4824 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1595 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.4006 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.4872 if x1>=3.0 & x2>=1.0\n",
      "   +0.0820 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.1625 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.7684 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.3822 if x3-x1>=-1.0\n",
      "   -0.3154 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.3443 if x1<=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.0005 if x1>=1.0 & x2<=2.0 & x3-x1<=-2.0\n",
      "   -0.0625 if c<=0.0 & x1>=3.0 & x2<=0.0\n",
      "   +0.0756 if x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0271 if c<=0.0 & x1<=2.0 & x3-x1<=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4967 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "----------------- 1 --------------\n",
      "   -0.2582 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4697 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.8028 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1533 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.5637 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.4147 if x3-x1>=-1.0\n",
      "   +0.7234 if x3-x1>=1.0\n",
      "   +0.2452 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0013 if x2<=2.0\n",
      "   -0.0848 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1985 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.1761 if x1<=0.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   +0.2684 if x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.1199 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=1.0\n",
      "   +0.0552 if x1<=1.0 & x4-x2>=1.0\n",
      "   -0.7728 if c<=0.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0\n",
      "----------------- 2 --------------\n",
      "   +0.1237 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3943 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3943 if x4-x2>=0.0\n",
      "   -0.2209 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2215 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.1064 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.1319 if c>=1.0\n",
      "   +0.2941 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.1574 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2369 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.2244 if x1>=2.0 & x4-x2>=1.0\n",
      "   +0.0072 if x1<=1.0\n",
      "   -0.3411 if x3-x1<=-3.0\n",
      "   -0.0863 if x2<=0.0 & x3-x1>=-1.0\n",
      "   +0.1761 if x1<=0.0\n",
      "   -0.2080 if x1>=3.0 & x3-x1<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +0.4347 if c>=1.0 & x1>=1.0\n",
      "   +0.5331 if c>=1.0 & x1>=3.0\n",
      "   -0.1953 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1019 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.8496 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.3636 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.6287 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.1118 if x4-x2>=2.0\n",
      "   -0.1482 if x1>=1.0 & x2>=2.0\n",
      "   +0.1477 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.4350 if x3-x1<=-3.0\n",
      "   +0.0909 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.4333 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.4899 if c>=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -0.1444 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=1.0\n",
      "   -0.3605 if x3-x1>=1.0 & x4-x2>=2.0\n",
      "init state [2 0 1 0 0]\n",
      "(4,) (4,)\n",
      "init state [2 2 1 0 0]\n",
      "(6,) (2,)\n",
      "init state [2 1 0 1 0]\n",
      "(9,) (3,)\n",
      "init state [1 1 1 1 0]\n",
      "(13,) (4,)\n",
      "init state [ 1  1 -1  2  0]\n",
      "(19,) (6,)\n",
      "init state [ 3  0 -3  1  0]\n",
      "(50,) (31,)\n",
      "init state [ 3  0 -2  1  0]\n",
      "(64,) (14,)\n",
      "init state [2 1 1 0 0]\n",
      "(68,) (4,)\n",
      "init state [ 2  0 -2  3  0]\n",
      "(99,) (31,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(118,) (19,)\n",
      "============ 143 ===========\n",
      "Run episode 143 with rewards 23, accuracy 1.0\n",
      "best\n",
      "----------------- 0 --------------\n",
      "   -0.5340 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.8333 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1357 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.4421 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.2783 if x1>=3.0 & x2>=1.0\n",
      "   +0.1529 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.0829 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.3742 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.3259 if x3-x1>=-1.0\n",
      "   -0.2576 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.2283 if x1<=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.0480 if c<=0.0 & x1>=3.0 & x2<=0.0\n",
      "   +0.1149 if x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0448 if c<=0.0 & x1<=2.0 & x3-x1<=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.0613 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0767 if x4-x2>=3.0\n",
      "----------------- 1 --------------\n",
      "   -0.5414 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.5574 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.9738 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.5917 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.4177 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.1401 if x3-x1>=-1.0\n",
      "   +0.5251 if x3-x1>=1.0\n",
      "   +0.2978 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   -0.0323 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.1447 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   -0.0000 if x1<=0.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   -0.0000 if x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.0889 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=1.0\n",
      "   -0.1538 if x1<=1.0 & x4-x2>=1.0\n",
      "   -0.6117 if c<=0.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0\n",
      "   -0.0868 if x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.2981 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.4681 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.4562 if x4-x2>=0.0\n",
      "   -0.4418 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1135 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -0.0444 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.4223 if c>=1.0\n",
      "   +0.0313 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.4249 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.4105 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1398 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.1747 if x3-x1<=-3.0\n",
      "   -0.0265 if x2<=0.0 & x3-x1>=-1.0\n",
      "   -0.0365 if x1<=0.0\n",
      "   -0.0993 if x1>=3.0 & x3-x1<=-1.0\n",
      "   -0.2346 if x4-x2>=1.0\n",
      "----------------- 3 --------------\n",
      "   +0.0677 if c>=1.0 & x1>=1.0\n",
      "   +0.7041 if c>=1.0 & x1>=3.0\n",
      "   -0.0000 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.0746 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.8918 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.6767 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.5496 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.1242 if x4-x2>=2.0\n",
      "   +0.2782 if x1>=1.0 & x2>=2.0\n",
      "   +0.1013 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.0297 if x3-x1<=-3.0\n",
      "   -0.2695 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1245 if c>=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.2989 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=1.0\n",
      "   -0.0000 if x3-x1>=1.0 & x4-x2>=2.0\n",
      "   -0.6051 if x1<=2.0 & x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "init state [ 0  1  0 -1  0]\n",
      "(12,) (12,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(112,) (100,)\n",
      "init state [ 1  1 -1  2  0]\n",
      "(118,) (6,)\n",
      "init state [0 1 0 2 0]\n",
      "(127,) (9,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(152,) (25,)\n",
      "init state [ 0  2  3 -1  0]\n",
      "(166,) (14,)\n",
      "init state [ 2  3  1 -2  0]\n",
      "(193,) (27,)\n",
      "init state [ 2  2  1 -2  0]\n",
      "(231,) (38,)\n",
      "init state [ 1  1  2 -1  0]\n",
      "(329,) (98,)\n",
      "init state [1 1 1 0 0]\n",
      "(333,) (4,)\n",
      "============ 144 ===========\n",
      "Run episode 144 with rewards 38, accuracy 0.7\n",
      "----------------- 0 --------------\n",
      "   -2.9475 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.2802 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.7894 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.0117 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +4.9343 if x1>=3.0 & x2>=1.0\n",
      "   -0.7499 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -1.4505 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   +1.8548 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.2933 if x3-x1>=-1.0\n",
      "   -0.2230 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.4385 if x1<=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0144 if c<=0.0 & x1>=3.0 & x2<=0.0\n",
      "   +0.0000 if x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +0.0000 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "   +0.0000 if x4-x2>=3.0\n",
      "   +5.8312 if c<=0.0 & x1>=1.0 & x4-x2<=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.1431 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -2.6754 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +1.2154 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.8591 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +0.1324 if x2<=2.0 & x3-x1<=0.0\n",
      "   -1.5614 if x3-x1>=-1.0\n",
      "   +0.1595 if x3-x1>=1.0\n",
      "   +0.8637 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.3022 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +0.2931 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.2040 if x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   -0.6969 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=1.0\n",
      "   +0.1263 if x1<=1.0 & x4-x2>=1.0\n",
      "   -0.1209 if c<=0.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0\n",
      "   +0.0604 if x3-x1<=-2.0 & x3-x1>=-2.0 & x4-x2<=0.0\n",
      "   -2.9494 if x4-x2<=-3.0\n",
      "----------------- 2 --------------\n",
      "   +0.6930 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3868 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3868 if x4-x2>=0.0\n",
      "   -0.3536 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +4.0196 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -1.5701 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -1.6271 if c>=1.0\n",
      "   +4.5338 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -1.3334 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.8059 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.0000 if x1>=2.0 & x4-x2>=1.0\n",
      "   -0.2067 if x3-x1<=-3.0\n",
      "   -0.8669 if x1<=0.0\n",
      "   -0.3108 if x1>=3.0 & x3-x1<=-1.0\n",
      "   -0.0449 if x4-x2>=1.0\n",
      "   +0.7883 if x2<=2.0 & x4-x2<=-1.0\n",
      "----------------- 3 --------------\n",
      "   +1.4117 if c>=1.0 & x1>=1.0\n",
      "   +1.3602 if c>=1.0 & x1>=3.0\n",
      "   -0.1052 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.2943 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.3055 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.2096 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.2114 if x4-x2>=2.0\n",
      "   -1.2477 if x1>=1.0 & x2>=2.0\n",
      "   +0.0000 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.2707 if x3-x1<=-3.0\n",
      "   -1.2343 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +1.3595 if c>=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +1.1489 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=1.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2>=2.0\n",
      "   +0.3566 if x1<=2.0 & x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -1.8055 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "init state [ 2  2  1 -2  0]\n",
      "(201,) (201,)\n",
      "init state [ 3  1 -3  1  0]\n",
      "(217,) (16,)\n",
      "init state [ 2  3 -2 -1  0]\n",
      "(230,) (13,)\n",
      "init state [3 0 0 1 0]\n",
      "(431,) (201,)\n",
      "init state [ 2  3  1 -2  0]\n",
      "(632,) (201,)\n",
      "init state [0 0 1 2 0]\n",
      "(647,) (15,)\n",
      "init state [ 1  3  2 -1  0]\n",
      "(743,) (96,)\n",
      "init state [ 2  3  1 -3  0]\n",
      "(944,) (201,)\n",
      "init state [ 0  3  3 -3  0]\n",
      "(1145,) (201,)\n",
      "init state [1 2 0 1 0]\n",
      "(1158,) (13,)\n",
      "============ 145 ===========\n",
      "Run episode 145 with rewards 29, accuracy 0.1\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_316/4286230475.py:3: RuntimeWarning: overflow encountered in exp\n",
      "  exps = np.exp(all_values)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: overflow encountered in exp\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: invalid value encountered in divide\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
      "/tmp/ipykernel_316/4286230475.py:3: RuntimeWarning: overflow encountered in exp\n",
      "  exps = np.exp(all_values)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: overflow encountered in exp\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: invalid value encountered in divide\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 0 --------------\n",
      "   -7.4782 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.1684 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -6.2738 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.3875 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -5.1669 if x1>=3.0 & x2>=1.0\n",
      "   -2.0213 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -2.5184 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -8.1086 if c<=0.0 & x3-x1>=0.0\n",
      "  -11.1963 if x3-x1>=-1.0\n",
      "   -0.5746 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.7276 if x1<=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.0373 if c<=0.0 & x1>=3.0 & x2<=0.0\n",
      "   +0.4032 if x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0000 if x4-x2>=3.0\n",
      "   -5.1778 if c<=0.0 & x1>=1.0 & x4-x2<=-2.0\n",
      "   +1.7738 if c<=0.0 & x1<=1.0 & x3-x1<=1.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_316/4286230475.py:3: RuntimeWarning: overflow encountered in exp\n",
      "  exps = np.exp(all_values)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: overflow encountered in exp\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: invalid value encountered in divide\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   -0.4801 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   +1.4960 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +2.7343 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.4859 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.7700 if x2<=2.0 & x3-x1<=0.0\n",
      "   +6.3099 if x3-x1>=-1.0\n",
      "   +5.9288 if x3-x1>=1.0\n",
      "   +0.5991 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +2.4463 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -1.3516 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +1.1990 if x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.6788 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=1.0\n",
      "   -0.9474 if x1<=1.0 & x4-x2>=1.0\n",
      "   -0.4984 if c<=0.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0\n",
      "   +5.5038 if x4-x2<=-3.0\n",
      "   +0.9599 if c<=0.0 & x1<=1.0 & x3-x1<=1.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_316/4286230475.py:3: RuntimeWarning: overflow encountered in exp\n",
      "  exps = np.exp(all_values)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: overflow encountered in exp\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: invalid value encountered in divide\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +0.4053 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -6.1439 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -6.1439 if x4-x2>=0.0\n",
      "   -5.4734 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +2.9372 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +6.2151 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -1.8092 if c>=1.0\n",
      "   +0.5745 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -6.6439 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +9.8034 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1720 if x3-x1<=-3.0\n",
      "  +13.6960 if x1<=0.0\n",
      "   -0.2803 if x1>=3.0 & x3-x1<=-1.0\n",
      "   -3.3534 if x4-x2>=1.0\n",
      "   +8.7750 if x2<=2.0 & x4-x2<=-1.0\n",
      "   +3.9541 if \n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_316/4286230475.py:3: RuntimeWarning: overflow encountered in exp\n",
      "  exps = np.exp(all_values)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: overflow encountered in exp\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: invalid value encountered in divide\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   -3.9567 if c>=1.0 & x1>=1.0\n",
      "   -0.7258 if c>=1.0 & x1>=3.0\n",
      "  +15.7447 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "  +13.3867 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -2.1494 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.0245 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.3511 if x4-x2>=2.0\n",
      "   -5.6165 if x1>=1.0 & x2>=2.0\n",
      "   +0.5445 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.1638 if x3-x1<=-3.0\n",
      "  +14.5227 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -2.2404 if c>=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -1.4834 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=1.0\n",
      "   -4.3194 if x1<=2.0 & x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.9359 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +6.8486 if x3-x1>=1.0 & x4-x2<=-1.0\n",
      "init state [0 1 2 0 0]\n",
      "(201,) (201,)\n",
      "init state [2 1 0 1 0]\n",
      "(402,) (201,)\n",
      "init state [ 1  3  0 -3  0]\n",
      "(603,) (201,)\n",
      "init state [ 1  3  2 -2  0]\n",
      "(804,) (201,)\n",
      "init state [ 2  3  0 -3  0]\n",
      "(1005,) (201,)\n",
      "init state [ 3  1 -2  0  0]\n",
      "(1206,) (201,)\n",
      "init state [ 3  1 -2  1  0]\n",
      "(1407,) (201,)\n",
      "init state [ 1  2  2 -1  0]\n",
      "(1608,) (201,)\n",
      "init state [ 0  2  0 -2  0]\n",
      "(1809,) (201,)\n",
      "init state [ 3  1 -2  0  0]\n",
      "(2010,) (201,)\n",
      "============ 146 ===========\n",
      "Run episode 146 with rewards -201, accuracy 0.0\n",
      "----------------- 0 --------------\n",
      "   +6.5961 if c>=1.0 & x3-x1<=1.0\n",
      "  +10.3899 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "  +10.9636 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +8.1984 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "  +16.8699 if x1>=3.0 & x2>=1.0\n",
      "   +1.7829 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "  +11.7762 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   +7.4197 if c<=0.0 & x3-x1>=0.0\n",
      "  +15.3386 if x3-x1>=-1.0\n",
      "   +0.5159 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.6417 if x1<=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.6368 if c<=0.0 & x1>=3.0 & x2<=0.0\n",
      "   +3.0602 if x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +7.4032 if c<=0.0 & x1>=1.0 & x4-x2<=-2.0\n",
      "   +1.7890 if c<=0.0 & x1<=1.0 & x3-x1<=1.0\n",
      "   +1.0000 if x1<=2.0 & x2<=0.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_316/4286230475.py:3: RuntimeWarning: overflow encountered in exp\n",
      "  exps = np.exp(all_values)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: overflow encountered in exp\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: invalid value encountered in divide\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "   +4.6657 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +1.9506 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.3306 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   +9.4685 if x2<=2.0 & x3-x1<=0.0\n",
      "   +3.8591 if x3-x1>=-1.0\n",
      "   +4.0335 if x3-x1>=1.0\n",
      "   +0.4076 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +5.7132 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +9.8643 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.8156 if x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.4619 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=1.0\n",
      "   +0.6447 if x1<=1.0 & x4-x2>=1.0\n",
      "   +0.3399 if c<=0.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0\n",
      "   +3.3434 if x4-x2<=-3.0\n",
      "   +0.5742 if c<=0.0 & x1<=1.0 & x3-x1<=1.0\n",
      "   +1.0000 if x2<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "----------------- 2 --------------\n",
      "   +0.4053 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   +6.1439 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +6.1439 if x4-x2>=0.0\n",
      "   +5.4734 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +2.9372 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +6.2151 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +1.8092 if c>=1.0\n",
      "   +0.5745 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +6.6439 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +9.8034 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "  +13.6960 if x1<=0.0\n",
      "   +0.2803 if x1>=3.0 & x3-x1<=-1.0\n",
      "   +3.3534 if x4-x2>=1.0\n",
      "   +8.7750 if x2<=2.0 & x4-x2<=-1.0\n",
      "   +3.9541 if \n",
      "   +1.0000 if x1>=3.0 & x2<=0.0 & x3-x1>=-2.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_316/4286230475.py:3: RuntimeWarning: overflow encountered in exp\n",
      "  exps = np.exp(all_values)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: overflow encountered in exp\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: invalid value encountered in divide\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
      "/tmp/ipykernel_316/4286230475.py:3: RuntimeWarning: overflow encountered in exp\n",
      "  exps = np.exp(all_values)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: overflow encountered in exp\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: invalid value encountered in divide\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   -0.0650 if c>=1.0 & x1>=1.0\n",
      "   -0.0119 if c>=1.0 & x1>=3.0\n",
      "   -0.3786 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.1913 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.7339 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.0058 if x4-x2>=2.0\n",
      "  +25.5604 if x1>=1.0 & x2>=2.0\n",
      "   -0.0089 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +1.7190 if x3-x1<=-3.0\n",
      "   +0.3131 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0368 if c>=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +1.2057 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=1.0\n",
      "   -0.0233 if x1<=2.0 & x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   -0.0301 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -0.1992 if x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.9283 if x1<=0.0 & x2>=3.0\n",
      "init state [ 2  2  1 -1  0]\n",
      "(201,) (201,)\n",
      "init state [1 1 1 2 0]\n",
      "(402,) (201,)\n",
      "init state [1 0 1 1 0]\n",
      "(603,) (201,)\n",
      "init state [ 1  0 -1  1  0]\n",
      "(804,) (201,)\n",
      "init state [ 2  2 -1  0  0]\n",
      "(1005,) (201,)\n",
      "init state [ 1  3  0 -2  0]\n",
      "(1206,) (201,)\n",
      "init state [ 3  1 -1  1  0]\n",
      "(1407,) (201,)\n",
      "init state [ 2  3 -2  0  0]\n",
      "(1608,) (201,)\n",
      "init state [ 0  1  1 -1  0]\n",
      "(1809,) (201,)\n",
      "init state [2 0 0 3 0]\n",
      "(2010,) (201,)\n",
      "============ 147 ===========\n",
      "Run episode 147 with rewards -201, accuracy 0.0\n",
      "----------------- 0 --------------\n",
      "   +0.0000 if c>=1.0 & x3-x1<=1.0\n",
      "   -0.2416 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.4499 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   -0.5203 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   -0.1006 if x1>=3.0 & x2>=1.0\n",
      "   -0.1102 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.1006 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -1.6932 if c<=0.0 & x3-x1>=0.0\n",
      "   -2.2135 if x3-x1>=-1.0\n",
      "   -0.1410 if x1<=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   -0.2787 if c<=0.0 & x1>=3.0 & x2<=0.0\n",
      "   -0.1842 if x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.1552 if c<=0.0 & x1>=1.0 & x4-x2<=-2.0\n",
      "   -0.3480 if c<=0.0 & x1<=1.0 & x3-x1<=1.0\n",
      "   -1.5141 if x1<=2.0 & x2<=0.0\n",
      "   +0.0000 if x1>=3.0\n",
      "----------------- 1 --------------\n",
      "   +0.0000 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   -0.2748 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -0.9251 if x2<=2.0 & x3-x1<=0.0\n",
      "   -0.9251 if x3-x1>=-1.0\n",
      "   +0.0000 if x3-x1>=1.0\n",
      "   +0.0000 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0000 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.9251 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.0000 if x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=1.0\n",
      "   +0.0000 if x1<=1.0 & x4-x2>=1.0\n",
      "   -0.9251 if c<=0.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0\n",
      "   +0.0000 if x4-x2<=-3.0\n",
      "   +0.0000 if c<=0.0 & x1<=1.0 & x3-x1<=1.0\n",
      "   +0.0000 if x2<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.0000 if x1>=2.0 & x3-x1>=0.0 & x4-x2<=2.0 & x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -0.1524 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -2.7104 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -2.2833 if x4-x2>=0.0\n",
      "   -2.0878 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -1.1048 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -2.3378 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.6805 if c>=1.0\n",
      "   -0.2161 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -2.9729 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -3.7859 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -4.7951 if x1<=0.0\n",
      "   -1.1917 if x4-x2>=1.0\n",
      "   -3.2967 if x2<=2.0 & x4-x2<=-1.0\n",
      "   -1.5289 if \n",
      "   -0.6863 if x1>=3.0 & x2<=0.0 & x3-x1>=-2.0\n",
      "   +1.0000 if x3-x1>=-1.0 & x4-x2<=2.0\n",
      "----------------- 3 --------------\n",
      "   +0.0000 if c>=1.0 & x1>=1.0\n",
      "   +0.0000 if c>=1.0 & x1>=3.0\n",
      "   +0.0000 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.0626 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   -0.0626 if x1>=1.0 & x2>=2.0\n",
      "   +0.0000 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if x3-x1<=-3.0\n",
      "   -0.0626 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0000 if c>=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=1.0\n",
      "   -0.0626 if x1<=2.0 & x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -0.0626 if x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.0000 if x1<=0.0 & x2>=3.0\n",
      "   +0.0000 if x1>=1.0 & x4-x2<=-2.0\n",
      "init state [0 0 3 1 0]\n",
      "(201,) (201,)\n",
      "init state [ 2  2  0 -2  0]\n",
      "(402,) (201,)\n",
      "init state [1 0 0 1 0]\n",
      "(413,) (11,)\n",
      "init state [ 2  3  1 -2  0]\n",
      "(614,) (201,)\n",
      "init state [0 1 2 1 0]\n",
      "(815,) (201,)\n",
      "init state [2 1 1 1 0]\n",
      "(1016,) (201,)\n",
      "init state [ 1  3  0 -1  0]\n",
      "(1217,) (201,)\n",
      "init state [ 2  2 -2  1  0]\n",
      "(1324,) (107,)\n",
      "init state [0 0 1 1 0]\n",
      "(1344,) (20,)\n",
      "init state [0 0 1 0 0]\n",
      "(1362,) (18,)\n",
      "============ 148 ===========\n",
      "Run episode 148 with rewards 24, accuracy 0.1\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_316/4286230475.py:3: RuntimeWarning: overflow encountered in exp\n",
      "  exps = np.exp(all_values)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: overflow encountered in exp\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: invalid value encountered in divide\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 0 --------------\n",
      "   -0.3376 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4812 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "  +11.6861 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.4669 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "  +10.2475 if x1>=3.0 & x2>=1.0\n",
      "   +0.2378 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   +0.2788 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   +8.5702 if c<=0.0 & x3-x1>=0.0\n",
      "  +13.3112 if x3-x1>=-1.0\n",
      "   +0.1303 if x1<=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.2501 if c<=0.0 & x1>=3.0 & x2<=0.0\n",
      "   +0.1687 if x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   +6.5603 if c<=0.0 & x1>=1.0 & x4-x2<=-2.0\n",
      "   +0.3939 if c<=0.0 & x1<=1.0 & x3-x1<=1.0\n",
      "   +1.2225 if x1<=2.0 & x2<=0.0\n",
      "   +1.0000 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_316/4286230475.py:3: RuntimeWarning: overflow encountered in exp\n",
      "  exps = np.exp(all_values)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: overflow encountered in exp\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: invalid value encountered in divide\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 1 --------------\n",
      "  +12.5912 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +2.0989 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +1.1863 if x2<=2.0 & x3-x1<=0.0\n",
      "  +13.5253 if x3-x1>=-1.0\n",
      "   +0.3596 if x3-x1>=1.0\n",
      "   +0.0147 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "  +10.7356 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +1.2484 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.0311 if x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.2296 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=1.0\n",
      "   -0.1311 if x1<=1.0 & x4-x2>=1.0\n",
      "   +1.0793 if c<=0.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0\n",
      "   +2.0834 if x4-x2<=-3.0\n",
      "   +0.0689 if c<=0.0 & x1<=1.0 & x3-x1<=1.0\n",
      "   +0.6113 if x2<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +1.0000 if x1<=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_316/4286230475.py:3: RuntimeWarning: overflow encountered in exp\n",
      "  exps = np.exp(all_values)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: overflow encountered in exp\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: invalid value encountered in divide\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 2 --------------\n",
      "   +2.7816 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   +2.3632 if x4-x2>=0.0\n",
      "   +2.1717 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +3.8009 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +2.2846 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   +0.5981 if c>=1.0\n",
      "   +2.7192 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   +5.2486 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   +6.0536 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   +4.6786 if x1<=0.0\n",
      "   +1.1523 if x4-x2>=1.0\n",
      "   +3.2820 if x2<=2.0 & x4-x2<=-1.0\n",
      "   +4.1785 if \n",
      "   +0.6723 if x1>=3.0 & x2<=0.0 & x3-x1>=-2.0\n",
      "   +3.3046 if x3-x1>=-1.0 & x4-x2<=2.0\n",
      "   +1.0000 if x2<=2.0 & x4-x2>=0.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_316/4286230475.py:3: RuntimeWarning: overflow encountered in exp\n",
      "  exps = np.exp(all_values)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: overflow encountered in exp\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n",
      "/tmp/ipykernel_316/4286230475.py:4: RuntimeWarning: invalid value encountered in divide\n",
      "  res = np.exp(all_values[np.arange(values.shape[0]), action]) / np.sum(exps, axis=1)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------- 3 --------------\n",
      "   -1.0774 if c>=1.0 & x1>=1.0\n",
      "   -0.0000 if c>=1.0 & x1>=3.0\n",
      "   -0.9690 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +3.0429 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   -0.1748 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "  +13.6818 if x1>=1.0 & x2>=2.0\n",
      "   -0.7797 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.5741 if x3-x1<=-3.0\n",
      "  +11.1300 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.4475 if c>=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.1600 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=1.0\n",
      "   +1.6134 if x1<=2.0 & x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "  +10.8632 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.6803 if x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   -0.2490 if x1<=0.0 & x2>=3.0\n",
      "   +1.0000 if x1>=3.0 & x2>=3.0 & x4-x2>=-2.0\n",
      "init state [ 3  0 -2  0  0]\n",
      "(201,) (201,)\n",
      "init state [ 3  2 -1 -2  0]\n",
      "(402,) (201,)\n",
      "init state [ 1  0 -1  2  0]\n",
      "(603,) (201,)\n",
      "init state [1 0 0 1 0]\n",
      "(804,) (201,)\n",
      "init state [ 1  2 -1  0  0]\n",
      "(1005,) (201,)\n",
      "init state [0 0 2 1 0]\n",
      "(1206,) (201,)\n",
      "init state [ 3  0 -3  0  0]\n",
      "(1407,) (201,)\n",
      "init state [ 2  0 -1  3  0]\n",
      "(1608,) (201,)\n",
      "init state [ 3  0 -1  1  0]\n",
      "(1809,) (201,)\n",
      "init state [ 1  1 -1 -1  0]\n",
      "(2010,) (201,)\n",
      "============ 149 ===========\n",
      "Run episode 149 with rewards -201, accuracy 0.0\n",
      "----------------- 0 --------------\n",
      "   +0.0174 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.0248 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.2732 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.0280 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.1413 if x1>=3.0 & x2>=1.0\n",
      "   +0.0127 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.3721 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.0158 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.1542 if x3-x1>=-1.0\n",
      "   +0.0129 if c<=0.0 & x1>=3.0 & x2<=0.0\n",
      "   +0.0087 if x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.3981 if c<=0.0 & x1>=1.0 & x4-x2<=-2.0\n",
      "   -0.4754 if c<=0.0 & x1<=1.0 & x3-x1<=1.0\n",
      "   -0.0685 if x1<=2.0 & x2<=0.0\n",
      "   +0.0515 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=0.0 & x4-x2>=-1.0\n",
      "   +1.0000 if x2>=2.0 & x3-x1>=-2.0\n",
      "----------------- 1 --------------\n",
      "   -0.1171 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.3208 if x1<=2.0 & x4-x2>=-2.0\n",
      "   -1.3958 if x2<=2.0 & x3-x1<=0.0\n",
      "   +1.7713 if x3-x1>=-1.0\n",
      "   +0.2064 if x3-x1>=1.0\n",
      "   -0.1512 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -1.3823 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.2165 if x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.0249 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=1.0\n",
      "   +0.1934 if x1<=1.0 & x4-x2>=1.0\n",
      "   +0.2529 if c<=0.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0\n",
      "   +0.2262 if x4-x2<=-3.0\n",
      "   -0.0265 if c<=0.0 & x1<=1.0 & x3-x1<=1.0\n",
      "   -0.4036 if x2<=2.0 & x3-x1<=0.0 & x4-x2<=0.0\n",
      "   +0.1086 if x1<=2.0 & x3-x1<=-1.0 & x4-x2<=-2.0\n",
      "   +1.0000 if x4-x2>=2.0\n",
      "----------------- 2 --------------\n",
      "   -3.7107 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -3.0610 if x4-x2>=0.0\n",
      "   -0.9378 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "  -10.9425 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   -5.4456 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -7.8289 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "  -11.4206 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "  -12.0314 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "  -13.3347 if x1<=0.0\n",
      "   -0.7066 if x4-x2>=1.0\n",
      "   -9.3665 if x2<=2.0 & x4-x2<=-1.0\n",
      "   -8.2051 if \n",
      "   +4.0729 if x1>=3.0 & x2<=0.0 & x3-x1>=-2.0\n",
      "   -9.2076 if x3-x1>=-1.0 & x4-x2<=2.0\n",
      "   +0.8635 if x2<=2.0 & x4-x2>=0.0\n",
      "   +1.0000 if x3-x1>=-2.0\n",
      "----------------- 3 --------------\n",
      "   +0.0000 if c>=1.0 & x1>=1.0\n",
      "   +0.0000 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.0000 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.0000 if x1>=1.0 & x2>=2.0\n",
      "   +0.0000 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.0000 if x3-x1<=-3.0\n",
      "   +0.0000 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.0000 if c>=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=1.0\n",
      "   +0.0000 if x1<=2.0 & x1>=1.0 & x4-x2<=1.0 & x4-x2>=-1.0\n",
      "   +0.0000 if x1>=2.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x3-x1>=1.0 & x4-x2<=-1.0\n",
      "   +0.0000 if x1<=0.0 & x2>=3.0\n",
      "   +0.0000 if x1>=3.0 & x2>=3.0 & x4-x2>=-2.0\n",
      "   +0.0000 if x3-x1<=-2.0 & x4-x2>=3.0\n",
      "\n",
      "Done\n"
     ]
    }
   ],
   "source": [
    "rewards = train()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "39cee1c7",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "id": "3d20e8e0",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "------------------------\n",
      "   -0.6500 if c>=1.0 & x3-x1<=1.0\n",
      "   +0.4824 if c<=0.0 & x3-x1<=-1.0 & x4-x2<=1.0 & x4-x2>=0.0\n",
      "   -0.1595 if x3-x1<=1.0 & x3-x1>=-1.0 & x4-x2<=1.0\n",
      "   +0.4006 if c<=0.0 & x2<=1.0 & x3-x1<=-1.0\n",
      "   +0.4872 if x1>=3.0 & x2>=1.0\n",
      "   +0.0820 if c<=0.0 & x1<=1.0 & x3-x1<=0.0 & x4-x2>=-1.0\n",
      "   -0.1625 if x1>=3.0 & x2<=2.0 & x2>=1.0\n",
      "   -0.7684 if c<=0.0 & x3-x1>=0.0\n",
      "   -0.3822 if x3-x1>=-1.0\n",
      "   -0.3154 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.3443 if x1<=2.0 & x3-x1<=-1.0 & x4-x2>=1.0\n",
      "   +0.0005 if x1>=1.0 & x2<=2.0 & x3-x1<=-2.0\n",
      "   -0.0625 if c<=0.0 & x1>=3.0 & x2<=0.0\n",
      "   +0.0756 if x1>=2.0 & x4-x2<=1.0 & x4-x2>=1.0\n",
      "   -0.0271 if c<=0.0 & x1<=2.0 & x3-x1<=1.0 & x4-x2<=1.0 & x4-x2>=-1.0 & x4-x2>=-2.0\n",
      "   +0.4967 if c<=0.0 & x1>=3.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=0.0\n",
      "------------------------\n",
      "   -0.2582 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x4-x2>=-2.0\n",
      "   -0.4697 if c<=0.0 & x3-x1<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0\n",
      "   +0.8028 if x1<=2.0 & x4-x2>=-2.0\n",
      "   +0.1533 if c>=1.0 & x3-x1<=0.0 & x3-x1>=-2.0\n",
      "   -0.5637 if x2<=2.0 & x3-x1<=0.0\n",
      "   +0.4147 if x3-x1>=-1.0\n",
      "   +0.7234 if x3-x1>=1.0\n",
      "   +0.2452 if c<=0.0 & x2<=1.0 & x2>=1.0 & x3-x1<=1.0 & x3-x1>=1.0\n",
      "   +0.0013 if x2<=2.0\n",
      "   -0.0848 if c<=0.0 & x3-x1>=-2.0 & x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.1985 if x2<=2.0 & x3-x1<=1.0 & x4-x2<=2.0\n",
      "   +0.1761 if x1<=0.0 & x2>=1.0 & x3-x1>=1.0\n",
      "   +0.2684 if x3-x1>=2.0 & x4-x2>=-1.0\n",
      "   +0.1199 if x1>=2.0 & x2>=2.0 & x3-x1>=1.0 & x4-x2<=1.0\n",
      "   +0.0552 if x1<=1.0 & x4-x2>=1.0\n",
      "   -0.7728 if c<=0.0 & x2<=2.0 & x3-x1<=0.0 & x3-x1>=-1.0 & x3-x1>=-2.0\n",
      "------------------------\n",
      "   +0.1237 if c<=0.0 & x3-x1<=0.0 & x4-x2<=-1.0 & x4-x2>=-2.0\n",
      "   -0.3943 if x4-x2<=2.0 & x4-x2>=0.0\n",
      "   -0.3943 if x4-x2>=0.0\n",
      "   -0.2209 if x4-x2<=1.0 & x4-x2>=0.0\n",
      "   +0.2215 if c<=0.0 & x1>=1.0 & x2>=3.0\n",
      "   +0.1064 if c<=0.0 & x2<=1.0 & x4-x2<=0.0\n",
      "   -0.1319 if c>=1.0\n",
      "   +0.2941 if x3-x1<=0.0 & x4-x2<=-1.0\n",
      "   -0.1574 if x3-x1<=1.0 & x4-x2>=-2.0\n",
      "   -0.2369 if x4-x2<=1.0 & x4-x2>=-2.0\n",
      "   -0.2244 if x1>=2.0 & x4-x2>=1.0\n",
      "   +0.0072 if x1<=1.0\n",
      "   -0.3411 if x3-x1<=-3.0\n",
      "   -0.0863 if x2<=0.0 & x3-x1>=-1.0\n",
      "   +0.1761 if x1<=0.0\n",
      "   -0.2080 if x1>=3.0 & x3-x1<=-1.0\n",
      "------------------------\n",
      "   +0.4347 if c>=1.0 & x1>=1.0\n",
      "   +0.5331 if c>=1.0 & x1>=3.0\n",
      "   -0.1953 if c<=0.0 & x3-x1>=0.0 & x4-x2<=-1.0\n",
      "   -0.1019 if x1<=0.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   -0.8496 if x1<=2.0 & x2>=1.0 & x4-x2<=0.0\n",
      "   +0.3636 if x1>=1.0 & x2<=2.0 & x3-x1<=1.0 & x3-x1>=-1.0\n",
      "   +0.6287 if c<=0.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   -0.1118 if x4-x2>=2.0\n",
      "   -0.1482 if x1>=1.0 & x2>=2.0\n",
      "   +0.1477 if c<=0.0 & x2<=0.0 & x3-x1>=-2.0 & x3-x1>=0.0 & x4-x2>=1.0\n",
      "   +0.4350 if x3-x1<=-3.0\n",
      "   +0.0909 if x1>=1.0 & x3-x1<=1.0 & x4-x2<=1.0\n",
      "   -0.4333 if x3-x1>=-1.0 & x4-x2<=0.0 & x4-x2>=-2.0\n",
      "   +0.4899 if c>=1.0 & x3-x1<=0.0 & x3-x1>=0.0 & x4-x2>=-2.0\n",
      "   -0.1444 if x2>=1.0 & x3-x1<=-1.0 & x3-x1>=-2.0 & x4-x2>=1.0\n",
      "   -0.3605 if x3-x1>=1.0 & x4-x2>=2.0\n"
     ]
    }
   ],
   "source": [
    "for i in range(4):\n",
    "    print('------------------------')\n",
    "    print(actor.best_model[i].rules_)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "id": "0b443f87",
   "metadata": {},
   "outputs": [],
   "source": [
    "def test(num_test_episodes=100):\n",
    "    \"\"\"\n",
    "    Test the learned policy using the trained actor model.\n",
    "\n",
    "    Args:\n",
    "        num_test_episodes (int): Number of episodes to test the model.\n",
    "\n",
    "    Returns:\n",
    "        float: Average reward over the test episodes.\n",
    "    \"\"\"\n",
    "    total_reward = 0\n",
    "\n",
    "    for episode in range(num_test_episodes):\n",
    "        state = env.reset()[0]  # Reset the environment and get the initial state\n",
    "        episode_reward = 0\n",
    "\n",
    "        for t in range(1, 100):  # Limit the number of time steps\n",
    "            # Convert state to tensor and predict action probabilities\n",
    "            #             state_tensor = torch.tensor(state, dtype=torch.float32).to(device)\n",
    "            action_probs = actor.predict(pd.DataFrame(np.array([state]), columns=column_names))\n",
    "            # Select action based on the highest probability\n",
    "            action = np.argmax(action_probs)\n",
    "            # Take the chosen action\n",
    "            next_state, reward, done, trunc, _ = env.step(action)\n",
    "            # Accumulate reward\n",
    "            episode_reward += reward\n",
    "            if done or trunc:\n",
    "                break\n",
    "            # Update state\n",
    "            state = next_state\n",
    "        total_reward += episode_reward\n",
    "        print(f\"Test Episode {episode + 1}, Reward: {episode_reward}\")\n",
    "    avg_reward = total_reward / num_test_episodes\n",
    "    print(f\"\\nAverage Reward over {num_test_episodes} Test Episodes: {avg_reward}\")\n",
    "    return avg_reward"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "id": "ef9e3e26",
   "metadata": {
    "scrolled": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Test Episode 1, Reward: 39\n",
      "Test Episode 2, Reward: 35\n",
      "Test Episode 3, Reward: 33\n",
      "Test Episode 4, Reward: 37\n",
      "Test Episode 5, Reward: 34\n",
      "Test Episode 6, Reward: 36\n",
      "Test Episode 7, Reward: 35\n",
      "Test Episode 8, Reward: 35\n",
      "Test Episode 9, Reward: 39\n",
      "Test Episode 10, Reward: 35\n",
      "Test Episode 11, Reward: 39\n",
      "Test Episode 12, Reward: 37\n",
      "Test Episode 13, Reward: 36\n",
      "Test Episode 14, Reward: 39\n",
      "Test Episode 15, Reward: 33\n",
      "Test Episode 16, Reward: 35\n",
      "Test Episode 17, Reward: -99\n",
      "Test Episode 18, Reward: 37\n",
      "Test Episode 19, Reward: 35\n",
      "Test Episode 20, Reward: 37\n",
      "Test Episode 21, Reward: 36\n",
      "Test Episode 22, Reward: 36\n",
      "Test Episode 23, Reward: -99\n",
      "Test Episode 24, Reward: 34\n",
      "Test Episode 25, Reward: 37\n",
      "Test Episode 26, Reward: 36\n",
      "Test Episode 27, Reward: 36\n",
      "Test Episode 28, Reward: 34\n",
      "Test Episode 29, Reward: 35\n",
      "Test Episode 30, Reward: 37\n",
      "Test Episode 31, Reward: 39\n",
      "Test Episode 32, Reward: 34\n",
      "Test Episode 33, Reward: 36\n",
      "Test Episode 34, Reward: 37\n",
      "Test Episode 35, Reward: 36\n",
      "Test Episode 36, Reward: 35\n",
      "Test Episode 37, Reward: 36\n",
      "Test Episode 38, Reward: 36\n",
      "Test Episode 39, Reward: 37\n",
      "Test Episode 40, Reward: 35\n",
      "Test Episode 41, Reward: 36\n",
      "Test Episode 42, Reward: 36\n",
      "Test Episode 43, Reward: 34\n",
      "Test Episode 44, Reward: -99\n",
      "Test Episode 45, Reward: 38\n",
      "Test Episode 46, Reward: -99\n",
      "Test Episode 47, Reward: 35\n",
      "Test Episode 48, Reward: 38\n",
      "Test Episode 49, Reward: 34\n",
      "Test Episode 50, Reward: 34\n",
      "Test Episode 51, Reward: 37\n",
      "Test Episode 52, Reward: 37\n",
      "Test Episode 53, Reward: 38\n",
      "Test Episode 54, Reward: 37\n",
      "Test Episode 55, Reward: 37\n",
      "Test Episode 56, Reward: -99\n",
      "Test Episode 57, Reward: 39\n",
      "Test Episode 58, Reward: 34\n",
      "Test Episode 59, Reward: 38\n",
      "Test Episode 60, Reward: 34\n",
      "Test Episode 61, Reward: 34\n",
      "Test Episode 62, Reward: 37\n",
      "Test Episode 63, Reward: 38\n",
      "Test Episode 64, Reward: 35\n",
      "Test Episode 65, Reward: 34\n",
      "Test Episode 66, Reward: 36\n",
      "Test Episode 67, Reward: 37\n",
      "Test Episode 68, Reward: -99\n",
      "Test Episode 69, Reward: 34\n",
      "Test Episode 70, Reward: 36\n",
      "Test Episode 71, Reward: 33\n",
      "Test Episode 72, Reward: 37\n",
      "Test Episode 73, Reward: 35\n",
      "Test Episode 74, Reward: 36\n",
      "Test Episode 75, Reward: 37\n",
      "Test Episode 76, Reward: 34\n",
      "Test Episode 77, Reward: 35\n",
      "Test Episode 78, Reward: 38\n",
      "Test Episode 79, Reward: 36\n",
      "Test Episode 80, Reward: 38\n",
      "Test Episode 81, Reward: 37\n",
      "Test Episode 82, Reward: 40\n",
      "Test Episode 83, Reward: 36\n",
      "Test Episode 84, Reward: 36\n",
      "Test Episode 85, Reward: 37\n",
      "Test Episode 86, Reward: 35\n",
      "Test Episode 87, Reward: 36\n",
      "Test Episode 88, Reward: 38\n",
      "Test Episode 89, Reward: 35\n",
      "Test Episode 90, Reward: 37\n",
      "Test Episode 91, Reward: 36\n",
      "Test Episode 92, Reward: 39\n",
      "Test Episode 93, Reward: 36\n",
      "Test Episode 94, Reward: 33\n",
      "Test Episode 95, Reward: 37\n",
      "Test Episode 96, Reward: 37\n",
      "Test Episode 97, Reward: 33\n",
      "Test Episode 98, Reward: 36\n",
      "Test Episode 99, Reward: 34\n",
      "Test Episode 100, Reward: 36\n",
      "\n",
      "Average Reward over 100 Test Episodes: 27.94\n"
     ]
    }
   ],
   "source": [
    "avg_test_reward = test(num_test_episodes=100)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "id": "31340922",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<matplotlib.lines.Line2D at 0x7fcc449884f0>]"
      ]
     },
     "execution_count": 30,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAX8AAAD8CAYAAACfF6SlAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8qNh9FAAAACXBIWXMAAAsTAAALEwEAmpwYAABQaklEQVR4nO2dd3gc1dWH3zuzTb1YsuQmV9nGBRtjjDE9mBrAlECAUJJQQgKhpBFC8iWEkEAISeiEUBJ6L6YXY1rAGBts425ZbrJlWbJ623q/P2Z2tSutbGF7pZV03ufxY+3M7s7VaPfMmd/53XOV1hpBEAShf2H09AAEQRCE7keCvyAIQj9Egr8gCEI/RIK/IAhCP0SCvyAIQj9Egr8gCEI/xJHoAyilNgINQBAIaK2nK6VygWeAEcBG4GytdU2ixyIIgiBYdFfmf7TWeqrWerr9+NfAPK11MTDPfiwIgiB0Ez0l+8wB/mv//F/gtB4ahyAIQr9EJXqGr1JqA1ADaOBfWusHlFK1Wutse78CasKPOyMvL0+PGDEioWMVBEHoSyxevLhKa50fb1/CNX/gMK31VqXUQOBdpdTq6J1aa62UinsFUkpdBlwGUFRUxKJFixI/WkEQhD6CUmpTZ/sSLvtorbfa/+8AXgJmABVKqUH24AYBOzp57QNa6+la6+n5+XEvXoIgCMIekNDgr5RKU0plhH8GjgOWA3OBi+ynXQS8kshxCIIgCLEkWvYpAF6yZH0cwJNa67eUUl8AzyqlLgY2AWcneByCIAhCFAkN/lrrUmBKnO07gWMSeWxBEAShc2SGryAIQj9Egr8gCEI/RIK/IAhCP0SCvyAIcQkEQ7y7soL5q+M6sfsczb4AL35ZRiAY6umhdAsS/BNMXbOfP8xdQYsv2NND6dUsKN3J3e+v69ExPPhxKe+vrtjr95m/Zge3vb2aUGjXs+trmnz8/pXl1Lf69/qY35S3lpdz2K3zufTRRVz++GK8gY6f3/pWP499tpG/vLFqt79LT/C/kioe/Wxjl5//8Ccb+NmzS/nT66v2+JhaaxZtrOYPc1fwdVldp897btEW3l6xfY+Psy/ojhm+/ZpXl23jP59u5LiJBcwanbfH7xMKaX727BIOHZPHWdOH7fb5/mCI295eQ0Ornz+fPhnbbtsr0Vrzx1dXsrK8ntkTChhfmNntY2jxBbn1rdWkOE3e/8VR5KW7O33u4ws2sWJbPTfNmYjDbMuvQiHN3fNL+Pu7awEYnJ3C9w4e3un7vLViO//9bBODs1P40ZGj990vE4XWGm/AynTdDgOlFNvrWvnFc8sYlpvKFSPKWbniS77edADTRxdGXvfp+iou/s8iWvzWRWHO1CFMGNz2d1m8qZpb31zDfedPY4B9rrTW3fo5vP/D9SzeVMMFM4d36bjvrqzAaSr+8+lGxhZkcN7BRV06TosvyEUPL6SioZVWf5CKei8ASsHkoVlxX3P7O2tJc5scP7Ew7v7uQDL/3dDqD1Lb7Ot0/zsrtnPEX+fHzYwAPt9QDUCTd+8y/6e+2MzLS7bx4pdbO+xraPXT6A1EHlc1evneg5/zwEelPLVwC5+t3xn3PQPBEFWN3r0aV0V9K/H6Q+1s9OLfR7fPX22pZWV5PWAF1l0RCmm217V22F5a2cgBf3yHNdsbdnu87XWtHW79v9xcgz+oqW8NcHO7zLC+1R/JzrXW3P1+CU8t3Mxf3ozpZMJt76zh7++u5cr9mvhz/nt88OZzVO6M+ts0VUFN2++3rKwWgCc+39xpZt3Z+e8q33/kC8b/7i3G/+4tvn3nJ2ze2cxNr60kJVjPc4Me54K1V/AX50OMee4YWPNW5HVzl2zDaSru+940ABZvbuvIXlbTzGWPLmbhxmo+tT97G6uamPrHd/m8NP5nEaCywdup5BIMaU69+xNuaXdOO0NrzbKyOpp9QSobdv8Z317XytKyOq76VjFHjcvn/15Zzpbq5i4d
69Vl21i4sZpxBRnMGp3HLWdM5oCsJuoam+I+v67Fz/b6VtZXNrG1tqVLx0gEEvx3w9/fXcsZ937a6f7lW+vYXN1MeW3HgKO1ZoH9YW/07vmte2WDl1vtD/3K8voOX/Yrn/yKa59ZEnl88+urWLqllr+euT8FmW7+OS++XPLUF1s46rYPaPV/8wtTMKS57e3VHPzneTzyv40x+wLBEN+6/UMe+mRDp69fV9HQ5Q/+459tIt3t4MRJhbz05VYadiGDvLOygkNumcenJVUx299fvYOaZj8LN3QefMC62B9z+wdc+eRXMQF3QelOTEPxg0NH8NJXW/lf1Pv/+PHFXPTwQgC+3lrH9vpWxhdm8NAnG3hq4WYAVm6r56GP1nHX8E/4+aafcF7Dw/ybm8i/axT65sFwSxHcNhru2B/euxFCQZZuqSPFabK5upmP1lXGjDMU0tz+zhoO/vO83V4QO+Oz9Tv5cG0lZxwwhGtnj2VrbQsn3fkxH369njey/kr6qufg0Gv4fdrvaAyY8NR34YsHAVixrZ7JQ7M4YVIh+RluvtxkBf9mX4BLH13MtOASXnb9H1Wr/wfAx+sqqWvx87d31sS9WDV6Axx523yeXVQWd6yvLt3GsrI6nv5iM77A7pOKTTubqWuxPielVbFBuK7Zz0I7KQvz7ipLzjthYgG3HNjAJeoVFiz5erfHASshGVuQzr8uOJB/TN7MOct/xEveSzmp7I64zy/Z0Rj5+eO1lXGf0x1I8N8NVQ1eSquaqKjvGNwBau0PWLz9G6qaIllHY2ugw/6uoLXmptdW0uoP8YNDR1DX4u8QNJdvrWPltvrI41Xl9Rw2Jo+zDxrG5UeOZuGG6rjZ/+ryehq9AXbYt6n1rX4e+mQDTd5dj9UbCHLZo4u4Z/56slOd3PtBSUxNY3t9K3Ut/l1qnhf/dxF/em1lh+1fbKzmza/LI4+rm3y8tqycM6YN4UdHjmaofwOlz/0W1r0H3o5Z/IptdWgNv315eczd2IJS68u+LuqLF4+SHY00+YK8tWI7/3xvbWT756XVTBqcyXXHDOc/qXfifemn4G+h2Rdg4YZqvtpcy9IttbyzogLTUDx+ycEcMTafO178gJX3nsewf09gtesCTqm4FzX2eLh6Ga9MvJNb/efwmP9o3jUP50+B83kmcBR88ndC/zmFs6vu5pHBL/Oj1Pl8+sGbYAfNYEhz2WOLuev9EtJcJo98unGPsv875q1lYIabP58xmatnFzP3ykMZke3g0fS7yWsphfOehWNvRI07kZO8NxEqPgFe/zmhl37Cryt/zX0V56P+vh/PG9ezY+NyAJ78fDPp2xdyv/k3pholfHf1VbDpMxbbF4cvN1ax7IsPaS5bzmPvfxUJ0GsrGmj2BVlb0fFvGgxp7nx/HeluB7XNfj7sQsBcat81gXXXEabFF+SChz/n7H99xitL2u6i311ZwdE5OxjzwrEUvngGv3Y+zakfnwLz/wIB6/vhD4a474P1LCjdGTnfS7fUsqysjvNnDkctewaevQAat7PWPZmjmt6E6o4JUMkO63dMcZodLurdiQT/3eAPtf2R41HTbH14t8cJ/uGAA1DfxeAfClnBPhwAH1uwiblLt3HF0WM4dVIeudSzdsPGSCCob/Wzs8nHtroWvIEgWms2VzdTNCAVgHNnFJGf4eae9zveLpfVWBeRykZr7K8s2cZNr63kjHs/ZdPO+LesAPd9sJ55q3dw46kTeeCC6VQ1+njSznCj33d9ZfxAu72ulc3VzWyLI8/8/Z21/OTJL3lvZQVaa+77oARfMMT5M4czZaDJIyl3MGX9/fDEmXDHVAjESnLrKxtJcZqUVjVx3wfrASt4hDP+eMElmlW2vHTYmDzufL+Et5aX0+oPsmRLLYeMzMLzyqUcFVrAt5reIPTQCWx7925uM+7iZdfvGProTM5fcDLvpP0fec+fySPqRj5K+QWjK97hTf80Vo/9MZz9GHz3ccgZzqnfuZDDf3gz
C8f+nJu5BGPWlfwm9CPeGXkdwcq1nG58xEFVL3F96N/8pvwq6ub/E7DkoPdWVfCzY8fyxzmTKK1s6lTaC3P3++tiitWfl+5kQWk1lx85Go/ThNIPGD7vx7xq/oJpgSWoU+6E4tkAzByVS73fwZJD7oCJZ6CWPkkO9dQWHgrFxzIwVMk/mm+gZvVH6M/u5b+e2zCzh3HfuEfYHspGPzqH76/9Cc/m/otFniuY8sYcUh88lO99eDTLXrF+p5IK67NSXtfxbvC1ZdsorWzi5tMnkZvm4uUlHaXP9iwrq8PtMHCZBhvsz7LWml+9sIyvt9YxZmA6v3x+GUu21FLf6mfx+m38lTtRzdUw5x7uGvcY74emwYe3wIPHQNU6Fn69mtfefpPzHviU2X//kAc/LuWBj0tJdZmcObAc5v4URhwOVyzkmeE3EsCED2/tMLa1FY14nAYnTR7EJ+uqesxdJAXf3RD+w3y9tY7j4hRnwvWAcPYczecbdpKf4aa22Rejye+KZVvreOiTDTz0yQZOmzqYV5eVM3u/gfz0AAf891t86Smz2uKtnA3nPMXGKkuX1NoKuhkeB82+ICMGpAHgMeGR9Htxlq2D0FIw2q73ZTXNMWPfXteCoawL2Wn3/I8Pf3U0mR5nzPg2VDVx7/z1nDJlMBfNGgHAIaMGcP+H6/newUV4nCZb7eBfWtVEMKQxjdhi25e2PlwVR4vdXN2M1nD1019xxNh83ly+nTOmDWFsQQa8di2DQtu5OPBrDknZzCXNT0J1KQwcH3n9+h1NHDpmACkuB/fOX88ZBwylweunvjVApscRc8sdjzXbG3A7DB68aDpn3f8Zv315OX86bTK+YJALq/4BG95g3YH/x62fNXF/1f2M2f57MoxsqtOL+aShkKBWHJSrIRTEBIwpZ/JS5gWsac7mrG/vZ1UBbZRSzBqdF2MEWFZWy9+qD2XbYefyh1dX8tm1R9NYuYX1j17BcR/fBKMPZn2VVYg8O3stAxfcxNaUA3j8s4HMGhPfUKC15p756xlbkM63xhcAcPf8EvIz3FZR09cMz/0ADBM1ZDoc8SuYem7k9TNGDgDgs02NTDvrEV4e/juufXEV751yBAzMoHT4+eS/eDY5T5/CpcD2rKmkXvgkA0s0Zy/9Ha+O+x/+1QuZEFzDjsJZ/H7zGDxuB2fwHjPX/BW2n0jDhrW84rqJ13ecC0yPHNsfDHHnvHWMLUjnlP0Hs2hjDc8u2sLmnc0sfuJ3FGSnMeuCG2POK8DXZXVMHJxJfWuADZVW8H9y4WZeXbqN644fx/cKN7Pw+btxPfhr/qxO4WpVSn5LKXzveSg+lnGu7Vy21OStE37I+M+vg7uncyjwuhtqMsbyD/P7/Ol1632vm9xI2otXQuZgOPtRMJ04cgbzePA4Ll72DOrQa2I+o+t2NDJmYDpHjcvnhS/LWLa1jmlFObv8XCaCfpf5V9S37lIzbk8gnPnbEkarPxhTCKptji/7hPX+maMGkO52dFn2eXfldkxD8Z0Dh/Lykm2Mzk/jjm8XYDw2B8PXyL3ui3kj6xwoeQ/mXsm2sk1cYr7O8cZCNu9sZvNOa2xFA1KtK8Kbv2JSzTzGqc34Sj+OGV9YPqq0i74V9V4KMj3cdNokapr9kSAe/Zrfvvw1bqfB707eL7L9qmOKqWzw8urSbQCENv6Pu513cFToc7bF0fXD+nBlozdGrvAHQ5TXtXDWgUNJdTt4c/l2fn7sWP72nSnW77voYdSsK/nJpZfzoT4AgOCOtjuaYEizYWcTo/LTueGk/UDBPfNLWFBaTQqtPJj/DPf7fkPw7xNhw8fEY01FA8UF6XicJn85YzLVTT5+9fxSrnc8xeANL8CR1zH0+Gv4yDiIOyc+x5V5D3FZ/hPo773I1b4r+Jn/J1YA+eGb8MM3UafdxxnfmsXvTp7QJcfJcRMKWVvRyKvLysnPcFOYlULRyDFcF7ycWvdgePYihiy+lVtcD1L46nkYjRVcpZ/k
/HVXs2N7fL28viVAiz/I0rI6Kupb2V7XyiclVZGLNUuegJZq667kvKdjAj9AbpqLcQUZkfrV1xWteJwGI/PSARg9YTrnBf7AffpMTvL9BXXx25A1hCnDsqgii9/5f8BZvj+w5rwFDLnkSSYc/0N++tPreHLo/1FPGjx1Dhes+hFTjFJ+2HA/+Ns+M//+uJT1lU1cd8J4DENx2gGD8QZC/OWft3N69YPMKr0D3v5N5E44/DlYvq2O/YdmM2JAGhvtzP+t5duZkm9w+fbfkfnM6Rzt+Jq8FMUt3MVljtfRB/4Qio8F4JDRA3AYirmt+8OP/weH/4JHsy7nztQryTFb+WPtb1g17BaeG/0Wl5f+FJwpcN5zkJoLwIA0F/f4TwZXGjxyInz+AAStWFFS0UDxwAwOG5OHUvBRD+n+/S74n/fvBfx+7oouPz+c+S8rq43o79++8+NI0KqxM//2ss+mnc1U1HuZOSqXdI+jy5n/uysrmDEil7+dNYUnvn8AL8woIe2xk6C5Gi54kTUjL+BPrWfDt34Hy57h+LeO5LfOJ7jbeRfN6z9hox38h+emwse3wxcPsnr4eTRqD4Elz0SOs7PJR6vf+t3CdYmK+lYKMj2kuUyADm6d5Vvr+V/JTq6dPZaBGZ7I9pmjcklzGbSufhcePpGzvr6ME42F3OW8i6oV8wCruBi+aC7eXMMA6nAFGmPksG21LYQ0HDQylxcun8ULP57FT48pxjAUfHgb5IyAo3/LgcNzOGrWLEJaEaxoC/5ba1rwBUKMzk+jMMvDuQcN44Uvy3hlyVZOySplRuULOAgSCAThlSvA11HaWlXeELGSThqSxfdnjeQc/0v8yPEaHHQJHHU9KS6TGSNymVvi4+3yVGaOGsCEwZkcPDKX/YdmMSw3tUt/63gcO8HKzBdvqmHK0CyUUrgdJgMG5HFX3u/Bk8VB257kbGM+TL8YfraSqm/dzoFqLa3P/yQmCIYpr28Lpu+urGDu0q1oDadNHQLBAHx2Nww9CIpmdjquQ0YPYOGGaqoavazYVsf4wszIHZ3HaZI5ZCy3es8kZ9Q0CjKtz8aovHTS3Q7mra7AZRpMGpKJ22Fy+ZGjGZabStGwEVzj+zG6rozlFPMT31UUspPAgn8BsKW6mTvnreP4iQUcMy4f3vgV01b9jdm5O7jZ/DebnaN4NHQCLLgXXrgEGizffMmORpp9QfYfmsWo/DQ27mzGGwiyY9MqHvRdh1r7Nhz3J8xfrGHgr76E0+6Dqeejjrsp8vtmeJxMK8qxNPnMwQSP/i231hxN1bhz4Yov4KS/kYKfg7Y+iiqaCZd9CPljI6/PTXNTQybbTn8JCibCm7+Ep86locmSO8cMTCcnzcX4wky+3Fy7h5+WvaNfBf9gSLNpZzMfr6vqcoEsnPnXNvtZsa2eF7/cSn1rgPqWQGQ7dJR9VtgF2KnDskl3O2lol/kHbbdG9F3Exqom1lY0WgEg6OfQ979Dxrs/g7Q8uPBlGHIgEwdnsq2ulZppP4Wjf8sHOWdxqetWysnj8CW/pKp8M4aCopLH4f2bYP/vsuHA3/J2aDruta9FildlUVl9eOxW8HfjtL3p7YN/OIM6tJ28oEJBnnDfwgUl10LtJv6T+RO+m/ogm3UBEz78Md5NX/DD/3zBVU9/Ras/yNatW3jXcx0Pum6PsZpuqbbGNCwnlaIBqRw43L4V3rEKtiywgp3TCiwOTzplOg9d2Rb8wzWG0flWRnr5UaMxlGJZWR2H5dQC8EPfL/lw0s1QuwnmtX3ZwbKnVjV6GV+YEdl2XeZb/Mb5FGvzj4UTb4vIC0eMzWPjzmb8Qc3MUZYs8u+LpvPoD2ewNwzLTY0cf/+h2ZHtYwdm8GFdPvx0ESdkvMCVI96Ak/8OzhTyjriEu41zKar6EJa/0OE9w9ZXh6F4Z2UFL3+1jSnDshmRlwar5kLNRjj06g7SSTTnzxyOLxjigY9KWVlez8QoTz8Q+VvNmTIkss0wFJOG
ZKI1kcAfzcTBmXwcnMTiMz7irJZfsyLnW8wPTkF98g9oqeEPc1dgKsUfTp1oJTIL/4VacC8PNl9DjtnCypm38X++C6g9+Jew8hW4cxp8ejdLt1h3ltM9W5kVXIwvEGLeklLu4VaydC1c+ArMsrN1w4Cp58Fp94A7PWZ8R4zNY/nWeqoavazZ3kCTL2j9nk4PzLgUfvIZXPM1XPBSJOMPMyDdZZ37lDFw0atw0t+g5F18L18FaIoHWsfK8DjwdWITTzT9KvjvbPQSCGkqG7xsqOq8oBlNIKjJcFulkRtfXRGZ1FLZ2Io/GIpk9O0z/2r7jiA/w02Gx9HB6rlmewN3vV/CD/7zRUSGenelVZA7dkIBrH0LdqyAk/8Bl86HoZYOOnGwNWlkRXkDHPlL/mleRMvAA7gl8wbcgQbO/+q7vJRyE463r4PxJ8Oce8lJ9zA3eCimrw7WvQsQkXTcDiMi+2yvszL/cPD3BWIvkOELxpCclNiTVLOBqf4lPGacClct4eHAcQwqGs1V5g20Kg+uR47lD/o+yjZv4L4P1vMb47/kUs9MYxXNGxZG3mZLTZRkFc3i/4Dpsr6kNm6HQYkeglG1JrItHPxH2cF/UFYK3z3ImhA3yV2J9mTjdWXzaWC8lcV/fr99Ox6I/E0AxhVmWBn0B7fgnn8jetKZjL38qZh6yeHF1spyhoLpI6zAl+lxkp3qYm8J15b2j5ogVFyQzqadzTT7AmyqbmZ4YWywWZB/Nuuc4+GNX8KXj8Fn90DtFqAt+B8/sZBP1lWysryeOVMGg7/VKkjmjoZxJ+1yTGMGWpr7I//bQENrIPI5DHPy/oOZOSqXEyfH1sWm2BewyIU8ivB7PL8OgpgcOTafvwbOwfDWEbprOrNLbuavxSsZVPoCzL8ZJp8NVy+Bg3+MmnMPA0ZPAxRfjbwMrvgcRh4B79zAqA+u5Cr36wx7/iSOWnwFv3f8l9x51zJSldNy2iMw8vBd/wFswn+HJxZsjsxjiNHmlYLsIjDMDq8dkGZ9DqqbfNbzZlwKR17HgHXP8Yn7ao6ZOwOeOIvc0E56anJ0vwr+0QE62omzKwKhEPsNysTlMPhiYw0pTusPXdngo7bZz9HGV7zn/hXe+sqYu4naJiv4Z6e4yHB3lH12NlkBt2RHI1c/vYT1lY28ubyc8YUZlmyw+D+QMRgOuDAmI5swyMq4LEujZkNVEyPyUtEFk7je81s+d8wgzaFh6vfgOw+D6SAn1cUnoUl43QOs963dTFm1FSgnD8liR0MrLb4g9a0BCjI9pPqquM7xFAFf7AVta20z2alO0t3tfAJ1VpB5tWUK1V5LvhmWk0LqwJFcm3svnxeey+nmx3zo+TnDPvo5p5mfsm2/i2nQKeQuezDyNpurm3GaisLMNkkJfwssfQr2O8W6A7JxOw3W6SGYNeshZF2Q11c2kZPqJDetLQBfdUwx584ookhvReUVM6Yg03L8zP6DFQTe/CWh+2bBkqdYu9XSXscPTIPXfw4f/AWmnIc6499gxha+xxdmMDDDzaQhWWS0K4rvLefNKOL8mUWROwqwgm8wpPlwTSX+oI7c3YQZOTCTG0I/ss7X3CstHfzVqwEor2tFKfjewUWEtHXBOnnKICugVq6GE26JG8Dac9UxYyJ3wu0z/ynDsnn6skM6nIvw3Uu8guaw3BQy3A5et51tRxTns0oP53+HPEBtwSGcYn7Gt9ffaEl0A/eDU/5pSX8n3gL7nx05B+srG2HAaGrn/Jensi7hgMaP+Jl6AjXuRJoOuJQfON5mZsvHPOy5kKwJXV9GZGxBBsdOKOChT0r5cM0O8jPcDG2f+HRCbiT4W9/zFl8Q72G/Yv6Qy1mqi1ET5sCGj/lr5U8Y17qsw+sDwVCnE0f3Ff3K7VNuZ0BKWU6crkzf9gc1mSkO9huUydIttVw4azj/+rCUykYveekuphnrGKPKuJiXqWs5LZL5VTf7SHc7cDkM0j0O1lfGBv+w3HHxYSN5
6JMNvG83z7r6mGJrlmfJPDjyOjBj/0Q5aS6GZKfwxcYazppuuVhG5qWT5m7lkVXFvO8ez0mTB/Hn0yZHvcZJEJN1g09lUskj8M/JXIriEg/UVRdwJn+LFKwLMj0MWfEPfux4lUWV58F+bbfxZTUt8T/8doa5VefxSUkVgZBmSE4KoxrSmL+mmT+kn8t+hbO5Rj/Bd3bMo1QVkX3iH3n663Iu3vo21JVB1lC2VDczODsFs7kSPrgFdqy0bs1b6+DA78cc0uMwrcw/6LVkiwGjWV/ZGMn6w+RnuPnLGZPh9vUw6iiKA+mWT9ydARfOpebLl6iZ+1tGvXw5ZxvpTPUMJf/pW6F8KRx6DRzz+5iMP4xSin+eM5VU177/ChVmefhT1N8PrEAERPrBjMpPi9k/Oj+dZxcVUP/LJWSqFkv+ef8m2PQpFfXp5KW7OXjUAPLS3UwYnMnA6i/h07vgwB/A2OO6NK4xAzM4ef/BvL1iu3V31AWOnVDATXMmMtuuZUSjlGK/wZks3FCNy2Fw8CjrbmaZexpb9pvJ71adxceXjmRQYBsMm2EVT6PITXORk+pkve3m+fWLy5lXdQwDD5vFMUM1TDqTVOBni1MpCm1h55RLuzTmaK4+ppiTV1bw3qodnDCxsMvtKQakWS0tdtpJ4Gn3/I+KhlbcjmPJHXAy355zOMy6ksD9J3FW4xPAj2Jef9vba/hycw3PXT7rG4+5q/SvzN8O/jNHDoiZqLErAqEQDkNxyKgBDMxw833b3ljV4KWm2U8elgvoIvNtdm5dH3ldbbOf7FQnaM1E/woa2zmMqhqsD8XVs4t56tKZ3HHOVO45bxqXHTEKvnzUukJNuyDumE6eMoj5a3ZEvN0j81IZnpuGLxiittlvFXujyLEvSPMG/xi+/wac/A9eyzqPue5TyfVv51st70QujIPSFDnrngfA1RA7c7SspoWh2XGKmXVlaGVQQQ4f2BexoTmpjB6YTlWjl9XbGxi731QKL3uOiz1/45n97iQ7PY3HQieADsFb10PNJloqN3Kt+SzceQB8+V8roy9fBkOmW/7pKNxOg3WhodaDSkv6Ka1sZHS7oAiAtxEaymHAGMYWpFPZ4LUsukrxmm8a3/L+lXN9N/B2cDpOl8uSfL79dzj2xriBP8ys0XlMHZbd6f59yci8NAwF81ZZ53d0XuxFLnzRW9/khtyRMPMnkF4I826ivLaFwkwPpqF4+rKZ3D5nFLx0OeQMh+P+9I3G8efTJ/HC5bMsl1AXcDkMLjhkRERKbE/4DmJUXhoZHidZKU7Ka1sty63LTcHIyTDuhA6aevTvvb6yEW8gyIdrKzl3RhHHnHgmTP4OKIVSilUDjuWfge9w8OgBcd9jV0waksXs/QYC8aWrzkhxmaQ4TXY2WjbvNRUNZKU42dno44CibOtJ+ePY5BpDeqjj3JPyutbIdzJR9KvMf3t9Kw5DcdL+g/jdy8vZtLPZKnrtgkBQ4zAUPz9uLD85ejTpLgcOQ1HZaAWQfFVLk3sgjtYa0j79KxQ/AlguoNw0Fyx/gcvWX8Fnwd9grV9vUdXoxeUwyHA7OCT6QxkKwlePQ/FxkDU07pi+N2M4D3xUyt/esYLeiAFpMcW04e00c6dpkOFxUNMSgBGHwohDufvj0YwYksas6k1cVP0m75dbEsHoynmY3loA3PVtwV9rTVlNM0eNze84oLotkDEYV9AdmX05NCclZhr+EWPzcDtM/nnN93E5DAxD4U0fwgeZ5/Kt1U/Bqld5AIVCw/hvw+wbIW9Mp38Xt8OkRA+2HlSupq7oWKoafR3kEAB2llj/5xVTbFgZ69qKRmaMzOWdlRWMGJCGmXMk15ZM5AfTRzDxlImdHren8DhNhg9IY0NVE3npbrJSY+WV8EVvfWUTBxTlgCsVjvgFvPELDvc8xfr8Y0BrxgxMh7nXW3+zH7zZoci5OzI8zk6ble0JYd2/2L6zGZTlobyuhYbWAGMLMyyn1y4YnZ/G+6t3
sHhjDS3+IEcUd/x8jsxLZVV5PQeP/ObBH+DaY8eyfGs9R42L89nfBblpLqqbfJF5BtefOJ5ZY/JwO9ouhC1GOoN0x1nAQa0T3im132X+BZkeDrG11AW7aDIVJhDSOE0Dp2mQ6XFiGIq8dDdVDV5qm/3kqTp8ueN4JHg8BRtegior0NQ0+y0J6Gsriz5CL44JhlWNPvLSXB1vIzd/Bo3bYco5nY6paEAqR47NZ0NVE6ahGJabGhPwi3I7XtBy01wRW6oVyFsYmpPK1vE/oMioRK9+A4C8tU/hzxpBmc4jpbEt+Ffb1tAOxV6AujJU1lDGDEyP3OYOyU6JSBN56W72s+2TGR5n5EKVl+7m8fQfwNXL8B72K+4KnMaTB78K5zyxy8AP4HEaNJKKN6UAKtewviq22BtDOPgPGMOUYdm4HQbPLdpCfaufBaU7OX5iIfecN41jJxRw0uRBuzxuTxJ2iLSXfMByCTlNFTuretqFUDiZS1of4S9bzof7ZsFbv7HuLA+9epfWzu4inPmPHRgu0nvYVtvKmoqGLnVvHZ2fTlWjj1eXleM0VWwiZTNn6hAuPGQ4+Rmdd2Ld9RizWPCbYyIXqK4yIN3FziYfpVVtLrTMqM8/QKuRRpruaD4JhTTBvWjY1xX6VfAvr2uhMMvD6Pw08tJdfLGxZrevCQRDHWao5mW4qGr0UtPsI0/Vk5oziAcD3yakHPD5fYDVi32wu9WanAQcZSzp0HkzL96HcdVrYLphzLG7HNcFM61WwMNyUnCaBoOyUnCa1jjbZ/5gST/VdmCuafbT7AsyNCeF0NhvszmUz+HbHuYXrhdxbPmU1snnsyFUSFrjlsjrw06foTlxZJ/azZA9zMoqsYK6x2lSlJuKyzQ4vDgvbgaXn+G25hhkD6N04pX8M/Adsod0rXVx+AvUkDkGqtZEsqt4gdEK/gpyR5Gb5uK8g4t48autPPbZJvxBzbETCshKdfLvC6dz0Ij48kIyUFxgT6qKc4FzmgZFuamU2sG/ssGLDyctP5jPcd5b+Xj0L6yi9YJ7oGASHHV9t469M8YVZHDt7LGcPs2qLQ3KTmHdjgZqm/0xltvOCF/sX/qqjGlFOaS1NyNguZz+OGfSvh14FxiQ5qK6ycv6HY2YhuroYgNazTRSdXOH+RnBkCbRXR/6VfCvqPdSmOVBKcX4TB919fW7fU0gpHGYsYErP93dJvtQhyu7kGBqHktyjoUlT0JzNTXNPg7xfgYhPxuHncZIo4LW7W2NwqoaWjnaWAo72+oEaA2rX4Mxx+z2dvyocQMpyk2NFN5MQzEsJ5W8dHfcL0BOqjOS+W+NsmzmZ6XyQPBkxoQ2cKXxPGQMxj/5XDbrAtKbO/br6VDwDQWhfhtkDY0UJcPPcZoGD31/Or88flzc3yEv3R0pfIfnOxR1cYJU+Na5Pn0UVK6lobnF/j3jWC2r1kH2MKt4DFx+5GhMQ3H7O2vIS3dZMkkvIHx+49Y1sC4K6yub2NHQylG3zefu+SVsb/CxVg+jcuIP4EcfwY8/tXzujj3Lgvc1hqG4enZxJKkYnOXBH7QCYVeCf/hctPpDHBFPkuxBctPcVDf6WF/ZxLCclA7zHABaHemYhDpMOAxpTUgy/32D1pryuhZm+z+CB47m8erz+H7lbbt9XSCocbYr+lmyj4+Wxhrcyo9KH0hBpoe5KaeDv5ngokdoaA0wtX4e5Ixk06QrAVAl70TeY3jDl1y74zdw1zS47zAoWwTlSywtdvzJux2XaSie/dEh/OWM/SPbphZltxWT2pGT5qKmySo6h3v6DM1JIT/DzePB2UxvvY/zC1+Bn6/CkVXARl2A218HLTUxr+kg+zRWQMgPWUMjskT0BeLw4nwGZ8e3x+VnWME/3IwOrAleXSFccCzPnQH+Jg5Z/nsUoYgVN4ad62BAceRhQaaH82ZYtsdjxhd0uLNLVqYOy8ZlGkzrpPA4emA6m3ZavZeafEHeW1kRaZQWsc8WTIyxzCYb
g7LaPitdkX3CchcQV+/vScKyz/rKxvi1KKDVsLd7YxNRK/OX4L9PqG8J4PHXcerGP4GviY3ucRzgXdihK2R7AqEQZvvM3w5awXq7S2KaFfy/8g6GUUehFtzHNY7nGVb7BUw6E8eAkZSEBpOy8X3AuhCd4HuHVjMDjv+zZWV84izLeqdMGHdil36nwixPjKf9tu9MiSyu0Z7cKNknWsJJdTlIdzupIovcLKv45jINNmnbmme3pN1a20Kmx9Gh0Rt1dj+ZrCKKB1qZWty6QBzy0t34g5q6Fj9lNS2kux2WQ6oLhDP/DQOOhKN/y7iK17nV8W/ctSWxt9BaW3dXA2JrCD8+ajTjCzM4+6D4RfVkZPiANJbfeHynTcBG5aXhD2oe/WwjaS6TleX1rNhqBZXCLE/c1yQbg7KtcRZmejoUtePhNA2GD0hjQJqrw9yDniY3zYU3EKJkRyOjB8YP/l7T3t4aG/xDGsn895b67RvYWb2T8voW5pifYmo/fOch5uefTxotsOXzXb4+ENI422v+6W4CIU1ztb0GZ3o+BZluy0p69A2EUFzjeBGUAfufTbrbwfzQVDIrFoCvifqaSo5XCykddBIccgVc9Io1yWb5CzB8Vqe2tt1hGipm2cBoctJctPiDtPqDlFY1kZ1q2eoABtq1h3CAcMYE/1KASIG4A7W2NJQ1lKE5KVwwczgnTx7cpfHm2VPgwzOuh+akdNlH7bYzfG8gBEf8gv8NuoizHR9i3DsDbh0O9xwMj86xJmr5GiGvOOb1BZke3rrmCA4cnrwafzxcjs6/stEB5s9nWPMEnlts1W16S/AfbGf+4wd1vbh68WEjuebYsbt1BnU34cQsENKM6sRV6HOEg3/s2hchcfvsHU21lej7DmXLU9dSXtfK2eYHNA2YDIWTKc89GD9mpCBb0+SLZMbRBIK6Q0ANuwb8dXbwTxtIYaaHqkYvgcHT+fKszylufZTPzloM+ePI8DiYF5qGEfLDvD/i++pp3MrPjjFnWa/PHQXnPQOpA2DaRQk5F+EPYk2zj5IdDYwd2PblCheewxcB01CUYXmbw5l/WU1z/Alekcx/KIahuOm0SV22AobP44aqJhaU7mTGyK4H4nDm3+oPglK8VXAZp6o74dS7YNKZVrBvqmrrp54fv+7Qlxidn46hLHfLKfsPJjfNxdqKRjI9joRMRksEhVkeHIaKzGTvCufOKIoYIJKJAVF35bvN/OPJPgnO/HvHJ2IPScvO542sb3NS5bN8/cVgJhqbqJn8F9IAZ1oWi0NjObjkPdSxN/KL55bSGgjyxCWx9jd/0JrkFU148e5sbbuF0gdSkGV1pNzRYLmA/DjIyrJuz9M9DhaE9mPV8PPZ7/P7yXWksDw0AufQA9redMiB8It1XZpmvyeEC6E7G32srWjk2/u3WRrDQb8gqq1CwEylwZlPRs2GiDX0sDGdePw9WeD55rfc+fZ5fPzzzXgDIeZMHbKbV7QRDv7hxcdb/UEqXUNh2jGWxTFM9QbY/jUMP+wbj6+3kZXi5LGLD2bSkCwMQ3HYmDzmLt3Wa7J+sGo5T102MyY56a1ES7Kdaf7eTjL/YEgTErfP3uE/8jd8HRrB5JL78GonaQda/vk0t4MPglNQFcuhvpxtda0s3VLXYdZvMJ7bxw6WeaqOEAakDogsnrJxZ1NkgZcc+4+f4XYCig9HXgvTLsQMtPB08OjIRSRCggI/WG4fgHU7Gqhr8Ud81dG/T3SQcJkG1e4hUF1KrW0N7czjT9bu22TEI3zcj9ZWUpSbyrROitXxsFodG5H+Jy3+YPxib+5ImHDqLmfq9iUOHZMXkfMOL7YKu4VZXavBJAsHjcjtkt6f7ESSxHb9pqLxOeyLnLe95i8+/71m9qRhXKevokW7mGccgivDkhYy3A4+CE21nrR+HvUtfhq9gZhWx1prAiGN2S5whDPWPOpodeaAYUZmCm+oaqLadtWEA67HaWAaikZvEE7+J28d+ABPBo+J
aN7dQfjDF164OnrCSjgIF0T16Hc6DKpcVvDv1OYJVl+fTmYi746sFGfEqTFn6uAu6/1h3A4Dr78t8+9qy4H+Qtj6OCiz92T+fYnwd66zrB+iNf/ud/v0adkHrAy/eOI0vrXkdgYPHkK4cW26x8FqPYxAWiGO13/Bk4EsPnOMZ/2mUQzLtVapCncwbF/wzUxx4DIN8lU9Xs8AUrG+YG6HwcaqJgylcDmMSCaqlCLd7bBaNxsmK9xTQZXsk/a/XSV8F/K53c20OCrzP2nSIGqb/THB3WkqKp2DobqC+oZa6z3ijbeuzGoZsQcoZc2WLq9rZc7UrhWJo3E7zdjM3yXBP5qCTA+/PH4cB3+DWoqw70i1+/t0Ni8DIGSmEMDA0aHga/2vtf7GSVFX6fPBH6wVi15Zso1J2W2FyHRbitly+G0Mr/6Y5Z8t4UzzY/xvnAjpD0Lx7MiVt33B1wpaLvJa6gimWIVRw1CMGJDGhqpmctOc5KQ6Y/5o6W4HDfYM36pGL7lp7m71l2fbUkBpVRNZKc6Yqe4j8tL4zUn7xTzfaRpUOKyA7LR75nucUefB22itOeCt2+PMH6w2EHnpbsbsgcbrcUZn/qHY8QkAXHH0rttkCIlDKcWd5x4Qk2i1xzStNiXZcWQfiC877yv6RfA/rDiPwVkexha0/RHCPenL82eRu/+JXPHRO4xTm3nMdRep7/0eimdHVrJqX/AFSyrJb61Fp7VNGx+Rl0rJjkaUSu+QJWd42tbxrWzwdavkA9YFLCvFSV2Ln+KB6bvNJlymwcqUaeBMY8jaR4FzyahdCU+eD81RPZHS8q1FNPaQf3x36h5fBN0Ok9Zw5u8LRmQ2QUgWjo3TyjoapaCBNLLjyD5gNXhLVJDuseCvlDoBuAMwgQe11rck6lhO0+Dta4+I0YQzPNav3tgaoN5ut7xGF/E5kzml3lpdKhAMZ/4dg1Nemou8yjqaMgdGto3IS2P+6koyU5wdgn961IIuO5u8HYu93UBumssK/gWdZyJhnKZBnU6D6T9g8Gf3MkIdxeCPbrUmoR15HRgOa05C0SF7Vajem/VuRfMXejumUjTolLhWTyChjp8eCf5KKRO4BzgWKAO+UErN1VqvTNQx268wFO5/0+gNUNdiBf9xBRms35kGjmoI+CKaf7yJU0PTgniUH19m27J1o/Ksnvprtjd0aP+a7nFE5hFUNXoZXrTnQW9PCc+eLe6CxOJ0KOvO55ArCX3+Lx5z3oJ7RyWc+ZDVKz0J8DjNiNWzU7ePICQxpqFoIDXODN+2zD9R9JRIOgMo0VqXaq19wNPAnO4cQFj2afIGqLeD/4yRuVTobOsJTTsIhDqXfUZ4rEZMnpw2v3zY7tnsC3Yo5qa722SfqgZfz2T+9pi6mvn7giHIHETJ4DkMMyrxjTjKmkCVJLgdhjXJC8n8hd6JYSgadGqcGb7h//te8B8CbIl6XGZv6zbCsk+Dt032OWhkLpXh4N9Y0Sb7xAn+p4+1smhXZpumNzJqCnd7/TnDYxV8m7wBWvxBBvRA8A87frqU+ZtGpOaxuOgS5gYPwXfC7THrCfc0ls8/KvMXt4/QyzAU1MeRfUIR2afvBf8uoZS6TCm1SCm1qLKycp++t9th4DCUpfm3WBn5lKFZ1Bi2La5xR5vVM47skx2qtX5Ib9P88zPcpNkBqGPB10lja4CdjZb0090FX4CxBekU5aZSkLn7C4/bYURa69Y487nK/1NceaMSPcRvhMe2eoZC2nb7SPAXehemUtTpjrJPMMrtkyh6KvhvBYZFPR5qb4tBa/2A1nq61np6fv6+bdeqlCLdYxVhw5l/bpqLtAG237xhOwE78+3gRtEaKu3e/GltwV8pFZnsFa/g2+IP8r/1VUAnK04lmEsPH8W8nx/ZJd9wdObvtaUVZ4IsZ3uKJfuEItm/aP5Cb8MwFPWkor31MdXdaLdPwo6dsHfeNV8AxUqpkUopF3AOMLe7B5HmsnT4uhY/hrIep4Q1
/MYdkcw3JuiteQv+uT/M/5PViC01dtm4SPBPi5V9wjWGBz4qZWxB+jdqZbCvUEp1upB2e5ymiiw76Q2EcDuMhE022VPcDivzb7EvTini8xd6GZbbJ9Vau9rXtgRnqBvcPj3ybdFaB4ArgbeBVcCzWusV3T2OjHDm3+Inw16f13S6qFMZ0Li9bZJXuL1DdSm8cIm1ytace+HKRWDGGqZG2kXfDgVfu8awoaqJC2YOT7pA2p6YzN8O/smGx2lp/uGir8g+Qm/DCLt9IEb3D3aD26fHfP5a6zeAN3rq+NDmva9vDZCZYp0Kl2mwkxyyGnfgty+7pqmsRV+ev9jq0X/eM5Adv5nZpCGZmIaK9CUPk2Fn/qkuk9MO6Nba9h7hMts0f28ghCvOEnQ9jdtp0uqPyvyl4Cv0Moywzx8sx489Wz7i9umDmn9SkB6V+Yc7ITpNgyqybc0/3NvHsBa+3vYlnHpnp4EfrMWiP/rV0R3a6IYz/9MPGNJhzkEyEpv5B5Mz87fdPi0+yfyF3olpQD22SzCq6BuRffqg5p8UhL33dS3+yPKELodBJdm228f2+ZsKVr8BQ6bDxNN2+Z5KKYbEWbN2fGEmBw7P4ZLDk8sx0xmRSV6ALxDCnYR6uttpojWRgr0UfIXeRkzmH0/2kcw/MYSbrdW3tgV/p2lYE70aKwjYBU9XsMXK+kcevsfHys9w88KPZ8XMBUhmnKYRU/B1dbFQ3J2E70bqmq3gL5m/0NswVJTmH5X5B7sh8+8Xjd06I93toMkbwFQqIvu4HAY7QlmAF7y1AGTuXAKhQL9YDSqMKzzDF7vgm4SBNTym2hbJ/IXeiRme4QtWh1ybsOwT7Gu9fZKFdI+DZl+QYEjHFHzLgplggNFkTSzL3L7AamhWdHBPDrdbcUYVfH1JqvmHx1Rjr5yW4kq+MQrCrgj7/IGYFg9h2Uc0/wQR9t57A6GOsg/gbN5hPW/7Ahg8Fdy9f13RruI0jchqQslq9RTZR+jtmErhxYk2XbEFXzvmi+afIML9fYDImqEuh8EOO/ibzTvw4CVlxxIY0X8kH7AKvmAtYO9L0uAfDvZ1IvsIvRSreYAi5MqIKfh2h9unX8s+4bbOQFTmryLN3VwtlRxg1KFC/n6l9wORAq8/GLIz/+QLrO1lH8n8hd6GYbeOCbkyMVu71+3Tr4N/enTwtzV/t8Owem2YblytlRxh7EQrA1U0s6eG2SM4I8Ff4w0EcSVh5h++INWK7CP0Ukx7pn/I3Zb5a60JJ/yS+SeIaNknWvMHRTA1n4GVC/ihWYJ31PF4PJk9NMqewRmV+Sev7GNr/i1+XA6jW9dEFoR9gRmV+YcLvtHZfiLdPsn3je5GrEXcLaJn+AIE0wrIbVhNJdk0n/CPHhlfTxJuZucLhOz2Dsn3UYnO/EXvF3oj4RZfQWcGeBuAtmKv9bMUfBNCenTmH+XzB/ClFhJUTn7suwYzLa9HxteThM+DPxjC60/OzD8867i2xRe5CxCE3kRb5p8eFfzbAn4ie/v0a9kn3dWZ7APlM65jRfZZfP2pK+4C7n2daM3fF0zOgm9Y42/1hyjMTL7xCcLuCGv+AWd6RPOPkX0k808MaW4rYLhMI5I5hjPc5rThbMuYDNCvg3+L35oEl5yyT9uYpNgr9EbCbp+I7KN1TMAXt0+CcJgGKU6TNLcZ6a8fDnq+QChqDd/kC3yJJqz5hxedT0rZJ2pM0s5Z6I0Y0Zm/DoG/mVCorRYpmn8CSfc4IpIPtAU9fzBEIBRCqTjLOPYDwj7/Rm/yBv/obF8KvkJvJNwvMeC0l3X1Nojbp7vIcDsixV6IKvgGQ/iD2url3w8Jn4dw8E/GxVwchiJ8XRbZR+iNRDJ/h93t19sgbp/uIi/dTX6GO/I4WvYJhkL9MuuHtvPQlMSZv1IqEvQl8xd6I+H4EnCEM/96cft0F7efPSWmoOuOsjj6g7pfFnuhLfhHZJ8ktVK6HQbNvqBk/kKvJJz5+6My/2Ba
97h9+n3wH5abGvM4puAbCkUe9zdcdmO3Brvgm4yLuUB4opdf2jkLvZK24G93DO6g+Yvs021ET24KhrTIPpHMPzkz67BF15OENQlB2B3h+OJ3tq3jGyP7iObffUQy/6C2C779O/g32OvjJqPmD20tHsTqKfRGwjfUPrOTgq+4fboPV4zPP4QjSeWORNNe80/GSV7QVosQzV/ojYTnF/miNX+Z4dszRMs+gZDG0U8z/97g84c2uUfcPkJvJNzeIYgDHCnd6vZJzm90DxLdzTLQn90+dsG3LfgnZ3ANZ/4i+wi9kUhjN421TKxk/j2HwzQwVNsM3/7Y2gGiZJ8kbu8AbeOSrp5CbyTs9gmGdNzgL5l/N+M0DXxh2aefZv5huavRGwSSOPjLJC+hF9OW+bcF/1A3NXZLzm90D+MyjTbZp59q/kopXKZBozfs9knO4NqW+Sfn+ARhV4TDS3TmH9veIYHHTtxb915cDsOe4dt/3T5g1T9a/ZbXLGndPlLwFXoxRkzmn9lR9hHNv3txhjP/fuz2AXBGBfxkDf4esXoKvZjIAu4R2adOZJ+exMr8ta35999TFC76Ok2VtDOdZZKX0JsJf6+CIcTtkww4TWUVfIOhfjvDF9q8/sna1wfaNH+RfYTeSHgB91BIg8eSfUJRTfzF7dPNuBxmpOCbrBlvdxCe85CsfX2gTe4R2UfojXRw+4QC6EBrZH+vLPgqpf6glNqqlFpi/zspat/1SqkSpdQapdTxiRrDnuIyVcTn31+7ekKb7JOsNk+A/QZlMK4gg6yoBXkEobcQmeEbDv6A8jVG9vfmNXz/obX+W/QGpdQE4BxgIjAYeE8pNVZrHUzwWLpMTMG3n/r8oS34J2uxF+CocQM5atzAnh6GIOwREbdPSENKprXN1xDZ39fcPnOAp7XWXq31BqAEmNED4+iUsNWz38s+juTP/AWhN9Nhhi+gvG3Bvze7fa5USi1TSj2slMqxtw0BtkQ9p8zeljRYM3y1Jfv00/YOAO5ekPkLQm+mzepJJPgb/qjgn6yZv1LqPaXU8jj/5gD3AaOBqUA5cPsevP9lSqlFSqlFlZWVezPUb4TLYfT7xm7Q1twtWWf3CkJvJ5xbhqI0fyNK80/aNXy11rO78jyl1L+B1+yHW4FhUbuH2tvivf8DwAMA06dPT2DdOxaXGTXDtz/LPr2g4CsIvZk2n39b8Df9jYAllPRWt8+gqIenA8vtn+cC5yil3EqpkUAxsDBR49gTwpl/UCZ5ASL7CEKiMGLcPh0Lvr3V7fNXpdRUQAMbgR8BaK1XKKWeBVYCAeCKZHL6gOVv9wdD+Pu528clmb8gJJRw8NdRmr/D3z1un4QFf631BbvYdzNwc6KOvbc4zbDbp7/LPqL5C0IiiZF9HG4w3bbsQ9v2BCEpXRxcDgOvP0RI028XcwGRfQQh0cS0dAZwZ8QE/77m8096XKZBs99Sopz9WPYRn78gJBalFEpFBXl3Bg7J/HsOl8OInHSzH2f+bZq/yD6CkChMpWIyf0egCbBW0+uVbp/eTHQ/n36d+du/u8g+gpA4jOgg787E5aujkJ1kml7p6tndRAf//l3wFdlHEBKNqVSb7OPJYmDtVyzw/JRHzZsSOsM30Y3deiXRma4pPn/czv57DgQh0RgqSts/8lcsCowkuO49xhjlvdbn32txRUk9/XoxF0fyL+YiCL0dw4jS/AdPZcmITAJrNjLFKBW3T3cTnfn37xm+yb+YiyD0dkxDodut29ukPXjwQTBx81/7b2TbBaL5W4jmLwiJx1QqRtsPaWgiBQBnsClhx5VvdRxiM38J/hL8BSFxKKWIWraXkNY04gHALcG/e4nN/PvvKZLePoKQeEwjtnVzMKRp1JL59wgukX0A6ecvCN1BjNUTW/O3ZR9XsDlhx5XgHweRfSykt48gJB7DaK/5a5rCsk9Ign+3EjvDt/+eItH8BSHxGErFyD4hrWlWqQC4JfPvXmImefVj2WdkXhoZ
HgdDclJ6eiiC0GcxDUUwys4fDEGLLfskMvOXSV5xiO7n0597+4wtyODrPxzf08MQhD6NoWJbN4e0psWwgr9HZJ/uxSVuH0EQugnTUB3cPq1h2Sckbp9uRWQfQRC6CyO6pTNW8A8aTnw4E5r5i+wTByn4CoLQXRjtrJ4hrTENhZdUUkItCTuuBP84iNVTEITuwmy3aEtIawylaFUpeHTigr+ktXGQ3j6CIHQXMV09sdw+hlK0GqmkSMG3e3FLV09BELoJs73bJ6QxDfAaaXi0BP9uJUbzl8xfEIQE0qHgqzWmUniNVFJE9uleTEMRjvni9hEEIZFYa/jGZv6GofCaqaRK5t/9hIu+IvsIgpBITKUIRbV0DtpuH5+RSiqS+Xc7YemnP8/wFQQh8ZgdGrvZBV8zlVSRfbqfcNFXZB9BEBKJil7AHVv2UeA300illZjbgn2IBP9OiGT+0t5BEIQEYhod+/mbhsJnWi0e8DUm5LgS2TrBaRoYyirGCIIgJIoOi7nYk7x8jjRrgwT/7sXlMKSpmyAICcea5NX2OGRn/n7TDv5eCf7ditM0pLWDIAgJx1B0WMzFCv627ONtSMxxE/KufQAr85fgLwhCYmnv9glqUErhj8g+SRj8lVJnKaVWKKVCSqnp7fZdr5QqUUqtUUodH7X9BHtbiVLq13tz/ETiMpV4/AVBSDgdunqGNKaiLfgnqeyzHDgD+Ch6o1JqAnAOMBE4AbhXKWUqpUzgHuBEYAJwrv3cpEMyf0EQuoN4i7mYhiKY4ILvXrV01lqvAusWpR1zgKe11l5gg1KqBJhh7yvRWpfar3vafu7KvRlHInCahvTyFwQh4RiqvexjuX3aMv8klH12wRBgS9TjMntbZ9uTDqdpyAQvQRASjtGuvUMokvmnWxsSFPx3m/krpd4DCuPsukFr/cq+H1LMsS8DLgMoKipK5KE6kJvqIjvV2a3HFASh/2EaHRdwN5QiZLoJaANHT8k+WuvZe/C+W4FhUY+H2tvYxfZ4x34AeABg+vTpurPnJYLrTxpPiz/YnYcUBKEfYrZfzEVb3n/DNGjCQ2ZrPYnQIBIl+8wFzlFKuZVSI4FiYCHwBVCslBqplHJhFYXnJmgMe0V2qotBWSk9PQxBEPo4qhO3j6kUjaSgE+T22auCr1LqdOAuIB94XSm1RGt9vNZ6hVLqWaxCbgC4QmsdtF9zJfA2YAIPa61X7NVvIAiC0Isx2y/mYmv+hqFo0h50T2n+u0Jr/RLwUif7bgZujrP9DeCNvTmuIAhCX6GzBdxNw8r8pbePIAhCH8Ry+3TM/E2laNQpvc7qKQiCIHQBQ9FuMRcr81cKmvAk7QxfQRAEYS9o7/YJ2W4f01A0kYIS2UcQBKHvYRiKqMTfkn2UdVH4OjQS/5AZnb94b46bkHcVBEEQuoTZvr1DSFs+f6X4b/B46k66PyHHleAvCILQgxjt1/DVGtN2+1iPE3TcxLytIAiC0BXCS8WGHT/hxVzCrcWi7wr26XET8q6CIAhClzDtrsjhIB8MWbN+DRV7UdjXSPAXBEHoQSKZv47O/InIPkEJ/oIgCH2Ptgzfemy5fdo0f5F9BEEQ+iDhNaPCQT4U5fYJP04EEvwFQRB6kHCQD8s7QXH7CIIg9H3CQV5Haf5GtNtHMn9BEIS+R/vCbihk3Q1EZB/R/AVBEPoeqr3VU9w+giAIfR+zE7ePIW4fQRCEvkvY7RPSOuLsMex+/iBuH0EQhD5JtNsnrO+bMZp/go6bmLcVBEEQukJ0YTcs8RiGwgj7/yXzFwRB6HtEF3bDur+homQf0fwFQRD6HkbUZK5w5i9uH0EQhD5OdIYfDvSGuH0EQRD6NtEzecPOHjPK7aMl+AuCIPQ9DKOj2yd6hm8wlKDjJuZtBUEQhK7QluEjbh9BEIT+QnTf/rDbJ7arpwR/QRCEPoeK0vxj3D5K3D6CIAh9lugMPxTH7SOZvyAIQh8kOsMPxnH7SPAXBEHog0Rn+OL2
EQRB6CdEL+AeiuP2ka6egiAIfZDoBdyDcdw+STnDVyl1llJqhVIqpJSaHrV9hFKqRSm1xP53f9S+A5VSXyulSpRSd6rwMjaCIAj9ECOqb3+b5p/8bp/lwBnAR3H2rddaT7X/XR61/T7gUqDY/nfCXo5BEASh12J2pvkbSdzeQWu9Smu9pqvPV0oNAjK11gu09Rs9Cpy2N2MQBEHozcRdzMVQMdsTctyEvKvFSKXUV0qpD5VSh9vbhgBlUc8ps7cJgiD0S4xOunpGZJ8EreTl2N0TlFLvAYVxdt2gtX6lk5eVA0Va651KqQOBl5VSE7/p4JRSlwGXARQVFX3TlwuCICQ9bX37u9fts9vgr7We/U3fVGvtBbz2z4uVUuuBscBWYGjUU4fa2zp7nweABwCmT5+eoOufIAhCzxG9gHuvcft0hlIqXyll2j+Pwirslmqty4F6pdRM2+VzIdDZ3YMgCEKfR8WTfQySW/NXSp2ulCoDDgFeV0q9be86AlimlFoCPA9crrWutvf9BHgQKAHWA2/uzRgEQRB6M2a8gm9U5p8ot89uZZ9dobV+CXgpzvYXgBc6ec0iYNLeHFcQBKGvYMZbzMWQ9g6CIAh9mjY/P7Fr+IZbPfcmzV8QBEHoGtFBPtrnr+wLgPT2EQRB6IPEtnSO3WYaSjJ/QRCEvkh0S+dotw9Y8o9k/oIgCH0QM6qxW7TsA3bwl8xfEASh72FEtXGIbuwGtuwjbh9BEIS+R3Qbh2i3j/W/LOMoCILQJ4lu49Be9rEyfwn+giAIfY7Yrp7WNnH7CIIg9HEii7mEdMTZE+32ScrFXARBEIS9I7qNQzy3j8g+giAIfZDoGb5BcfsIgiD0D6LbOITau30McfsIgiD0WUxDxczwjbh9RPYRBEHouyilbNnHemxGMn9x+wiCIPRZTLuHT3u3jyluH0EQhL5LuLDbvr2DuH0EQRD6MOE2DsH2Vk9x+wiCIPRdDLvg297tY4rbRxAEoe8SdvVE2juI20cQBKHvE8782yZ5xW5PyDET8q6CIAhCl7HcPtZEL0NZ1k+QxVwEQRD6NIZqa+kc1vtBZB9BEIQ+jWFYPv+g1pE1fa3tEBK3jyAIQt8k3Lc/FNKR2b3R2xOBBH9BEIQexlSKkLbaOpvRmb/IPoIgCH0XFe7qqTVRsR/TkPYOgiAIfZbwWr2h9pq/EtlHEAShzxIO8sF2mr8l+yTomIl5W0EQBKGrhOWd9pm/aRBp+bCvkeAvCILQwxiR9g7i9hEEQeg3WIu2xHf7JGXmr5S6TSm1Wim1TCn1klIqO2rf9UqpEqXUGqXU8VHbT7C3lSilfr03xxcEQegLmNFun6ionMztHd4FJmmt9wfWAtcDKKUmAOcAE4ETgHuVUqZSygTuAU4EJgDn2s8VBEHot8S4fXqD7KO1fkdrHbAfLgCG2j/PAZ7WWnu11huAEmCG/a9Ea12qtfYBT9vPFQRB6Lco1baAe3u3T29o7/BD4E375yHAlqh9Zfa2zrYLgiD0W0w7+Mdz+yRqhq9jd09QSr0HFMbZdYPW+hX7OTcAAeCJfTk4pdRlwGUARUVF+/KtBUEQkgbTUHy5uQ6naTAkOyVme6Jkn90Gf6317F3tV0p9HzgZOEa3zUPeCgyLetpQexu72B7v2A8ADwBMnz49MWdAEAShhzl/ZhGZKVY4PnJsfmT75CHZJCj2o/amb4RS6gTg78CRWuvKqO0TgSexNP7BwDygGFBYheFjsIL+F8B5WusVuzvW9OnT9aJFi/Z4rIIgCP0NpdRirfX0ePt2m/nvhrsBN/CuvfLMAq315VrrFUqpZ4GVWHLQFVrroD2YK4G3ARN4uCuBXxAEQdi37FXm351I5i8IgvDN2FXmLzN8BUEQ+iES/AVBEPohEvwFQRD6IRL8BUEQ+iES/AVBEPohEvwFQRD6Ib3G6qmUqgQ27eHL84CqfTicRCBj3HuSfXwgY9xXyBi7xnCtdX68Hb0m+O8NSqlFnXld
kwUZ496T7OMDGeO+Qsa494jsIwiC0A+R4C8IgtAP6S/B/4GeHkAXkDHuPck+PpAx7itkjHtJv9D8BUEQhFj6S+YvCIIgRNGng79S6gSl1BqlVIlS6tc9PR4ApdQwpdR8pdRKpdQKpdTV9vZcpdS7Sql19v85STBWUyn1lVLqNfvxSKXU5/b5fEYp5erh8WUrpZ5XSq1WSq1SSh2SbOdRKXWt/XderpR6Sinl6enzqJR6WCm1Qym1PGpb3POmLO60x7pMKTWtB8d4m/23XqaUekkplR2173p7jGuUUsf3xPii9v1cKaWVUnn24x45h7ujzwZ/pZQJ3AOcCEwAzlVKTejZUQHW+gY/11pPAGYCV9jj+jUwT2tdjLX4TTJcrK4GVkU9vhX4h9Z6DFADXNwjo2rjDuAtrfV4YArWWJPmPCqlhgBXAdO11pOw1rA4h54/j/8BTmi3rbPzdiLWQkzFWEuq3teDY3wXmKS13h9rUajrAezvzznARPs199rf/+4eH0qpYcBxwOaozT11DneN1rpP/gMOAd6Oenw9cH1PjyvOOF8BjgXWAIPsbYOANT08rqFYQeBbwGtYq7BVAY5457cHxpcFbMCuW0VtT5rzCAwBtgC5WAsnvQYcnwznERgBLN/deQP+BZwb73ndPcZ2+04HnrB/jvluYy0WdUhPjA94HisR2Qjk9fQ53NW/Ppv50/bFC1Nmb0salFIjgAOAz4ECrXW5vWs7UNBT47L5J/ArIGQ/HgDUaq0D9uOePp8jgUrgEVuaelAplUYSnUet9Vbgb1hZYDlQBywmuc5jmM7OW7J+j34IvGn/nBRjVErNAbZqrZe225UU42tPXw7+SY1SKh14AbhGa10fvU9b6UGP2bCUUicDO7TWi3tqDF3AAUwD7tNaHwA00U7iSYLzmAPMwbpQDQbSiCMVJBs9fd52h1LqBiz59ImeHksYpVQq8Bvg/3p6LF2lLwf/rcCwqMdD7W09jlLKiRX4n9Bav2hvrlBKDbL3DwJ29NT4gEOBU5VSG4GnsaSfO4BspVR43eeePp9lQJnW+nP78fNYF4NkOo+zgQ1a60qttR94EevcJtN5DNPZeUuq75FS6vvAycD37IsUJMcYR2Nd5Jfa35uhwJdKqcIkGV8H+nLw/wIotp0VLqyC0NweHhNKKQU8BKzSWv89atdc4CL754uwagE9gtb6eq31UK31CKzz9r7W+nvAfOA79tN6eozbgS1KqXH2pmOAlSTRecSSe2YqpVLtv3t4jElzHqPo7LzNBS60HSszgbooeahbUUqdgCVFnqq1bo7aNRc4RynlVkqNxCqsLuzOsWmtv9ZaD9Raj7C/N2XANPtzmjTnMIaeLjok8h9wEpYrYD1wQ0+Pxx7TYVi31MuAJfa/k7A09XnAOuA9ILenx2qP9yjgNfvnUVhfqhLgOcDdw2ObCiyyz+XLQE6ynUfgRmA1sBx4DHD39HkEnsKqQfixgtTFnZ03rEL/PfZ36Gss51JPjbEESzsPf2/uj3r+DfYY1wAn9sT42u3fSFvBt0fO4e7+yQxfQRCEfkhfln0EQRCETpDgLwiC0A+R4C8IgtAPkeAvCILQD5HgLwiC0A+R4C8IgtAPkeAvCILQD5HgLwiC0A/5f5+Xt/DOupeuAAAAAElFTkSuQmCC\n",
      "text/plain": [
       "<Figure size 432x288 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "\n",
    "# Trailing moving average of `rewards`: each point averages the current entry\n",
    "# together with up to REWARD_AVG_WINDOW - 1 entries before it. Near the start,\n",
    "# where fewer entries exist, the average is taken over what is available.\n",
    "REWARD_AVG_WINDOW = 5\n",
    "average_reward = [\n",
    "    # max(0, ...) clamps the slice start so early indices never wrap around.\n",
    "    np.average(rewards[max(0, idx - REWARD_AVG_WINDOW + 1):idx + 1])\n",
    "    for idx in range(len(rewards))\n",
    "]\n",
    "\n",
    "# Raw series first, then the smoothed series drawn on the same axes.\n",
    "plt.plot(rewards)\n",
    "plt.plot(average_reward)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9f18bae5",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "44b0354e",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "58e2db1b",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8385f8b3",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c1d27da3",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "fb4df6e4",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
