{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Oracle Matching Bandits"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Compare the performance of oracle matching bandit algorithms: algorithms which optimize for matching while having full knowledge of the transitions."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "%load_ext autoreload\n",
    "%autoreload 2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import random \n",
    "import matplotlib.pyplot as plt\n",
    "import json \n",
    "import argparse \n",
    "import sys\n",
    "from itertools import combinations"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "from rmab.simulator import RMABSimulator\n",
    "from rmab.baselines import optimal_whittle, random_policy, optimal_q_iteration, myopic_match_n_step\n",
    "from rmab.fr_dynamics import get_all_transitions\n",
    "from rmab.utils import get_save_path, delete_duplicate_results"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "is_jupyter = 'ipykernel' in sys.modules"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "if is_jupyter: \n",
    "    seed        = 42\n",
    "    n_arms      = 4\n",
    "    budget      = 3\n",
    "    discount    = 0.9\n",
    "    alpha       = 3 \n",
    "    n_episodes  = 30\n",
    "    episode_len = 20\n",
    "    n_epochs    = 10\n",
    "    save_name = 'results'\n",
    "    match_prob = 0.5\n",
    "    save_with_date = True \n",
    "else:\n",
    "    parser = argparse.ArgumentParser()\n",
    "    parser.add_argument('--n_arms',         '-N', help='num beneficiaries (arms)', type=int, default=8)\n",
    "    parser.add_argument('--episode_len',    '-H', help='episode length', type=int, default=20)\n",
    "    parser.add_argument('--n_episodes',     '-T', help='num episodes', type=int, default=30)\n",
    "    parser.add_argument('--budget',         '-B', help='budget', type=int, default=3)\n",
    "    parser.add_argument('--n_epochs',       '-E', help='number of epochs (num_repeats)', type=int, default=10)\n",
    "    parser.add_argument('--discount',       '-d', help='discount factor', type=float, default=0.9)\n",
    "    parser.add_argument('--alpha',          '-a', help='alpha: for conf radius', type=float, default=3)\n",
    "    parser.add_argument('--seed',           '-s', help='random seed', type=int, default=42)\n",
    "    parser.add_argument('--save_name',      '-n', help='save name', type=str, default='results')\n",
    "    parser.add_argument('--match_prob',      '-m', help='match probability', type=float, default=0.5)\n",
    "    parser.add_argument('--use_date', action='store_true')\n",
    "\n",
    "    args = parser.parse_args()\n",
    "\n",
    "    n_arms      = args.n_arms\n",
    "    budget      = args.budget\n",
    "    discount    = args.discount\n",
    "    alpha       = args.alpha \n",
    "    seed        = args.seed\n",
    "    n_episodes  = args.n_episodes\n",
    "    episode_len = args.episode_len\n",
    "    n_epochs    = args.n_epochs\n",
    "    save_name   = args.save_name \n",
    "    save_with_date = args.use_date \n",
    "    match_prob = args.match_prob \n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "n_states = 2\n",
    "n_actions = 2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_population_size = 100 # number of random arms to generate\n",
    "all_transitions = get_all_transitions(all_population_size)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(100, 2, 2, 2)"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "all_transitions.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_features = np.arange(all_population_size)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "acting should always be good! 0.000 < 0.044\n",
      "acting should always be good! 0.000 < 0.162\n",
      "acting should always be good! 0.108 < 0.183\n",
      "good start state should always be good! 0.380 < 0.508\n",
      "good start state should always be good! 0.506 < 0.760\n",
      "cohort [83 53 70 45]\n",
      "cohort [41 39 15 76]\n",
      "cohort [79 72 62 94]\n",
      "cohort [92 64 85 36]\n",
      "cohort [ 7 38 78  2]\n",
      "cohort [12 59 91 73]\n",
      "cohort [48 64  7 37]\n",
      "cohort [18 53 12 32]\n",
      "cohort [69 64 53 61]\n",
      "cohort [46 87 15 26]\n"
     ]
    }
   ],
   "source": [
    "np.random.seed(seed)\n",
    "random.seed(seed)\n",
    "simulator = RMABSimulator(all_population_size, all_features, all_transitions,\n",
    "            n_arms, episode_len, n_epochs, n_episodes, budget, number_states=n_states, reward_style='match',match_probability=match_prob)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(4, 2, 2, 2)"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "simulator.reset_instance()\n",
    "simulator.transitions.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "first state [0 1 1 1]\n",
      "instance 0, ep 1, state [1 1 1 1]\n",
      "instance 0, ep 2, state [0 0 0 1]\n",
      "instance 0, ep 3, state [1 1 0 1]\n",
      "instance 0, ep 4, state [0 1 1 1]\n",
      "instance 0, ep 5, state [0 0 0 1]\n",
      "instance 0, ep 6, state [0 0 0 1]\n",
      "instance 0, ep 7, state [0 1 1 0]\n",
      "instance 0, ep 8, state [1 1 0 1]\n",
      "instance 0, ep 9, state [1 1 1 1]\n",
      "instance 0, ep 10, state [0 0 0 0]\n",
      "instance 0, ep 11, state [0 1 0 0]\n",
      "instance 0, ep 12, state [0 1 0 1]\n",
      "instance 0, ep 13, state [0 0 0 0]\n",
      "instance 0, ep 14, state [1 0 1 0]\n",
      "instance 0, ep 15, state [0 0 0 1]\n",
      "instance 0, ep 16, state [0 0 0 0]\n",
      "instance 0, ep 17, state [1 1 0 1]\n",
      "instance 0, ep 18, state [0 1 0 0]\n",
      "instance 0, ep 19, state [0 1 1 1]\n",
      "instance 0, ep 20, state [0 1 1 0]\n",
      "instance 0, ep 21, state [0 0 1 0]\n",
      "instance 0, ep 22, state [1 0 1 1]\n",
      "instance 0, ep 23, state [0 1 1 1]\n",
      "instance 0, ep 24, state [0 0 1 1]\n",
      "instance 0, ep 25, state [0 0 1 0]\n",
      "instance 0, ep 26, state [1 1 1 1]\n",
      "instance 0, ep 27, state [0 1 1 0]\n",
      "instance 0, ep 28, state [0 1 1 0]\n",
      "instance 0, ep 29, state [1 1 1 1]\n",
      "first state [1 0 0 0]\n",
      "instance 1, ep 1, state [1 0 0 1]\n",
      "instance 1, ep 2, state [0 0 0 0]\n",
      "instance 1, ep 3, state [1 0 1 0]\n",
      "instance 1, ep 4, state [1 0 0 1]\n",
      "instance 1, ep 5, state [1 1 0 0]\n",
      "instance 1, ep 6, state [0 1 0 1]\n",
      "instance 1, ep 7, state [0 1 0 1]\n",
      "instance 1, ep 8, state [0 0 1 0]\n",
      "instance 1, ep 9, state [0 1 1 0]\n",
      "instance 1, ep 10, state [0 0 1 0]\n",
      "instance 1, ep 11, state [0 0 0 1]\n",
      "instance 1, ep 12, state [0 1 0 0]\n",
      "instance 1, ep 13, state [0 0 1 1]\n",
      "instance 1, ep 14, state [1 1 0 1]\n",
      "instance 1, ep 15, state [0 1 0 0]\n",
      "instance 1, ep 16, state [0 0 0 0]\n",
      "instance 1, ep 17, state [1 0 0 1]\n",
      "instance 1, ep 18, state [1 0 0 1]\n",
      "instance 1, ep 19, state [0 1 1 0]\n",
      "instance 1, ep 20, state [0 1 1 1]\n",
      "instance 1, ep 21, state [1 1 1 1]\n",
      "instance 1, ep 22, state [1 1 1 1]\n",
      "instance 1, ep 23, state [1 0 1 1]\n",
      "instance 1, ep 24, state [1 1 1 0]\n",
      "instance 1, ep 25, state [0 0 0 0]\n",
      "instance 1, ep 26, state [1 0 1 0]\n",
      "instance 1, ep 27, state [1 0 0 0]\n",
      "instance 1, ep 28, state [1 0 1 0]\n",
      "instance 1, ep 29, state [0 1 1 0]\n",
      "first state [1 0 0 1]\n",
      "instance 2, ep 1, state [0 1 0 1]\n",
      "instance 2, ep 2, state [0 1 1 1]\n",
      "instance 2, ep 3, state [0 1 1 1]\n",
      "instance 2, ep 4, state [1 1 0 1]\n",
      "instance 2, ep 5, state [1 1 0 0]\n",
      "instance 2, ep 6, state [1 1 0 1]\n",
      "instance 2, ep 7, state [0 0 0 0]\n",
      "instance 2, ep 8, state [1 0 1 1]\n",
      "instance 2, ep 9, state [1 1 0 1]\n",
      "instance 2, ep 10, state [1 0 1 1]\n",
      "instance 2, ep 11, state [1 1 1 0]\n",
      "instance 2, ep 12, state [1 1 0 0]\n",
      "instance 2, ep 13, state [0 1 1 0]\n",
      "instance 2, ep 14, state [1 0 1 1]\n",
      "instance 2, ep 15, state [1 0 0 0]\n",
      "instance 2, ep 16, state [0 1 1 1]\n",
      "instance 2, ep 17, state [1 1 1 1]\n",
      "instance 2, ep 18, state [1 0 0 0]\n",
      "instance 2, ep 19, state [1 1 0 1]\n",
      "instance 2, ep 20, state [1 0 0 1]\n",
      "instance 2, ep 21, state [1 1 1 1]\n",
      "instance 2, ep 22, state [1 1 1 0]\n",
      "instance 2, ep 23, state [0 0 1 1]\n",
      "instance 2, ep 24, state [1 0 0 0]\n",
      "instance 2, ep 25, state [0 1 0 0]\n",
      "instance 2, ep 26, state [1 0 1 1]\n",
      "instance 2, ep 27, state [0 1 1 1]\n",
      "instance 2, ep 28, state [0 1 0 0]\n",
      "instance 2, ep 29, state [0 1 0 0]\n",
      "first state [0 1 1 0]\n",
      "instance 3, ep 1, state [1 1 0 0]\n",
      "instance 3, ep 2, state [0 0 0 0]\n",
      "instance 3, ep 3, state [0 0 1 0]\n",
      "instance 3, ep 4, state [1 0 1 0]\n",
      "instance 3, ep 5, state [0 1 1 1]\n",
      "instance 3, ep 6, state [0 0 1 1]\n",
      "instance 3, ep 7, state [1 1 0 1]\n",
      "instance 3, ep 8, state [0 0 0 1]\n",
      "instance 3, ep 9, state [0 0 1 0]\n",
      "instance 3, ep 10, state [1 0 0 1]\n",
      "instance 3, ep 11, state [0 0 0 0]\n",
      "instance 3, ep 12, state [1 0 1 0]\n",
      "instance 3, ep 13, state [1 1 1 0]\n",
      "instance 3, ep 14, state [0 0 1 1]\n",
      "instance 3, ep 15, state [1 0 1 1]\n",
      "instance 3, ep 16, state [0 0 1 1]\n",
      "instance 3, ep 17, state [1 0 1 0]\n",
      "instance 3, ep 18, state [0 0 1 1]\n",
      "instance 3, ep 19, state [1 0 1 0]\n",
      "instance 3, ep 20, state [1 0 0 0]\n",
      "instance 3, ep 21, state [0 1 1 0]\n",
      "instance 3, ep 22, state [1 0 1 1]\n",
      "instance 3, ep 23, state [1 0 1 1]\n",
      "instance 3, ep 24, state [0 0 1 1]\n",
      "instance 3, ep 25, state [1 1 1 0]\n",
      "instance 3, ep 26, state [0 0 1 0]\n",
      "instance 3, ep 27, state [1 1 1 0]\n",
      "instance 3, ep 28, state [1 0 1 0]\n",
      "instance 3, ep 29, state [0 1 0 0]\n",
      "first state [0 1 0 1]\n",
      "instance 4, ep 1, state [0 0 0 0]\n",
      "instance 4, ep 2, state [1 0 1 0]\n",
      "instance 4, ep 3, state [1 0 0 1]\n",
      "instance 4, ep 4, state [0 0 1 1]\n",
      "instance 4, ep 5, state [0 0 1 0]\n",
      "instance 4, ep 6, state [0 0 1 1]\n",
      "instance 4, ep 7, state [0 0 0 1]\n",
      "instance 4, ep 8, state [0 0 1 0]\n",
      "instance 4, ep 9, state [1 0 0 0]\n",
      "instance 4, ep 10, state [1 1 1 0]\n",
      "instance 4, ep 11, state [1 0 0 1]\n",
      "instance 4, ep 12, state [0 0 0 0]\n",
      "instance 4, ep 13, state [0 1 0 1]\n",
      "instance 4, ep 14, state [1 0 0 0]\n",
      "instance 4, ep 15, state [1 0 1 0]\n",
      "instance 4, ep 16, state [1 0 0 1]\n",
      "instance 4, ep 17, state [1 0 1 0]\n",
      "instance 4, ep 18, state [1 1 0 0]\n",
      "instance 4, ep 19, state [0 1 1 0]\n",
      "instance 4, ep 20, state [0 1 1 1]\n",
      "instance 4, ep 21, state [0 0 0 1]\n",
      "instance 4, ep 22, state [0 1 0 1]\n",
      "instance 4, ep 23, state [1 1 0 0]\n",
      "instance 4, ep 24, state [0 1 1 1]\n",
      "instance 4, ep 25, state [1 1 0 1]\n",
      "instance 4, ep 26, state [0 0 1 0]\n",
      "instance 4, ep 27, state [0 1 0 1]\n",
      "instance 4, ep 28, state [0 0 0 0]\n",
      "instance 4, ep 29, state [1 0 1 0]\n",
      "first state [0 1 1 1]\n",
      "instance 5, ep 1, state [0 0 1 0]\n",
      "instance 5, ep 2, state [1 1 1 1]\n",
      "instance 5, ep 3, state [1 0 1 0]\n",
      "instance 5, ep 4, state [0 1 1 1]\n",
      "instance 5, ep 5, state [1 0 0 1]\n",
      "instance 5, ep 6, state [0 0 0 0]\n",
      "instance 5, ep 7, state [0 0 0 0]\n",
      "instance 5, ep 8, state [1 0 0 1]\n",
      "instance 5, ep 9, state [0 1 1 0]\n",
      "instance 5, ep 10, state [0 1 1 0]\n",
      "instance 5, ep 11, state [1 0 1 0]\n",
      "instance 5, ep 12, state [1 1 1 1]\n",
      "instance 5, ep 13, state [0 0 0 0]\n",
      "instance 5, ep 14, state [1 0 0 1]\n",
      "instance 5, ep 15, state [1 1 1 0]\n",
      "instance 5, ep 16, state [0 1 1 0]\n",
      "instance 5, ep 17, state [1 0 0 1]\n",
      "instance 5, ep 18, state [1 1 0 1]\n",
      "instance 5, ep 19, state [0 0 1 1]\n",
      "instance 5, ep 20, state [1 1 1 1]\n",
      "instance 5, ep 21, state [0 0 0 0]\n",
      "instance 5, ep 22, state [1 0 0 0]\n",
      "instance 5, ep 23, state [1 0 1 0]\n",
      "instance 5, ep 24, state [0 1 1 0]\n",
      "instance 5, ep 25, state [1 1 0 1]\n",
      "instance 5, ep 26, state [1 1 1 1]\n",
      "instance 5, ep 27, state [1 1 1 1]\n",
      "instance 5, ep 28, state [1 1 0 1]\n",
      "instance 5, ep 29, state [1 0 1 0]\n",
      "first state [0 0 1 0]\n",
      "instance 6, ep 1, state [1 0 1 0]\n",
      "instance 6, ep 2, state [1 1 1 1]\n",
      "instance 6, ep 3, state [1 1 0 0]\n",
      "instance 6, ep 4, state [1 1 1 0]\n",
      "instance 6, ep 5, state [0 0 1 0]\n",
      "instance 6, ep 6, state [0 0 0 1]\n",
      "instance 6, ep 7, state [0 1 0 0]\n",
      "instance 6, ep 8, state [0 0 0 0]\n",
      "instance 6, ep 9, state [1 0 1 1]\n",
      "instance 6, ep 10, state [1 0 0 0]\n",
      "instance 6, ep 11, state [0 1 0 0]\n",
      "instance 6, ep 12, state [1 1 1 0]\n",
      "instance 6, ep 13, state [0 1 0 0]\n",
      "instance 6, ep 14, state [0 0 0 0]\n",
      "instance 6, ep 15, state [1 1 1 0]\n",
      "instance 6, ep 16, state [0 0 1 1]\n",
      "instance 6, ep 17, state [0 1 0 1]\n",
      "instance 6, ep 18, state [1 1 1 1]\n",
      "instance 6, ep 19, state [0 1 0 1]\n",
      "instance 6, ep 20, state [1 1 0 1]\n",
      "instance 6, ep 21, state [1 1 0 0]\n",
      "instance 6, ep 22, state [0 0 1 0]\n",
      "instance 6, ep 23, state [1 0 0 1]\n",
      "instance 6, ep 24, state [1 0 1 1]\n",
      "instance 6, ep 25, state [0 1 1 1]\n",
      "instance 6, ep 26, state [0 1 0 0]\n",
      "instance 6, ep 27, state [0 0 1 1]\n",
      "instance 6, ep 28, state [1 0 0 0]\n",
      "instance 6, ep 29, state [1 0 1 1]\n",
      "first state [1 0 1 0]\n",
      "instance 7, ep 1, state [1 0 0 0]\n",
      "instance 7, ep 2, state [1 0 1 1]\n",
      "instance 7, ep 3, state [0 1 0 1]\n",
      "instance 7, ep 4, state [0 1 1 1]\n",
      "instance 7, ep 5, state [1 0 1 1]\n",
      "instance 7, ep 6, state [1 0 1 1]\n",
      "instance 7, ep 7, state [1 0 1 0]\n",
      "instance 7, ep 8, state [1 0 1 1]\n",
      "instance 7, ep 9, state [0 1 0 1]\n",
      "instance 7, ep 10, state [1 1 1 1]\n",
      "instance 7, ep 11, state [0 0 1 1]\n",
      "instance 7, ep 12, state [1 1 0 1]\n",
      "instance 7, ep 13, state [0 1 0 0]\n",
      "instance 7, ep 14, state [0 0 1 0]\n",
      "instance 7, ep 15, state [0 0 0 0]\n",
      "instance 7, ep 16, state [0 1 1 1]\n",
      "instance 7, ep 17, state [0 0 1 1]\n",
      "instance 7, ep 18, state [0 0 0 0]\n",
      "instance 7, ep 19, state [0 1 1 1]\n",
      "instance 7, ep 20, state [1 1 1 1]\n",
      "instance 7, ep 21, state [0 0 0 1]\n",
      "instance 7, ep 22, state [1 0 1 0]\n",
      "instance 7, ep 23, state [1 0 0 0]\n",
      "instance 7, ep 24, state [0 0 0 1]\n",
      "instance 7, ep 25, state [1 0 1 1]\n",
      "instance 7, ep 26, state [0 0 0 0]\n",
      "instance 7, ep 27, state [1 0 1 1]\n",
      "instance 7, ep 28, state [0 1 0 1]\n",
      "instance 7, ep 29, state [0 1 1 0]\n",
      "first state [0 0 1 1]\n",
      "instance 8, ep 1, state [0 1 0 1]\n",
      "instance 8, ep 2, state [0 0 1 0]\n",
      "instance 8, ep 3, state [1 1 1 0]\n",
      "instance 8, ep 4, state [0 0 1 1]\n",
      "instance 8, ep 5, state [1 1 1 1]\n",
      "instance 8, ep 6, state [0 1 0 1]\n",
      "instance 8, ep 7, state [1 1 0 0]\n",
      "instance 8, ep 8, state [0 0 0 1]\n",
      "instance 8, ep 9, state [1 0 0 0]\n",
      "instance 8, ep 10, state [1 1 1 0]\n",
      "instance 8, ep 11, state [1 1 0 1]\n",
      "instance 8, ep 12, state [0 1 0 1]\n",
      "instance 8, ep 13, state [1 1 1 0]\n",
      "instance 8, ep 14, state [0 0 0 1]\n",
      "instance 8, ep 15, state [0 1 1 1]\n",
      "instance 8, ep 16, state [0 1 1 0]\n",
      "instance 8, ep 17, state [1 1 0 1]\n",
      "instance 8, ep 18, state [0 0 0 0]\n",
      "instance 8, ep 19, state [0 0 1 1]\n",
      "instance 8, ep 20, state [1 0 0 1]\n",
      "instance 8, ep 21, state [0 0 1 0]\n",
      "instance 8, ep 22, state [1 1 0 0]\n",
      "instance 8, ep 23, state [1 0 0 1]\n",
      "instance 8, ep 24, state [0 1 1 0]\n",
      "instance 8, ep 25, state [0 0 0 0]\n",
      "instance 8, ep 26, state [1 0 1 1]\n",
      "instance 8, ep 27, state [1 1 0 1]\n",
      "instance 8, ep 28, state [1 0 0 1]\n",
      "instance 8, ep 29, state [0 0 0 0]\n",
      "first state [1 1 1 0]\n",
      "instance 9, ep 1, state [1 1 0 0]\n",
      "instance 9, ep 2, state [0 0 1 0]\n",
      "instance 9, ep 3, state [1 0 0 0]\n",
      "instance 9, ep 4, state [0 0 1 1]\n",
      "instance 9, ep 5, state [1 0 0 0]\n",
      "instance 9, ep 6, state [1 0 0 1]\n",
      "instance 9, ep 7, state [0 0 0 1]\n",
      "instance 9, ep 8, state [1 0 0 1]\n",
      "instance 9, ep 9, state [1 0 1 0]\n",
      "instance 9, ep 10, state [1 1 0 1]\n",
      "instance 9, ep 11, state [1 1 0 0]\n",
      "instance 9, ep 12, state [0 1 0 1]\n",
      "instance 9, ep 13, state [1 0 1 0]\n",
      "instance 9, ep 14, state [1 0 0 0]\n",
      "instance 9, ep 15, state [0 1 1 1]\n",
      "instance 9, ep 16, state [0 0 0 1]\n",
      "instance 9, ep 17, state [1 0 0 1]\n",
      "instance 9, ep 18, state [1 1 1 0]\n",
      "instance 9, ep 19, state [0 1 1 0]\n",
      "instance 9, ep 20, state [1 1 1 1]\n",
      "instance 9, ep 21, state [0 1 1 1]\n",
      "instance 9, ep 22, state [1 1 0 1]\n",
      "instance 9, ep 23, state [1 1 1 1]\n",
      "instance 9, ep 24, state [0 1 0 0]\n",
      "instance 9, ep 25, state [1 1 0 0]\n",
      "instance 9, ep 26, state [1 0 0 0]\n",
      "instance 9, ep 27, state [0 0 0 0]\n",
      "instance 9, ep 28, state [1 1 1 0]\n",
      "instance 9, ep 29, state [0 1 0 0]\n"
     ]
    }
   ],
   "source": [
    "np.random.seed(seed)\n",
    "random.seed(seed)\n",
    "random_rewards = random_policy(simulator, n_episodes, n_epochs)\n",
    "random_active_rate = simulator.total_active/(random_rewards.size * n_arms)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "first state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "instance 0, ep 1, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.39 0.54 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.26 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.39 0.54 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "instance 0, ep 2, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.39 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 0 0 1] state_WI [0.39 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.26 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "instance 0, ep 3, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "instance 0, ep 4, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.39 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "instance 0, ep 5, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.39 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.39 0.54 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "instance 0, ep 6, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.39 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.26 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 0 0 1] state_WI [0.39 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "instance 0, ep 7, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 0 0 1] state_WI [0.26 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "instance 0, ep 8, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.39 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "instance 0, ep 9, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 0 0 1] state_WI [0.39 0.54 0.58 0.26] sorted [2 1 0]\n",
      "instance 0, ep 10, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.39 0.54 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "instance 0, ep 11, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "instance 0, ep 12, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [0.26 0.54 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.39 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "instance 0, ep 13, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.39 0.54 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 0 0 0] state_WI [0.39 0.54 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "instance 0, ep 14, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 0 0 1] state_WI [0.39 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "instance 0, ep 15, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.39 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "instance 0, ep 16, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.39 0.54 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "instance 0, ep 17, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "instance 0, ep 18, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "instance 0, ep 19, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 0 0 0] state_WI [0.26 0.54 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 0 0 1] state_WI [0.39 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "instance 0, ep 20, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "instance 0, ep 21, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.39 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "instance 0, ep 22, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "instance 0, ep 23, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "instance 0, ep 24, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "instance 0, ep 25, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.26 0.54 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 0 0 0] state_WI [0.39 0.54 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "instance 0, ep 26, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 0 0 0] state_WI [0.26 0.54 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "instance 0, ep 27, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.39 0.54 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "instance 0, ep 28, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 0 1 1] state_WI [0.26 0.54 0.47 0.26] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 0 0 0] state_WI [0.39 0.54 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "instance 0, ep 29, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.26 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.26 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.26 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.26 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 1 0 0] state_WI [0.39 0.47 0.58 0.71] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.39 0.54 0.47 0.71] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 0.47 0.47 0.71] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 0.47 0.58 0.26] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.26 0.47 0.47 0.26] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.39 0.54 0.47 0.26] sorted [1 2 0]\n",
      "first state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 0 1 0] state_WI [0.44 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.44 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "instance 1, ep 1, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "instance 1, ep 2, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.44 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "instance 1, ep 3, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.44 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "instance 1, ep 4, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.44 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.44 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "instance 1, ep 5, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 0] state_WI [0.44 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "instance 1, ep 6, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 0 1 0] state_WI [0.44 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 0 1 0] state_WI [0.44 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "instance 1, ep 7, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "instance 1, ep 8, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.44 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 0 1 0] state_WI [0.44 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "instance 1, ep 9, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 0] state_WI [0.44 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "instance 1, ep 10, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.44 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "instance 1, ep 11, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "instance 1, ep 12, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "instance 1, ep 13, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "instance 1, ep 14, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "instance 1, ep 15, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 0 0 0] state_WI [0.44 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 0 1 0] state_WI [0.44 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "instance 1, ep 16, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.44 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "instance 1, ep 17, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "instance 1, ep 18, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "instance 1, ep 19, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "instance 1, ep 20, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 0 0 0] state_WI [0.44 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "instance 1, ep 21, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "instance 1, ep 22, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 0 1 0] state_WI [0.44 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "instance 1, ep 23, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.44 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 0 0 0] state_WI [0.44 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.44 0.52 0.39 0.91] sorted [3 1 0]\n",
      "instance 1, ep 24, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 0] state_WI [0.44 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 0] state_WI [0.44 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "instance 1, ep 25, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.44 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 0 0 0] state_WI [0.44 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "instance 1, ep 26, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 0 0 0] state_WI [0.44 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "instance 1, ep 27, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.44 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.44 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "instance 1, ep 28, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 0 1 1] state_WI [0.44 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.44 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [0 1 0 1] state_WI [0.44 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "instance 1, ep 29, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [0.43 0.52 0.36 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.43 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.43 0.32 0.39 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.43 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.43 0.52 0.36 0.18] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [0.44 0.32 0.36 0.18] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.44 0.32 0.36 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.43 0.52 0.39 0.18] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.43 0.52 0.39 0.91] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.43 0.32 0.39 0.91] sorted [3 0 2]\n",
      "first state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [0.38 0.61 1.   0.77] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "instance 2, ep 1, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 0 0 0] state_WI [0.54 0.61 1.   0.77] sorted [2 3 1]\n",
      "   state [0 1 0 0] state_WI [0.54 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "instance 2, ep 2, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 0 0] state_WI [0.54 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.54 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.54 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "instance 2, ep 3, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.61 1.   0.77] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "instance 2, ep 4, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 0 0] state_WI [0.38 0.61 1.   0.77] sorted [2 3 1]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "instance 2, ep 5, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "instance 2, ep 6, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.54 0.32 1.   0.77] sorted [2 3 0]\n",
      "instance 2, ep 7, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.54 0.61 1.   0.77] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 1 0] state_WI [0.54 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [0.38 0.61 1.   0.77] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 0 0] state_WI [0.54 0.61 1.   0.77] sorted [2 3 1]\n",
      "instance 2, ep 8, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.54 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "instance 2, ep 9, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "instance 2, ep 10, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "instance 2, ep 11, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "instance 2, ep 12, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 1 0] state_WI [0.54 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.54 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "instance 2, ep 13, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "instance 2, ep 14, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "instance 2, ep 15, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.61 1.   0.77] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [0.38 0.61 1.   0.77] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "instance 2, ep 16, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 0 0] state_WI [0.38 0.61 1.   0.77] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "instance 2, ep 17, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "instance 2, ep 18, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.61 1.   0.77] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 0 1 0] state_WI [0.54 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "instance 2, ep 19, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "instance 2, ep 20, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "instance 2, ep 21, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 0 1 0] state_WI [0.54 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "instance 2, ep 22, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "instance 2, ep 23, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.54 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "instance 2, ep 24, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.61 1.   0.77] sorted [2 3 1]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "instance 2, ep 25, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.54 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.54 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "instance 2, ep 26, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.38 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "instance 2, ep 27, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.38 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "instance 2, ep 28, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.54 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.54 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 1 0] state_WI [0.54 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.54 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [0 0 1 1] state_WI [0.54 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 0 0 0] state_WI [0.54 0.61 1.   0.77] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "instance 2, ep 29, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.54 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 0 0 1] state_WI [0.54 0.61 1.   0.27] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.54 0.32 1.   0.77] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.54 0.61 0.21 0.77] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [0.38 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.54 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.32 0.21 0.27] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.38 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.61 0.21 0.27] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.54 0.32 1.   0.27] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.54 0.32 0.21 0.77] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.38 0.61 1.   0.27] sorted [2 1 0]\n",
      "first state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [1.   0.3  0.49 0.66] sorted [0 3 2]\n",
      "   state [0 0 0 1] state_WI [1.   0.45 0.49 0.33] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [1 1 0 0] state_WI [0.18 0.3  0.49 0.66] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "instance 3, ep 1, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [0.18 0.3  0.49 0.66] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "instance 3, ep 2, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [1.   0.45 0.49 0.66] sorted [0 3 2]\n",
      "   state [0 0 0 1] state_WI [1.   0.45 0.49 0.33] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [1.   0.3  0.49 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [1.   0.3  0.49 0.66] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "instance 3, ep 3, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "instance 3, ep 4, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.18 0.3  0.49 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [1.   0.3  0.49 0.33] sorted [0 2 3]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "instance 3, ep 5, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 0 0] state_WI [0.18 0.45 0.49 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "instance 3, ep 6, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 0 0] state_WI [0.18 0.45 0.49 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "instance 3, ep 7, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [1.   0.3  0.49 0.33] sorted [0 2 3]\n",
      "   state [1 1 0 0] state_WI [0.18 0.3  0.49 0.66] sorted [3 2 1]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [1.   0.45 0.49 0.33] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "instance 3, ep 8, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [1.   0.45 0.49 0.33] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "instance 3, ep 9, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 0 0] state_WI [0.18 0.45 0.49 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.18 0.3  0.49 0.66] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "instance 3, ep 10, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [1.   0.3  0.49 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [0 0 0 1] state_WI [1.   0.45 0.49 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "instance 3, ep 11, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [1.   0.45 0.49 0.66] sorted [0 3 2]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "instance 3, ep 12, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "instance 3, ep 13, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [1.   0.3  0.49 0.33] sorted [0 2 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [1.   0.3  0.49 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "instance 3, ep 14, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "instance 3, ep 15, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [1.   0.3  0.49 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "instance 3, ep 16, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.18 0.3  0.49 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "instance 3, ep 17, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [1.   0.3  0.49 0.33] sorted [0 2 3]\n",
      "   state [1 0 0 0] state_WI [0.18 0.45 0.49 0.66] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 0 0] state_WI [0.18 0.45 0.49 0.66] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [1.   0.3  0.49 0.66] sorted [0 3 2]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "instance 3, ep 18, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [1.   0.3  0.49 0.66] sorted [0 3 2]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "instance 3, ep 19, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "instance 3, ep 20, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.18 0.45 0.49 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 0 0] state_WI [0.18 0.3  0.49 0.66] sorted [3 2 1]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "instance 3, ep 21, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "instance 3, ep 22, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [1.   0.45 0.49 0.33] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "instance 3, ep 23, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 0 0] state_WI [1.   0.45 0.49 0.66] sorted [0 3 2]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "instance 3, ep 24, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 0 0] state_WI [0.18 0.45 0.49 0.66] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [1.   0.3  0.49 0.33] sorted [0 2 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 0 0] state_WI [0.18 0.3  0.49 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "instance 3, ep 25, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "instance 3, ep 26, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "instance 3, ep 27, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [0.18 0.45 0.49 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [0.18 0.3  0.49 0.33] sorted [2 3 1]\n",
      "instance 3, ep 28, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [1.   0.3  0.55 0.66] sorted [0 3 2]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [1.   0.3  0.49 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "instance 3, ep 29, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [1.   0.3  0.49 0.66] sorted [0 3 2]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [1.   0.3  0.49 0.33] sorted [0 2 3]\n",
      "   state [1 0 0 0] state_WI [0.18 0.45 0.49 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [0.18 0.45 0.55 0.66] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [1.   0.45 0.55 0.66] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.18 0.3  0.55 0.33] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [1.   0.3  0.55 0.33] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [0.18 0.45 0.55 0.33] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [1.   0.45 0.55 0.33] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.18 0.3  0.55 0.66] sorted [3 2 1]\n",
      "first state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [ 0.24  0.47  0.27 -0.07] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 1] state_WI [ 0.24  0.38  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "instance 4, ep 1, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "instance 4, ep 2, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 1] state_WI [ 0.14  0.38  0.21 -0.07] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [ 0.14  0.47  0.21 -0.07] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "instance 4, ep 3, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [ 0.14  0.38  0.27 -0.07] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "instance 4, ep 4, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [ 0.24  0.38  0.21 -0.07] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "instance 4, ep 5, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [ 0.14  0.47  0.21 -0.07] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "instance 4, ep 6, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [ 0.24  0.38  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "instance 4, ep 7, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [ 0.24  0.38  0.27 -0.07] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "instance 4, ep 8, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "instance 4, ep 9, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "instance 4, ep 10, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "instance 4, ep 11, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [ 0.14  0.38  0.27 -0.07] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "instance 4, ep 12, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 1] state_WI [ 0.24  0.38  0.21 -0.07] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "instance 4, ep 13, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [ 0.24  0.47  0.27 -0.07] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "instance 4, ep 14, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 0 1] state_WI [ 0.14  0.38  0.27 -0.07] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "instance 4, ep 15, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [ 0.14  0.38  0.21 -0.07] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [ 0.14  0.47  0.21 -0.07] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "instance 4, ep 16, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [ 0.14  0.38  0.27 -0.07] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "instance 4, ep 17, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 1] state_WI [ 0.24  0.38  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 0 1 1] state_WI [ 0.24  0.38  0.21 -0.07] sorted [1 0 2]\n",
      "instance 4, ep 18, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 1] state_WI [ 0.14  0.38  0.21 -0.07] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "instance 4, ep 19, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 1] state_WI [ 0.14  0.38  0.21 -0.07] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "instance 4, ep 20, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [ 0.14  0.47  0.21 -0.07] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 1] state_WI [ 0.24  0.38  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "instance 4, ep 21, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [ 0.24  0.38  0.27 -0.07] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 1] state_WI [ 0.24  0.38  0.27 -0.07] sorted [1 2 0]\n",
      "   state [0 0 1 1] state_WI [ 0.24  0.38  0.21 -0.07] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "instance 4, ep 22, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [ 0.24  0.47  0.27 -0.07] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [ 0.14  0.47  0.21 -0.07] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "instance 4, ep 23, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "instance 4, ep 24, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 0 1 1] state_WI [ 0.24  0.38  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 1] state_WI [ 0.24  0.47  0.27 -0.07] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [ 0.14  0.47  0.21 -0.07] sorted [1 2 0]\n",
      "instance 4, ep 25, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [ 0.14  0.47  0.27 -0.07] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "instance 4, ep 26, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 1] state_WI [ 0.14  0.47  0.21 -0.07] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "instance 4, ep 27, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [ 0.24  0.47  0.27 -0.07] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [ 0.24  0.47  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 1] state_WI [ 0.14  0.38  0.21 -0.07] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "instance 4, ep 28, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [0.14 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 0 0 1] state_WI [ 0.14  0.38  0.27 -0.07] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 1] state_WI [ 0.24  0.38  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 1] state_WI [ 0.24  0.38  0.21 -0.07] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "instance 4, ep 29, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 0 0] state_WI [0.14 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 1] state_WI [ 0.24  0.38  0.21 -0.07] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [0.14 0.38 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.24 0.38 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.24 0.38 0.27 0.04] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.24 0.47 0.27 0.04] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [0.14 0.47 0.21 0.04] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.24 0.47 0.21 0.04] sorted [1 0 2]\n",
      "first state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 0 0 0] state_WI [0.3  0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [0.3  0.32 0.58 0.38] sorted [2 3 1]\n",
      "instance 5, ep 1, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "instance 5, ep 2, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "instance 5, ep 3, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [0.3  0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [0.33 0.46 0.58 0.31] sorted [2 1 0]\n",
      "instance 5, ep 4, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [0.3  0.32 0.58 0.31] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "instance 5, ep 5, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.3  0.46 0.58 0.31] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "instance 5, ep 6, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.33 0.32 0.58 0.38] sorted [2 3 0]\n",
      "   state [0 1 0 0] state_WI [0.33 0.32 0.58 0.38] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 0 0] state_WI [0.33 0.32 0.58 0.38] sorted [2 3 0]\n",
      "   state [0 1 0 0] state_WI [0.33 0.32 0.58 0.38] sorted [2 3 0]\n",
      "   state [1 0 0 0] state_WI [0.3  0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [0.33 0.46 0.58 0.31] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "instance 5, ep 7, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "instance 5, ep 8, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.3  0.46 0.58 0.31] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 0 0 0] state_WI [0.3  0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "instance 5, ep 9, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 0 0] state_WI [0.33 0.32 0.58 0.38] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 0 0] state_WI [0.33 0.32 0.58 0.38] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 0 0 1] state_WI [0.3  0.46 0.58 0.31] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.33 0.32 0.58 0.38] sorted [2 3 0]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 0 1] state_WI [0.33 0.46 0.58 0.31] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "instance 5, ep 10, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 0 0 1] state_WI [0.3  0.46 0.58 0.31] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.33 0.32 0.58 0.38] sorted [2 3 0]\n",
      "   state [0 1 0 0] state_WI [0.33 0.32 0.58 0.38] sorted [2 3 0]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "instance 5, ep 11, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "instance 5, ep 12, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [0 0 0 1] state_WI [0.33 0.46 0.58 0.31] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "instance 5, ep 13, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [0.33 0.46 0.58 0.31] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "instance 5, ep 14, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.3  0.46 0.58 0.31] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.33 0.32 0.58 0.38] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "instance 5, ep 15, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "instance 5, ep 16, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 0 0] state_WI [0.33 0.32 0.58 0.38] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "instance 5, ep 17, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.3  0.46 0.58 0.31] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 0 1] state_WI [0.33 0.46 0.58 0.31] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "instance 5, ep 18, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.3  0.32 0.58 0.31] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 0 0] state_WI [0.33 0.32 0.58 0.38] sorted [2 3 0]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 0 1] state_WI [0.33 0.46 0.58 0.31] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.3  0.32 0.58 0.31] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [0 1 0 0] state_WI [0.33 0.32 0.58 0.38] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "instance 5, ep 19, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 0 0 1] state_WI [0.33 0.46 0.58 0.31] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "instance 5, ep 20, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.3  0.32 0.58 0.38] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "instance 5, ep 21, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.33 0.32 0.58 0.38] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "instance 5, ep 22, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.3  0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 0 1] state_WI [0.3  0.32 0.58 0.31] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [0.33 0.46 0.58 0.31] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 0 0 1] state_WI [0.33 0.46 0.58 0.31] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.33 0.32 0.58 0.38] sorted [2 3 0]\n",
      "instance 5, ep 23, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.3  0.32 0.58 0.31] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 1 0 1] state_WI [0.3  0.32 0.58 0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [0.3  0.32 0.58 0.31] sorted [2 1 3]\n",
      "instance 5, ep 24, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.3  0.46 0.58 0.31] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [0.3  0.32 0.58 0.31] sorted [2 1 3]\n",
      "   state [1 1 0 0] state_WI [0.3  0.32 0.58 0.38] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "instance 5, ep 25, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.3  0.32 0.58 0.31] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [1 1 0 1] state_WI [0.3  0.32 0.58 0.31] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 0 1] state_WI [0.33 0.46 0.58 0.31] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.3  0.32 0.58 0.31] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "instance 5, ep 26, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 0 1] state_WI [0.33 0.46 0.58 0.31] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.3  0.46 0.58 0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.3  0.32 0.58 0.38] sorted [2 3 1]\n",
      "instance 5, ep 27, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.3  0.32 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 0 0 0] state_WI [0.33 0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "instance 5, ep 28, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.3  0.32 0.58 0.31] sorted [2 1 3]\n",
      "   state [1 0 0 1] state_WI [0.3  0.46 0.58 0.31] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [0.3  0.32 0.6  0.38] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [0.33 0.46 0.58 0.31] sorted [2 1 0]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [0.3  0.46 0.6  0.31] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "instance 5, ep 29, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.3  0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [0.3  0.32 0.58 0.31] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [0.3  0.32 0.58 0.38] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.33 0.32 0.6  0.38] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [0.3  0.46 0.58 0.38] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.33 0.32 0.58 0.31] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [0.3  0.32 0.58 0.38] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.33 0.32 0.6  0.31] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.33 0.46 0.6  0.38] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.33 0.46 0.6  0.31] sorted [2 1 0]\n",
      "first state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.52 0.45 0.14 0.41] sorted [0 1 3]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [0 0 1 0] state_WI [0.52 0.45 0.14 0.41] sorted [0 1 3]\n",
      "   state [0 0 1 1] state_WI [0.52 0.45 0.14 0.43] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [0.4  0.3  0.14 0.41] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "instance 6, ep 1, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.4  0.45 0.14 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "instance 6, ep 2, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [0.4  0.3  0.14 0.41] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [0.4  0.45 0.14 0.43] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [0.4  0.45 0.14 0.43] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [0.4  0.3  0.14 0.41] sorted [3 0 1]\n",
      "instance 6, ep 3, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [0.4  0.45 0.14 0.43] sorted [1 3 0]\n",
      "   state [1 0 1 0] state_WI [0.4  0.45 0.14 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.52 0.3  0.14 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.52 0.3  0.14 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "instance 6, ep 4, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.4  0.3  0.14 0.41] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [0.4  0.3  0.14 0.41] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.52 0.3  0.14 0.43] sorted [0 3 1]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "instance 6, ep 5, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.52 0.45 0.14 0.41] sorted [0 1 3]\n",
      "   state [0 0 1 0] state_WI [0.52 0.45 0.14 0.41] sorted [0 1 3]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "instance 6, ep 6, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 1 0] state_WI [0.52 0.3  0.14 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "instance 6, ep 7, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [0.4  0.3  0.14 0.41] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [0 1 1 0] state_WI [0.52 0.3  0.14 0.41] sorted [0 3 1]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.52 0.3  0.14 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "instance 6, ep 8, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "instance 6, ep 9, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.4  0.45 0.14 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "instance 6, ep 10, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "instance 6, ep 11, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 1 1] state_WI [0.52 0.3  0.14 0.43] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 1 1] state_WI [0.52 0.3  0.14 0.43] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [0.4  0.45 0.14 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "instance 6, ep 12, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.4  0.3  0.14 0.41] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [0.4  0.45 0.14 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 0 1 0] state_WI [0.52 0.45 0.14 0.41] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [0.4  0.3  0.14 0.41] sorted [3 0 1]\n",
      "   state [0 0 1 1] state_WI [0.52 0.45 0.14 0.43] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "instance 6, ep 13, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 0 1 1] state_WI [0.52 0.45 0.14 0.43] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "instance 6, ep 14, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 0 1 1] state_WI [0.4  0.45 0.14 0.43] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "instance 6, ep 15, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.4  0.3  0.14 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 1 1] state_WI [0.52 0.3  0.14 0.43] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "instance 6, ep 16, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.52 0.45 0.14 0.43] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "instance 6, ep 17, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 1 1] state_WI [0.52 0.3  0.14 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "instance 6, ep 18, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [0.4  0.45 0.14 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 0 1 0] state_WI [0.4  0.45 0.14 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "instance 6, ep 19, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [0.4  0.3  0.14 0.41] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.52 0.3  0.14 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "instance 6, ep 20, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [0.4  0.3  0.14 0.41] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.52 0.3  0.14 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "instance 6, ep 21, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 1 1] state_WI [0.52 0.3  0.14 0.43] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "instance 6, ep 22, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.52 0.45 0.14 0.41] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [0.4  0.45 0.14 0.43] sorted [1 3 0]\n",
      "   state [0 0 1 1] state_WI [0.52 0.45 0.14 0.43] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 0 1 1] state_WI [0.52 0.45 0.14 0.43] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "instance 6, ep 23, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 0 1 1] state_WI [0.4  0.45 0.14 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "instance 6, ep 24, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.4  0.45 0.14 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [0.4  0.45 0.14 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "instance 6, ep 25, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.52 0.3  0.14 0.43] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "instance 6, ep 26, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [0.4  0.45 0.14 0.43] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "instance 6, ep 27, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.52 0.45 0.14 0.43] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "instance 6, ep 28, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.4  0.3  0.14 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [0.4  0.3  0.24 0.41] sorted [3 0 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [0.4  0.45 0.24 0.41] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.52 0.45 0.24 0.41] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.52 0.45 0.24 0.43] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "instance 6, ep 29, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.4  0.45 0.14 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [0.4  0.45 0.14 0.43] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.52 0.3  0.24 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.52 0.3  0.24 0.43] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [0.4  0.45 0.24 0.43] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.4  0.3  0.24 0.43] sorted [3 0 1]\n",
      "first state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.38 0.54 0.3  0.47] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 1, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 2, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 3, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 4, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 1 0] state_WI [0.37 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 5, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 6, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 0 1 0] state_WI [0.38 0.54 0.3  0.47] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 1 1] state_WI [0.37 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 7, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.38 0.54 0.3  0.47] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "instance 7, ep 8, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 1 1] state_WI [0.37 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "instance 7, ep 9, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 0 1 1] state_WI [0.37 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 10, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 11, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.37 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 1 0] state_WI [0.37 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 12, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 1 0] state_WI [0.37 0.54 0.3  0.47] sorted [1 3 0]\n",
      "   state [0 0 1 1] state_WI [0.37 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 13, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [1 0 1 0] state_WI [0.38 0.54 0.3  0.47] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "instance 7, ep 14, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.37 0.54 0.3  0.47] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 15, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 1 1 0] state_WI [0.37 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [0 1 1 0] state_WI [0.37 0.47 0.3  0.47] sorted [3 1 0]\n",
      "instance 7, ep 16, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "instance 7, ep 17, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.37 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 18, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 19, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 1 1] state_WI [0.37 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "instance 7, ep 20, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "instance 7, ep 21, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "instance 7, ep 22, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.38 0.54 0.3  0.47] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "instance 7, ep 23, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "instance 7, ep 24, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 0 1 0] state_WI [0.37 0.54 0.3  0.47] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 25, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 1 0] state_WI [0.38 0.54 0.3  0.47] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 1 0] state_WI [0.38 0.54 0.3  0.47] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 26, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 1 1] state_WI [0.37 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 27, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.38 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 28, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [0 1 1 0] state_WI [0.37 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [0.38 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 1 1] state_WI [0.37 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.38 0.54 0.33 0.47] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "instance 7, ep 29, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.37 0.47 0.3  0.47] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [0 0 1 1] state_WI [0.37 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [0.38 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [0.38 0.54 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.38 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.38 0.47 0.33 0.47] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 0.47 0.3  0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.54 0.33 0.39] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.38 0.47 0.33 0.39] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 0.47 0.33 0.39] sorted [1 3 0]\n",
      "first state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [0 0 0 0] state_WI [0.84 0.45 0.54 0.91] sorted [3 0 2]\n",
      "instance 8, ep 1, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 0] state_WI [0.33 0.45 0.54 0.91] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "instance 8, ep 2, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.84 0.45 0.47 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 0] state_WI [0.84 0.45 0.47 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [0 0 1 0] state_WI [0.84 0.45 0.47 0.91] sorted [3 0 2]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "instance 8, ep 3, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 0 1 0] state_WI [0.84 0.45 0.47 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 1 0 0] state_WI [0.84 0.3  0.54 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "instance 8, ep 4, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [0.33 0.45 0.54 0.91] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "instance 8, ep 5, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 0 0 0] state_WI [0.33 0.45 0.54 0.91] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "instance 8, ep 6, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.84 0.45 0.54 0.29] sorted [0 2 1]\n",
      "   state [0 1 0 0] state_WI [0.84 0.3  0.54 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "instance 8, ep 7, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 0 0 0] state_WI [0.33 0.45 0.54 0.91] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.84 0.45 0.54 0.29] sorted [0 2 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "instance 8, ep 8, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.84 0.45 0.54 0.29] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "instance 8, ep 9, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.33 0.45 0.54 0.91] sorted [3 2 1]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.84 0.45 0.54 0.29] sorted [0 2 1]\n",
      "   state [1 0 0 0] state_WI [0.33 0.45 0.54 0.91] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "instance 8, ep 10, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [0.33 0.45 0.54 0.91] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.84 0.45 0.54 0.29] sorted [0 2 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 1 0 0] state_WI [0.84 0.3  0.54 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "instance 8, ep 11, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 0 0 0] state_WI [0.84 0.45 0.54 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "instance 8, ep 12, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "instance 8, ep 13, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 0 0] state_WI [0.33 0.45 0.54 0.91] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "instance 8, ep 14, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.84 0.45 0.54 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "instance 8, ep 15, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [0 0 0 1] state_WI [0.84 0.45 0.54 0.29] sorted [0 2 1]\n",
      "   state [1 0 0 0] state_WI [0.33 0.45 0.54 0.91] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "instance 8, ep 16, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 0 0 0] state_WI [0.33 0.45 0.54 0.91] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [0.33 0.45 0.54 0.91] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "instance 8, ep 17, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.84 0.45 0.47 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [0 0 0 1] state_WI [0.84 0.45 0.54 0.29] sorted [0 2 1]\n",
      "instance 8, ep 18, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.84 0.45 0.54 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "instance 8, ep 19, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [0 0 0 1] state_WI [0.84 0.45 0.54 0.29] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "instance 8, ep 20, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [0.33 0.45 0.54 0.91] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "instance 8, ep 21, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.84 0.45 0.47 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "instance 8, ep 22, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "instance 8, ep 23, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [0.33 0.45 0.54 0.91] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "instance 8, ep 24, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 1 0 0] state_WI [0.84 0.3  0.54 0.91] sorted [3 0 2]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [0 0 0 0] state_WI [0.84 0.45 0.54 0.91] sorted [3 0 2]\n",
      "instance 8, ep 25, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.84 0.45 0.54 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [0.33 0.45 0.54 0.91] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [0 0 1 0] state_WI [0.84 0.45 0.47 0.91] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.84 0.45 0.54 0.29] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.84 0.45 0.47 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "instance 8, ep 26, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [0 0 0 1] state_WI [0.84 0.45 0.54 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "instance 8, ep 27, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 0 0 0] state_WI [0.33 0.45 0.54 0.91] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 0] state_WI [0.84 0.45 0.47 0.91] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [0 0 1 0] state_WI [0.84 0.45 0.47 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "instance 8, ep 28, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 0 0] state_WI [0.33 0.3  0.54 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [0.33 0.3  0.54 0.29] sorted [2 0 1]\n",
      "   state [0 0 0 1] state_WI [0.84 0.45 0.54 0.29] sorted [0 2 1]\n",
      "instance 8, ep 29, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.84 0.45 0.54 0.91] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.84 0.3  0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.84 0.45 0.47 0.29] sorted [0 2 1]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [0.33 0.3  0.47 0.91] sorted [3 2 0]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [0 1 0 1] state_WI [0.84 0.3  0.54 0.29] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.84 0.3  0.47 0.91] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [0.33 0.45 0.47 0.29] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [0.33 0.45 0.54 0.29] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [0.33 0.45 0.47 0.91] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [0.33 0.3  0.47 0.29] sorted [2 0 1]\n",
      "first state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "instance 9, ep 1, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 0 1 1] state_WI [0.42 0.84 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "instance 9, ep 2, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.42 0.84 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 0 0 0] state_WI [0.42 0.84 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "instance 9, ep 3, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "instance 9, ep 4, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.42 0.84 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "instance 9, ep 5, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 0 1 1] state_WI [0.42 0.84 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "instance 9, ep 6, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [0 0 1 0] state_WI [0.42 0.84 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "instance 9, ep 7, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 0 0 0] state_WI [0.42 0.84 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 0 1 0] state_WI [0.34 0.84 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 0 1 1] state_WI [0.34 0.84 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 0 1 1] state_WI [0.42 0.84 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "instance 9, ep 8, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 0 1 0] state_WI [0.34 0.84 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "instance 9, ep 9, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.34 0.84 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "instance 9, ep 10, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 0 0 0] state_WI [0.42 0.84 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "instance 9, ep 11, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "instance 9, ep 12, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "instance 9, ep 13, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [0.34 0.84 0.36 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.42 0.84 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 0 1 0] state_WI [0.42 0.84 0.36 0.41] sorted [1 0 3]\n",
      "instance 9, ep 14, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 0 1 0] state_WI [0.42 0.84 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "instance 9, ep 15, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "instance 9, ep 16, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 0 1 0] state_WI [0.42 0.84 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "instance 9, ep 17, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 0 1 1] state_WI [0.42 0.84 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 0 1 1] state_WI [0.42 0.84 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "instance 9, ep 18, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "instance 9, ep 19, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 0 1 1] state_WI [0.34 0.84 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 0 1 1] state_WI [0.42 0.84 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "instance 9, ep 20, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 0 0 0] state_WI [0.42 0.84 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "instance 9, ep 21, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "instance 9, ep 22, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "instance 9, ep 23, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "instance 9, ep 24, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "instance 9, ep 25, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "instance 9, ep 26, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 0 1 0] state_WI [0.42 0.84 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 0 1 1] state_WI [0.42 0.84 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 0 1 1] state_WI [0.34 0.84 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "instance 9, ep 27, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.42 0.84 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "instance 9, ep 28, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 0 1 0] state_WI [0.42 0.84 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 0 0 1] state_WI [0.42 0.84 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [0.34 0.44 0.36 0.41] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "instance 9, ep 29, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [0.34 0.84 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 0 1 0] state_WI [0.42 0.84 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [0.34 0.84 0.39 0.41] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [0.34 0.44 0.39 0.41] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.42 0.44 0.36 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.42 0.44 0.39 0.41] sorted [1 0 3]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [0.34 0.44 0.36 0.42] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.42 0.44 0.36 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [0.34 0.44 0.39 0.42] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.42 0.44 0.39 0.42] sorted [1 3 0]\n"
     ]
    }
   ],
   "source": [
    "np.random.seed(seed)\n",
    "random.seed(seed)\n",
    "optimal_reward = optimal_whittle(simulator, n_episodes, n_epochs, discount)\n",
    "optimal_active_rate = simulator.total_active/(optimal_reward.size*n_arms)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "first state [0 1 1 1]\n",
      "instance 0, ep 1, state [1 1 1 1]\n",
      "instance 0, ep 2, state [0 0 0 1]\n",
      "instance 0, ep 3, state [1 1 0 1]\n",
      "instance 0, ep 4, state [0 1 1 1]\n",
      "instance 0, ep 5, state [0 0 0 1]\n",
      "instance 0, ep 6, state [0 0 0 1]\n",
      "instance 0, ep 7, state [0 1 1 0]\n",
      "instance 0, ep 8, state [1 1 0 1]\n",
      "instance 0, ep 9, state [1 1 1 1]\n",
      "instance 0, ep 10, state [0 0 0 0]\n",
      "instance 0, ep 11, state [0 1 0 0]\n",
      "instance 0, ep 12, state [0 1 0 1]\n",
      "instance 0, ep 13, state [0 0 0 0]\n",
      "instance 0, ep 14, state [1 0 1 0]\n",
      "instance 0, ep 15, state [0 0 0 1]\n",
      "instance 0, ep 16, state [0 0 0 0]\n",
      "instance 0, ep 17, state [1 1 0 1]\n",
      "instance 0, ep 18, state [0 1 0 0]\n",
      "instance 0, ep 19, state [0 1 1 1]\n",
      "instance 0, ep 20, state [0 1 1 0]\n",
      "instance 0, ep 21, state [0 0 1 0]\n",
      "instance 0, ep 22, state [1 0 1 1]\n",
      "instance 0, ep 23, state [0 1 1 1]\n",
      "instance 0, ep 24, state [0 0 1 1]\n",
      "instance 0, ep 25, state [0 0 1 0]\n",
      "instance 0, ep 26, state [1 1 1 1]\n",
      "instance 0, ep 27, state [0 1 1 0]\n",
      "instance 0, ep 28, state [0 1 1 0]\n",
      "instance 0, ep 29, state [1 1 1 1]\n",
      "first state [1 0 0 0]\n",
      "instance 1, ep 1, state [1 0 0 1]\n",
      "instance 1, ep 2, state [0 0 0 0]\n",
      "instance 1, ep 3, state [1 0 1 0]\n",
      "instance 1, ep 4, state [1 0 0 1]\n",
      "instance 1, ep 5, state [1 1 0 0]\n",
      "instance 1, ep 6, state [0 1 0 1]\n",
      "instance 1, ep 7, state [0 1 0 1]\n",
      "instance 1, ep 8, state [0 0 1 0]\n",
      "instance 1, ep 9, state [0 1 1 0]\n",
      "instance 1, ep 10, state [0 0 1 0]\n",
      "instance 1, ep 11, state [0 0 0 1]\n",
      "instance 1, ep 12, state [0 1 0 0]\n",
      "instance 1, ep 13, state [0 0 1 1]\n",
      "instance 1, ep 14, state [1 1 0 1]\n",
      "instance 1, ep 15, state [0 1 0 0]\n",
      "instance 1, ep 16, state [0 0 0 0]\n",
      "instance 1, ep 17, state [1 0 0 1]\n",
      "instance 1, ep 18, state [1 0 0 1]\n",
      "instance 1, ep 19, state [0 1 1 0]\n",
      "instance 1, ep 20, state [0 1 1 1]\n",
      "instance 1, ep 21, state [1 1 1 1]\n",
      "instance 1, ep 22, state [1 1 1 1]\n",
      "instance 1, ep 23, state [1 0 1 1]\n",
      "instance 1, ep 24, state [1 1 1 0]\n",
      "instance 1, ep 25, state [0 0 0 0]\n",
      "instance 1, ep 26, state [1 0 1 0]\n",
      "instance 1, ep 27, state [1 0 0 0]\n",
      "instance 1, ep 28, state [1 0 1 0]\n",
      "instance 1, ep 29, state [0 1 1 0]\n",
      "first state [1 0 0 1]\n",
      "instance 2, ep 1, state [0 1 0 1]\n",
      "instance 2, ep 2, state [0 1 1 1]\n",
      "instance 2, ep 3, state [0 1 1 1]\n",
      "instance 2, ep 4, state [1 1 0 1]\n",
      "instance 2, ep 5, state [1 1 0 0]\n",
      "instance 2, ep 6, state [1 1 0 1]\n",
      "instance 2, ep 7, state [0 0 0 0]\n",
      "instance 2, ep 8, state [1 0 1 1]\n",
      "instance 2, ep 9, state [1 1 0 1]\n",
      "instance 2, ep 10, state [1 0 1 1]\n",
      "instance 2, ep 11, state [1 1 1 0]\n",
      "instance 2, ep 12, state [1 1 0 0]\n",
      "instance 2, ep 13, state [0 1 1 0]\n",
      "instance 2, ep 14, state [1 0 1 1]\n",
      "instance 2, ep 15, state [1 0 0 0]\n",
      "instance 2, ep 16, state [0 1 1 1]\n",
      "instance 2, ep 17, state [1 1 1 1]\n",
      "instance 2, ep 18, state [1 0 0 0]\n",
      "instance 2, ep 19, state [1 1 0 1]\n",
      "instance 2, ep 20, state [1 0 0 1]\n",
      "instance 2, ep 21, state [1 1 1 1]\n",
      "instance 2, ep 22, state [1 1 1 0]\n",
      "instance 2, ep 23, state [0 0 1 1]\n",
      "instance 2, ep 24, state [1 0 0 0]\n",
      "instance 2, ep 25, state [0 1 0 0]\n",
      "instance 2, ep 26, state [1 0 1 1]\n",
      "instance 2, ep 27, state [0 1 1 1]\n",
      "instance 2, ep 28, state [0 1 0 0]\n",
      "instance 2, ep 29, state [0 1 0 0]\n",
      "first state [0 1 1 0]\n",
      "instance 3, ep 1, state [1 1 0 0]\n",
      "instance 3, ep 2, state [0 0 0 0]\n",
      "instance 3, ep 3, state [0 0 1 0]\n",
      "instance 3, ep 4, state [1 0 1 0]\n",
      "instance 3, ep 5, state [0 1 1 1]\n",
      "instance 3, ep 6, state [0 0 1 1]\n",
      "instance 3, ep 7, state [1 1 0 1]\n",
      "instance 3, ep 8, state [0 0 0 1]\n",
      "instance 3, ep 9, state [0 0 1 0]\n",
      "instance 3, ep 10, state [1 0 0 1]\n",
      "instance 3, ep 11, state [0 0 0 0]\n",
      "instance 3, ep 12, state [1 0 1 0]\n",
      "instance 3, ep 13, state [1 1 1 0]\n",
      "instance 3, ep 14, state [0 0 1 1]\n",
      "instance 3, ep 15, state [1 0 1 1]\n",
      "instance 3, ep 16, state [0 0 1 1]\n",
      "instance 3, ep 17, state [1 0 1 0]\n",
      "instance 3, ep 18, state [0 0 1 1]\n",
      "instance 3, ep 19, state [1 0 1 0]\n",
      "instance 3, ep 20, state [1 0 0 0]\n",
      "instance 3, ep 21, state [0 1 1 0]\n",
      "instance 3, ep 22, state [1 0 1 1]\n",
      "instance 3, ep 23, state [1 0 1 1]\n",
      "instance 3, ep 24, state [0 0 1 1]\n",
      "instance 3, ep 25, state [1 1 1 0]\n",
      "instance 3, ep 26, state [0 0 1 0]\n",
      "instance 3, ep 27, state [1 1 1 0]\n",
      "instance 3, ep 28, state [1 0 1 0]\n",
      "instance 3, ep 29, state [0 1 0 0]\n",
      "first state [0 1 0 1]\n",
      "instance 4, ep 1, state [0 0 0 0]\n",
      "instance 4, ep 2, state [1 0 1 0]\n",
      "instance 4, ep 3, state [1 0 0 1]\n",
      "instance 4, ep 4, state [0 0 1 1]\n",
      "instance 4, ep 5, state [0 0 1 0]\n",
      "instance 4, ep 6, state [0 0 1 1]\n",
      "instance 4, ep 7, state [0 0 0 1]\n",
      "instance 4, ep 8, state [0 0 1 0]\n",
      "instance 4, ep 9, state [1 0 0 0]\n",
      "instance 4, ep 10, state [1 1 1 0]\n",
      "instance 4, ep 11, state [1 0 0 1]\n",
      "instance 4, ep 12, state [0 0 0 0]\n",
      "instance 4, ep 13, state [0 1 0 1]\n",
      "instance 4, ep 14, state [1 0 0 0]\n",
      "instance 4, ep 15, state [1 0 1 0]\n",
      "instance 4, ep 16, state [1 0 0 1]\n",
      "instance 4, ep 17, state [1 0 1 0]\n",
      "instance 4, ep 18, state [1 1 0 0]\n",
      "instance 4, ep 19, state [0 1 1 0]\n",
      "instance 4, ep 20, state [0 1 1 1]\n",
      "instance 4, ep 21, state [0 0 0 1]\n",
      "instance 4, ep 22, state [0 1 0 1]\n",
      "instance 4, ep 23, state [1 1 0 0]\n",
      "instance 4, ep 24, state [0 1 1 1]\n",
      "instance 4, ep 25, state [1 1 0 1]\n",
      "instance 4, ep 26, state [0 0 1 0]\n",
      "instance 4, ep 27, state [0 1 0 1]\n",
      "instance 4, ep 28, state [0 0 0 0]\n",
      "instance 4, ep 29, state [1 0 1 0]\n",
      "first state [0 1 1 1]\n",
      "instance 5, ep 1, state [0 0 1 0]\n",
      "instance 5, ep 2, state [1 1 1 1]\n",
      "instance 5, ep 3, state [1 0 1 0]\n",
      "instance 5, ep 4, state [0 1 1 1]\n",
      "instance 5, ep 5, state [1 0 0 1]\n",
      "instance 5, ep 6, state [0 0 0 0]\n",
      "instance 5, ep 7, state [0 0 0 0]\n",
      "instance 5, ep 8, state [1 0 0 1]\n",
      "instance 5, ep 9, state [0 1 1 0]\n",
      "instance 5, ep 10, state [0 1 1 0]\n",
      "instance 5, ep 11, state [1 0 1 0]\n",
      "instance 5, ep 12, state [1 1 1 1]\n",
      "instance 5, ep 13, state [0 0 0 0]\n",
      "instance 5, ep 14, state [1 0 0 1]\n",
      "instance 5, ep 15, state [1 1 1 0]\n",
      "instance 5, ep 16, state [0 1 1 0]\n",
      "instance 5, ep 17, state [1 0 0 1]\n",
      "instance 5, ep 18, state [1 1 0 1]\n",
      "instance 5, ep 19, state [0 0 1 1]\n",
      "instance 5, ep 20, state [1 1 1 1]\n",
      "instance 5, ep 21, state [0 0 0 0]\n",
      "instance 5, ep 22, state [1 0 0 0]\n",
      "instance 5, ep 23, state [1 0 1 0]\n",
      "instance 5, ep 24, state [0 1 1 0]\n",
      "instance 5, ep 25, state [1 1 0 1]\n",
      "instance 5, ep 26, state [1 1 1 1]\n",
      "instance 5, ep 27, state [1 1 1 1]\n",
      "instance 5, ep 28, state [1 1 0 1]\n",
      "instance 5, ep 29, state [1 0 1 0]\n",
      "first state [0 0 1 0]\n",
      "instance 6, ep 1, state [1 0 1 0]\n",
      "instance 6, ep 2, state [1 1 1 1]\n",
      "instance 6, ep 3, state [1 1 0 0]\n",
      "instance 6, ep 4, state [1 1 1 0]\n",
      "instance 6, ep 5, state [0 0 1 0]\n",
      "instance 6, ep 6, state [0 0 0 1]\n",
      "instance 6, ep 7, state [0 1 0 0]\n",
      "instance 6, ep 8, state [0 0 0 0]\n",
      "instance 6, ep 9, state [1 0 1 1]\n",
      "instance 6, ep 10, state [1 0 0 0]\n",
      "instance 6, ep 11, state [0 1 0 0]\n",
      "instance 6, ep 12, state [1 1 1 0]\n",
      "instance 6, ep 13, state [0 1 0 0]\n",
      "instance 6, ep 14, state [0 0 0 0]\n",
      "instance 6, ep 15, state [1 1 1 0]\n",
      "instance 6, ep 16, state [0 0 1 1]\n",
      "instance 6, ep 17, state [0 1 0 1]\n",
      "instance 6, ep 18, state [1 1 1 1]\n",
      "instance 6, ep 19, state [0 1 0 1]\n",
      "instance 6, ep 20, state [1 1 0 1]\n",
      "instance 6, ep 21, state [1 1 0 0]\n",
      "instance 6, ep 22, state [0 0 1 0]\n",
      "instance 6, ep 23, state [1 0 0 1]\n",
      "instance 6, ep 24, state [1 0 1 1]\n",
      "instance 6, ep 25, state [0 1 1 1]\n",
      "instance 6, ep 26, state [0 1 0 0]\n",
      "instance 6, ep 27, state [0 0 1 1]\n",
      "instance 6, ep 28, state [1 0 0 0]\n",
      "instance 6, ep 29, state [1 0 1 1]\n",
      "first state [1 0 1 0]\n",
      "instance 7, ep 1, state [1 0 0 0]\n",
      "instance 7, ep 2, state [1 0 1 1]\n",
      "instance 7, ep 3, state [0 1 0 1]\n",
      "instance 7, ep 4, state [0 1 1 1]\n",
      "instance 7, ep 5, state [1 0 1 1]\n",
      "instance 7, ep 6, state [1 0 1 1]\n",
      "instance 7, ep 7, state [1 0 1 0]\n",
      "instance 7, ep 8, state [1 0 1 1]\n",
      "instance 7, ep 9, state [0 1 0 1]\n",
      "instance 7, ep 10, state [1 1 1 1]\n",
      "instance 7, ep 11, state [0 0 1 1]\n",
      "instance 7, ep 12, state [1 1 0 1]\n",
      "instance 7, ep 13, state [0 1 0 0]\n",
      "instance 7, ep 14, state [0 0 1 0]\n",
      "instance 7, ep 15, state [0 0 0 0]\n",
      "instance 7, ep 16, state [0 1 1 1]\n",
      "instance 7, ep 17, state [0 0 1 1]\n",
      "instance 7, ep 18, state [0 0 0 0]\n",
      "instance 7, ep 19, state [0 1 1 1]\n",
      "instance 7, ep 20, state [1 1 1 1]\n",
      "instance 7, ep 21, state [0 0 0 1]\n",
      "instance 7, ep 22, state [1 0 1 0]\n",
      "instance 7, ep 23, state [1 0 0 0]\n",
      "instance 7, ep 24, state [0 0 0 1]\n",
      "instance 7, ep 25, state [1 0 1 1]\n",
      "instance 7, ep 26, state [0 0 0 0]\n",
      "instance 7, ep 27, state [1 0 1 1]\n",
      "instance 7, ep 28, state [0 1 0 1]\n",
      "instance 7, ep 29, state [0 1 1 0]\n",
      "first state [0 0 1 1]\n",
      "instance 8, ep 1, state [0 1 0 1]\n",
      "instance 8, ep 2, state [0 0 1 0]\n",
      "instance 8, ep 3, state [1 1 1 0]\n",
      "instance 8, ep 4, state [0 0 1 1]\n",
      "instance 8, ep 5, state [1 1 1 1]\n",
      "instance 8, ep 6, state [0 1 0 1]\n",
      "instance 8, ep 7, state [1 1 0 0]\n",
      "instance 8, ep 8, state [0 0 0 1]\n",
      "instance 8, ep 9, state [1 0 0 0]\n",
      "instance 8, ep 10, state [1 1 1 0]\n",
      "instance 8, ep 11, state [1 1 0 1]\n",
      "instance 8, ep 12, state [0 1 0 1]\n",
      "instance 8, ep 13, state [1 1 1 0]\n",
      "instance 8, ep 14, state [0 0 0 1]\n",
      "instance 8, ep 15, state [0 1 1 1]\n",
      "instance 8, ep 16, state [0 1 1 0]\n",
      "instance 8, ep 17, state [1 1 0 1]\n",
      "instance 8, ep 18, state [0 0 0 0]\n",
      "instance 8, ep 19, state [0 0 1 1]\n",
      "instance 8, ep 20, state [1 0 0 1]\n",
      "instance 8, ep 21, state [0 0 1 0]\n",
      "instance 8, ep 22, state [1 1 0 0]\n",
      "instance 8, ep 23, state [1 0 0 1]\n",
      "instance 8, ep 24, state [0 1 1 0]\n",
      "instance 8, ep 25, state [0 0 0 0]\n",
      "instance 8, ep 26, state [1 0 1 1]\n",
      "instance 8, ep 27, state [1 1 0 1]\n",
      "instance 8, ep 28, state [1 0 0 1]\n",
      "instance 8, ep 29, state [0 0 0 0]\n",
      "first state [1 1 1 0]\n",
      "instance 9, ep 1, state [1 1 0 0]\n",
      "instance 9, ep 2, state [0 0 1 0]\n",
      "instance 9, ep 3, state [1 0 0 0]\n",
      "instance 9, ep 4, state [0 0 1 1]\n",
      "instance 9, ep 5, state [1 0 0 0]\n",
      "instance 9, ep 6, state [1 0 0 1]\n",
      "instance 9, ep 7, state [0 0 0 1]\n",
      "instance 9, ep 8, state [1 0 0 1]\n",
      "instance 9, ep 9, state [1 0 1 0]\n",
      "instance 9, ep 10, state [1 1 0 1]\n",
      "instance 9, ep 11, state [1 1 0 0]\n",
      "instance 9, ep 12, state [0 1 0 1]\n",
      "instance 9, ep 13, state [1 0 1 0]\n",
      "instance 9, ep 14, state [1 0 0 0]\n",
      "instance 9, ep 15, state [0 1 1 1]\n",
      "instance 9, ep 16, state [0 0 0 1]\n",
      "instance 9, ep 17, state [1 0 0 1]\n",
      "instance 9, ep 18, state [1 1 1 0]\n",
      "instance 9, ep 19, state [0 1 1 0]\n",
      "instance 9, ep 20, state [1 1 1 1]\n",
      "instance 9, ep 21, state [0 1 1 1]\n",
      "instance 9, ep 22, state [1 1 0 1]\n",
      "instance 9, ep 23, state [1 1 1 1]\n",
      "instance 9, ep 24, state [0 1 0 0]\n",
      "instance 9, ep 25, state [1 1 0 0]\n",
      "instance 9, ep 26, state [1 0 0 0]\n",
      "instance 9, ep 27, state [0 0 0 0]\n",
      "instance 9, ep 28, state [1 1 1 0]\n",
      "instance 9, ep 29, state [0 1 0 0]\n"
     ]
    }
   ],
   "source": [
    "np.random.seed(seed)\n",
    "random.seed(seed)\n",
    "zero_step_rewards = myopic_match_n_step(simulator, n_episodes, n_epochs, discount,0)\n",
    "zero_step_active_rate = simulator.total_active/(zero_step_rewards.size*n_arms)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "first state [0 1 1 1]\n",
      "instance 0, ep 1, state [1 1 1 1]\n",
      "instance 0, ep 2, state [0 0 0 1]\n",
      "instance 0, ep 3, state [1 1 0 1]\n",
      "instance 0, ep 4, state [0 1 1 1]\n",
      "instance 0, ep 5, state [0 0 0 1]\n",
      "instance 0, ep 6, state [0 0 0 1]\n",
      "instance 0, ep 7, state [0 1 1 0]\n",
      "instance 0, ep 8, state [1 1 0 1]\n",
      "instance 0, ep 9, state [1 1 1 1]\n",
      "instance 0, ep 10, state [0 0 0 0]\n",
      "instance 0, ep 11, state [0 1 0 0]\n",
      "instance 0, ep 12, state [0 1 0 1]\n",
      "instance 0, ep 13, state [0 0 0 0]\n",
      "instance 0, ep 14, state [1 0 1 0]\n",
      "instance 0, ep 15, state [0 0 0 1]\n",
      "instance 0, ep 16, state [0 0 0 0]\n",
      "instance 0, ep 17, state [1 1 0 1]\n",
      "instance 0, ep 18, state [0 1 0 0]\n",
      "instance 0, ep 19, state [0 1 1 1]\n",
      "instance 0, ep 20, state [0 1 1 0]\n",
      "instance 0, ep 21, state [0 0 1 0]\n",
      "instance 0, ep 22, state [1 0 1 1]\n",
      "instance 0, ep 23, state [0 1 1 1]\n",
      "instance 0, ep 24, state [0 0 1 1]\n",
      "instance 0, ep 25, state [0 0 1 0]\n",
      "instance 0, ep 26, state [1 1 1 1]\n",
      "instance 0, ep 27, state [0 1 1 0]\n",
      "instance 0, ep 28, state [0 1 1 0]\n",
      "instance 0, ep 29, state [1 1 1 1]\n",
      "first state [1 0 0 0]\n",
      "instance 1, ep 1, state [1 0 0 1]\n",
      "instance 1, ep 2, state [0 0 0 0]\n",
      "instance 1, ep 3, state [1 0 1 0]\n",
      "instance 1, ep 4, state [1 0 0 1]\n",
      "instance 1, ep 5, state [1 1 0 0]\n",
      "instance 1, ep 6, state [0 1 0 1]\n",
      "instance 1, ep 7, state [0 1 0 1]\n",
      "instance 1, ep 8, state [0 0 1 0]\n",
      "instance 1, ep 9, state [0 1 1 0]\n",
      "instance 1, ep 10, state [0 0 1 0]\n",
      "instance 1, ep 11, state [0 0 0 1]\n",
      "instance 1, ep 12, state [0 1 0 0]\n",
      "instance 1, ep 13, state [0 0 1 1]\n",
      "instance 1, ep 14, state [1 1 0 1]\n",
      "instance 1, ep 15, state [0 1 0 0]\n",
      "instance 1, ep 16, state [0 0 0 0]\n",
      "instance 1, ep 17, state [1 0 0 1]\n",
      "instance 1, ep 18, state [1 0 0 1]\n",
      "instance 1, ep 19, state [0 1 1 0]\n",
      "instance 1, ep 20, state [0 1 1 1]\n",
      "instance 1, ep 21, state [1 1 1 1]\n",
      "instance 1, ep 22, state [1 1 1 1]\n",
      "instance 1, ep 23, state [1 0 1 1]\n",
      "instance 1, ep 24, state [1 1 1 0]\n",
      "instance 1, ep 25, state [0 0 0 0]\n",
      "instance 1, ep 26, state [1 0 1 0]\n",
      "instance 1, ep 27, state [1 0 0 0]\n",
      "instance 1, ep 28, state [1 0 1 0]\n",
      "instance 1, ep 29, state [0 1 1 0]\n",
      "first state [1 0 0 1]\n",
      "instance 2, ep 1, state [0 1 0 1]\n",
      "instance 2, ep 2, state [0 1 1 1]\n",
      "instance 2, ep 3, state [0 1 1 1]\n",
      "instance 2, ep 4, state [1 1 0 1]\n",
      "instance 2, ep 5, state [1 1 0 0]\n",
      "instance 2, ep 6, state [1 1 0 1]\n",
      "instance 2, ep 7, state [0 0 0 0]\n",
      "instance 2, ep 8, state [1 0 1 1]\n",
      "instance 2, ep 9, state [1 1 0 1]\n",
      "instance 2, ep 10, state [1 0 1 1]\n",
      "instance 2, ep 11, state [1 1 1 0]\n",
      "instance 2, ep 12, state [1 1 0 0]\n",
      "instance 2, ep 13, state [0 1 1 0]\n",
      "instance 2, ep 14, state [1 0 1 1]\n",
      "instance 2, ep 15, state [1 0 0 0]\n",
      "instance 2, ep 16, state [0 1 1 1]\n",
      "instance 2, ep 17, state [1 1 1 1]\n",
      "instance 2, ep 18, state [1 0 0 0]\n",
      "instance 2, ep 19, state [1 1 0 1]\n",
      "instance 2, ep 20, state [1 0 0 1]\n",
      "instance 2, ep 21, state [1 1 1 1]\n",
      "instance 2, ep 22, state [1 1 1 0]\n",
      "instance 2, ep 23, state [0 0 1 1]\n",
      "instance 2, ep 24, state [1 0 0 0]\n",
      "instance 2, ep 25, state [0 1 0 0]\n",
      "instance 2, ep 26, state [1 0 1 1]\n",
      "instance 2, ep 27, state [0 1 1 1]\n",
      "instance 2, ep 28, state [0 1 0 0]\n",
      "instance 2, ep 29, state [0 1 0 0]\n",
      "first state [0 1 1 0]\n",
      "instance 3, ep 1, state [1 1 0 0]\n",
      "instance 3, ep 2, state [0 0 0 0]\n",
      "instance 3, ep 3, state [0 0 1 0]\n",
      "instance 3, ep 4, state [1 0 1 0]\n",
      "instance 3, ep 5, state [0 1 1 1]\n",
      "instance 3, ep 6, state [0 0 1 1]\n",
      "instance 3, ep 7, state [1 1 0 1]\n",
      "instance 3, ep 8, state [0 0 0 1]\n",
      "instance 3, ep 9, state [0 0 1 0]\n",
      "instance 3, ep 10, state [1 0 0 1]\n",
      "instance 3, ep 11, state [0 0 0 0]\n",
      "instance 3, ep 12, state [1 0 1 0]\n",
      "instance 3, ep 13, state [1 1 1 0]\n",
      "instance 3, ep 14, state [0 0 1 1]\n",
      "instance 3, ep 15, state [1 0 1 1]\n",
      "instance 3, ep 16, state [0 0 1 1]\n",
      "instance 3, ep 17, state [1 0 1 0]\n",
      "instance 3, ep 18, state [0 0 1 1]\n",
      "instance 3, ep 19, state [1 0 1 0]\n",
      "instance 3, ep 20, state [1 0 0 0]\n",
      "instance 3, ep 21, state [0 1 1 0]\n",
      "instance 3, ep 22, state [1 0 1 1]\n",
      "instance 3, ep 23, state [1 0 1 1]\n",
      "instance 3, ep 24, state [0 0 1 1]\n",
      "instance 3, ep 25, state [1 1 1 0]\n",
      "instance 3, ep 26, state [0 0 1 0]\n",
      "instance 3, ep 27, state [1 1 1 0]\n",
      "instance 3, ep 28, state [1 0 1 0]\n",
      "instance 3, ep 29, state [0 1 0 0]\n",
      "first state [0 1 0 1]\n",
      "instance 4, ep 1, state [0 0 0 0]\n",
      "instance 4, ep 2, state [1 0 1 0]\n",
      "instance 4, ep 3, state [1 0 0 1]\n",
      "instance 4, ep 4, state [0 0 1 1]\n",
      "instance 4, ep 5, state [0 0 1 0]\n",
      "instance 4, ep 6, state [0 0 1 1]\n",
      "instance 4, ep 7, state [0 0 0 1]\n",
      "instance 4, ep 8, state [0 0 1 0]\n",
      "instance 4, ep 9, state [1 0 0 0]\n",
      "instance 4, ep 10, state [1 1 1 0]\n",
      "instance 4, ep 11, state [1 0 0 1]\n",
      "instance 4, ep 12, state [0 0 0 0]\n",
      "instance 4, ep 13, state [0 1 0 1]\n",
      "instance 4, ep 14, state [1 0 0 0]\n",
      "instance 4, ep 15, state [1 0 1 0]\n",
      "instance 4, ep 16, state [1 0 0 1]\n",
      "instance 4, ep 17, state [1 0 1 0]\n",
      "instance 4, ep 18, state [1 1 0 0]\n",
      "instance 4, ep 19, state [0 1 1 0]\n",
      "instance 4, ep 20, state [0 1 1 1]\n",
      "instance 4, ep 21, state [0 0 0 1]\n",
      "instance 4, ep 22, state [0 1 0 1]\n",
      "instance 4, ep 23, state [1 1 0 0]\n",
      "instance 4, ep 24, state [0 1 1 1]\n",
      "instance 4, ep 25, state [1 1 0 1]\n",
      "instance 4, ep 26, state [0 0 1 0]\n",
      "instance 4, ep 27, state [0 1 0 1]\n",
      "instance 4, ep 28, state [0 0 0 0]\n",
      "instance 4, ep 29, state [1 0 1 0]\n",
      "first state [0 1 1 1]\n",
      "instance 5, ep 1, state [0 0 1 0]\n",
      "instance 5, ep 2, state [1 1 1 1]\n",
      "instance 5, ep 3, state [1 0 1 0]\n",
      "instance 5, ep 4, state [0 1 1 1]\n",
      "instance 5, ep 5, state [1 0 0 1]\n",
      "instance 5, ep 6, state [0 0 0 0]\n",
      "instance 5, ep 7, state [0 0 0 0]\n",
      "instance 5, ep 8, state [1 0 0 1]\n",
      "instance 5, ep 9, state [0 1 1 0]\n",
      "instance 5, ep 10, state [0 1 1 0]\n",
      "instance 5, ep 11, state [1 0 1 0]\n",
      "instance 5, ep 12, state [1 1 1 1]\n",
      "instance 5, ep 13, state [0 0 0 0]\n",
      "instance 5, ep 14, state [1 0 0 1]\n",
      "instance 5, ep 15, state [1 1 1 0]\n",
      "instance 5, ep 16, state [0 1 1 0]\n",
      "instance 5, ep 17, state [1 0 0 1]\n",
      "instance 5, ep 18, state [1 1 0 1]\n",
      "instance 5, ep 19, state [0 0 1 1]\n",
      "instance 5, ep 20, state [1 1 1 1]\n",
      "instance 5, ep 21, state [0 0 0 0]\n",
      "instance 5, ep 22, state [1 0 0 0]\n",
      "instance 5, ep 23, state [1 0 1 0]\n",
      "instance 5, ep 24, state [0 1 1 0]\n",
      "instance 5, ep 25, state [1 1 0 1]\n",
      "instance 5, ep 26, state [1 1 1 1]\n",
      "instance 5, ep 27, state [1 1 1 1]\n",
      "instance 5, ep 28, state [1 1 0 1]\n",
      "instance 5, ep 29, state [1 0 1 0]\n",
      "first state [0 0 1 0]\n",
      "instance 6, ep 1, state [1 0 1 0]\n",
      "instance 6, ep 2, state [1 1 1 1]\n",
      "instance 6, ep 3, state [1 1 0 0]\n",
      "instance 6, ep 4, state [1 1 1 0]\n",
      "instance 6, ep 5, state [0 0 1 0]\n",
      "instance 6, ep 6, state [0 0 0 1]\n",
      "instance 6, ep 7, state [0 1 0 0]\n",
      "instance 6, ep 8, state [0 0 0 0]\n",
      "instance 6, ep 9, state [1 0 1 1]\n",
      "instance 6, ep 10, state [1 0 0 0]\n",
      "instance 6, ep 11, state [0 1 0 0]\n",
      "instance 6, ep 12, state [1 1 1 0]\n",
      "instance 6, ep 13, state [0 1 0 0]\n",
      "instance 6, ep 14, state [0 0 0 0]\n",
      "instance 6, ep 15, state [1 1 1 0]\n",
      "instance 6, ep 16, state [0 0 1 1]\n",
      "instance 6, ep 17, state [0 1 0 1]\n",
      "instance 6, ep 18, state [1 1 1 1]\n",
      "instance 6, ep 19, state [0 1 0 1]\n",
      "instance 6, ep 20, state [1 1 0 1]\n",
      "instance 6, ep 21, state [1 1 0 0]\n",
      "instance 6, ep 22, state [0 0 1 0]\n",
      "instance 6, ep 23, state [1 0 0 1]\n",
      "instance 6, ep 24, state [1 0 1 1]\n",
      "instance 6, ep 25, state [0 1 1 1]\n",
      "instance 6, ep 26, state [0 1 0 0]\n",
      "instance 6, ep 27, state [0 0 1 1]\n",
      "instance 6, ep 28, state [1 0 0 0]\n",
      "instance 6, ep 29, state [1 0 1 1]\n",
      "first state [1 0 1 0]\n",
      "instance 7, ep 1, state [1 0 0 0]\n",
      "instance 7, ep 2, state [1 0 1 1]\n",
      "instance 7, ep 3, state [0 1 0 1]\n",
      "instance 7, ep 4, state [0 1 1 1]\n",
      "instance 7, ep 5, state [1 0 1 1]\n",
      "instance 7, ep 6, state [1 0 1 1]\n",
      "instance 7, ep 7, state [1 0 1 0]\n",
      "instance 7, ep 8, state [1 0 1 1]\n",
      "instance 7, ep 9, state [0 1 0 1]\n",
      "instance 7, ep 10, state [1 1 1 1]\n",
      "instance 7, ep 11, state [0 0 1 1]\n",
      "instance 7, ep 12, state [1 1 0 1]\n",
      "instance 7, ep 13, state [0 1 0 0]\n",
      "instance 7, ep 14, state [0 0 1 0]\n",
      "instance 7, ep 15, state [0 0 0 0]\n",
      "instance 7, ep 16, state [0 1 1 1]\n",
      "instance 7, ep 17, state [0 0 1 1]\n",
      "instance 7, ep 18, state [0 0 0 0]\n",
      "instance 7, ep 19, state [0 1 1 1]\n",
      "instance 7, ep 20, state [1 1 1 1]\n",
      "instance 7, ep 21, state [0 0 0 1]\n",
      "instance 7, ep 22, state [1 0 1 0]\n",
      "instance 7, ep 23, state [1 0 0 0]\n",
      "instance 7, ep 24, state [0 0 0 1]\n",
      "instance 7, ep 25, state [1 0 1 1]\n",
      "instance 7, ep 26, state [0 0 0 0]\n",
      "instance 7, ep 27, state [1 0 1 1]\n",
      "instance 7, ep 28, state [0 1 0 1]\n",
      "instance 7, ep 29, state [0 1 1 0]\n",
      "first state [0 0 1 1]\n",
      "instance 8, ep 1, state [0 1 0 1]\n",
      "instance 8, ep 2, state [0 0 1 0]\n",
      "instance 8, ep 3, state [1 1 1 0]\n",
      "instance 8, ep 4, state [0 0 1 1]\n",
      "instance 8, ep 5, state [1 1 1 1]\n",
      "instance 8, ep 6, state [0 1 0 1]\n",
      "instance 8, ep 7, state [1 1 0 0]\n",
      "instance 8, ep 8, state [0 0 0 1]\n",
      "instance 8, ep 9, state [1 0 0 0]\n",
      "instance 8, ep 10, state [1 1 1 0]\n",
      "instance 8, ep 11, state [1 1 0 1]\n",
      "instance 8, ep 12, state [0 1 0 1]\n",
      "instance 8, ep 13, state [1 1 1 0]\n",
      "instance 8, ep 14, state [0 0 0 1]\n",
      "instance 8, ep 15, state [0 1 1 1]\n",
      "instance 8, ep 16, state [0 1 1 0]\n",
      "instance 8, ep 17, state [1 1 0 1]\n",
      "instance 8, ep 18, state [0 0 0 0]\n",
      "instance 8, ep 19, state [0 0 1 1]\n",
      "instance 8, ep 20, state [1 0 0 1]\n",
      "instance 8, ep 21, state [0 0 1 0]\n",
      "instance 8, ep 22, state [1 1 0 0]\n",
      "instance 8, ep 23, state [1 0 0 1]\n",
      "instance 8, ep 24, state [0 1 1 0]\n",
      "instance 8, ep 25, state [0 0 0 0]\n",
      "instance 8, ep 26, state [1 0 1 1]\n",
      "instance 8, ep 27, state [1 1 0 1]\n",
      "instance 8, ep 28, state [1 0 0 1]\n",
      "instance 8, ep 29, state [0 0 0 0]\n",
      "first state [1 1 1 0]\n",
      "instance 9, ep 1, state [1 1 0 0]\n",
      "instance 9, ep 2, state [0 0 1 0]\n",
      "instance 9, ep 3, state [1 0 0 0]\n",
      "instance 9, ep 4, state [0 0 1 1]\n",
      "instance 9, ep 5, state [1 0 0 0]\n",
      "instance 9, ep 6, state [1 0 0 1]\n",
      "instance 9, ep 7, state [0 0 0 1]\n",
      "instance 9, ep 8, state [1 0 0 1]\n",
      "instance 9, ep 9, state [1 0 1 0]\n",
      "instance 9, ep 10, state [1 1 0 1]\n",
      "instance 9, ep 11, state [1 1 0 0]\n",
      "instance 9, ep 12, state [0 1 0 1]\n",
      "instance 9, ep 13, state [1 0 1 0]\n",
      "instance 9, ep 14, state [1 0 0 0]\n",
      "instance 9, ep 15, state [0 1 1 1]\n",
      "instance 9, ep 16, state [0 0 0 1]\n",
      "instance 9, ep 17, state [1 0 0 1]\n",
      "instance 9, ep 18, state [1 1 1 0]\n",
      "instance 9, ep 19, state [0 1 1 0]\n",
      "instance 9, ep 20, state [1 1 1 1]\n",
      "instance 9, ep 21, state [0 1 1 1]\n",
      "instance 9, ep 22, state [1 1 0 1]\n",
      "instance 9, ep 23, state [1 1 1 1]\n",
      "instance 9, ep 24, state [0 1 0 0]\n",
      "instance 9, ep 25, state [1 1 0 0]\n",
      "instance 9, ep 26, state [1 0 0 0]\n",
      "instance 9, ep 27, state [0 0 0 0]\n",
      "instance 9, ep 28, state [1 1 1 0]\n",
      "instance 9, ep 29, state [0 1 0 0]\n"
     ]
    }
   ],
   "source": [
    "# Seed both RNG sources (Python's random module and NumPy) before this run.\n",
    "random.seed(seed)\n",
    "np.random.seed(seed)\n",
    "\n",
    "# The final positional argument is 1 here; presumably the lookahead depth\n",
    "# (number of steps) used by the myopic matching policy -- TODO confirm.\n",
    "one_step_rewards = myopic_match_n_step(\n",
    "    simulator, n_episodes, n_epochs, discount, 1\n",
    ")\n",
    "\n",
    "# Active rate: simulator.total_active divided by (reward entries * n_arms).\n",
    "# NOTE(review): assumes total_active covers only this run -- confirm that the\n",
    "# simulator counter is reset between policy evaluations.\n",
    "one_step_active_rate = simulator.total_active / (\n",
    "    one_step_rewards.size * n_arms\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "first state [0 1 1 1]\n",
      "instance 0, ep 1, state [1 1 1 1]\n",
      "instance 0, ep 2, state [0 0 0 1]\n",
      "instance 0, ep 3, state [1 1 0 1]\n",
      "instance 0, ep 4, state [0 1 1 1]\n",
      "instance 0, ep 5, state [0 0 0 1]\n",
      "instance 0, ep 6, state [0 0 0 1]\n",
      "instance 0, ep 7, state [0 1 1 0]\n",
      "instance 0, ep 8, state [1 1 0 1]\n",
      "instance 0, ep 9, state [1 1 1 1]\n",
      "instance 0, ep 10, state [0 0 0 0]\n",
      "instance 0, ep 11, state [0 1 0 0]\n",
      "instance 0, ep 12, state [0 1 0 1]\n",
      "instance 0, ep 13, state [0 0 0 0]\n",
      "instance 0, ep 14, state [1 0 1 0]\n",
      "instance 0, ep 15, state [0 0 0 1]\n",
      "instance 0, ep 16, state [0 0 0 0]\n",
      "instance 0, ep 17, state [1 1 0 1]\n",
      "instance 0, ep 18, state [0 1 0 0]\n",
      "instance 0, ep 19, state [0 1 1 1]\n",
      "instance 0, ep 20, state [0 1 1 0]\n",
      "instance 0, ep 21, state [0 0 1 0]\n",
      "instance 0, ep 22, state [1 0 1 1]\n",
      "instance 0, ep 23, state [0 1 1 1]\n",
      "instance 0, ep 24, state [0 0 1 1]\n",
      "instance 0, ep 25, state [0 0 1 0]\n",
      "instance 0, ep 26, state [1 1 1 1]\n",
      "instance 0, ep 27, state [0 1 1 0]\n",
      "instance 0, ep 28, state [0 1 1 0]\n",
      "instance 0, ep 29, state [1 1 1 1]\n",
      "first state [1 0 0 0]\n",
      "instance 1, ep 1, state [1 0 0 1]\n",
      "instance 1, ep 2, state [0 0 0 0]\n",
      "instance 1, ep 3, state [1 0 1 0]\n",
      "instance 1, ep 4, state [1 0 0 1]\n",
      "instance 1, ep 5, state [1 1 0 0]\n",
      "instance 1, ep 6, state [0 1 0 1]\n",
      "instance 1, ep 7, state [0 1 0 1]\n",
      "instance 1, ep 8, state [0 0 1 0]\n",
      "instance 1, ep 9, state [0 1 1 0]\n",
      "instance 1, ep 10, state [0 0 1 0]\n",
      "instance 1, ep 11, state [0 0 0 1]\n",
      "instance 1, ep 12, state [0 1 0 0]\n",
      "instance 1, ep 13, state [0 0 1 1]\n",
      "instance 1, ep 14, state [1 1 0 1]\n",
      "instance 1, ep 15, state [0 1 0 0]\n",
      "instance 1, ep 16, state [0 0 0 0]\n",
      "instance 1, ep 17, state [1 0 0 1]\n",
      "instance 1, ep 18, state [1 0 0 1]\n",
      "instance 1, ep 19, state [0 1 1 0]\n",
      "instance 1, ep 20, state [0 1 1 1]\n",
      "instance 1, ep 21, state [1 1 1 1]\n",
      "instance 1, ep 22, state [1 1 1 1]\n",
      "instance 1, ep 23, state [1 0 1 1]\n",
      "instance 1, ep 24, state [1 1 1 0]\n",
      "instance 1, ep 25, state [0 0 0 0]\n",
      "instance 1, ep 26, state [1 0 1 0]\n",
      "instance 1, ep 27, state [1 0 0 0]\n",
      "instance 1, ep 28, state [1 0 1 0]\n",
      "instance 1, ep 29, state [0 1 1 0]\n",
      "first state [1 0 0 1]\n",
      "instance 2, ep 1, state [0 1 0 1]\n",
      "instance 2, ep 2, state [0 1 1 1]\n",
      "instance 2, ep 3, state [0 1 1 1]\n",
      "instance 2, ep 4, state [1 1 0 1]\n",
      "instance 2, ep 5, state [1 1 0 0]\n",
      "instance 2, ep 6, state [1 1 0 1]\n",
      "instance 2, ep 7, state [0 0 0 0]\n",
      "instance 2, ep 8, state [1 0 1 1]\n",
      "instance 2, ep 9, state [1 1 0 1]\n",
      "instance 2, ep 10, state [1 0 1 1]\n",
      "instance 2, ep 11, state [1 1 1 0]\n",
      "instance 2, ep 12, state [1 1 0 0]\n",
      "instance 2, ep 13, state [0 1 1 0]\n",
      "instance 2, ep 14, state [1 0 1 1]\n",
      "instance 2, ep 15, state [1 0 0 0]\n",
      "instance 2, ep 16, state [0 1 1 1]\n",
      "instance 2, ep 17, state [1 1 1 1]\n",
      "instance 2, ep 18, state [1 0 0 0]\n",
      "instance 2, ep 19, state [1 1 0 1]\n",
      "instance 2, ep 20, state [1 0 0 1]\n",
      "instance 2, ep 21, state [1 1 1 1]\n",
      "instance 2, ep 22, state [1 1 1 0]\n",
      "instance 2, ep 23, state [0 0 1 1]\n",
      "instance 2, ep 24, state [1 0 0 0]\n",
      "instance 2, ep 25, state [0 1 0 0]\n",
      "instance 2, ep 26, state [1 0 1 1]\n",
      "instance 2, ep 27, state [0 1 1 1]\n",
      "instance 2, ep 28, state [0 1 0 0]\n",
      "instance 2, ep 29, state [0 1 0 0]\n",
      "first state [0 1 1 0]\n",
      "instance 3, ep 1, state [1 1 0 0]\n",
      "instance 3, ep 2, state [0 0 0 0]\n",
      "instance 3, ep 3, state [0 0 1 0]\n",
      "instance 3, ep 4, state [1 0 1 0]\n",
      "instance 3, ep 5, state [0 1 1 1]\n",
      "instance 3, ep 6, state [0 0 1 1]\n",
      "instance 3, ep 7, state [1 1 0 1]\n",
      "instance 3, ep 8, state [0 0 0 1]\n",
      "instance 3, ep 9, state [0 0 1 0]\n",
      "instance 3, ep 10, state [1 0 0 1]\n",
      "instance 3, ep 11, state [0 0 0 0]\n",
      "instance 3, ep 12, state [1 0 1 0]\n",
      "instance 3, ep 13, state [1 1 1 0]\n",
      "instance 3, ep 14, state [0 0 1 1]\n",
      "instance 3, ep 15, state [1 0 1 1]\n",
      "instance 3, ep 16, state [0 0 1 1]\n",
      "instance 3, ep 17, state [1 0 1 0]\n",
      "instance 3, ep 18, state [0 0 1 1]\n",
      "instance 3, ep 19, state [1 0 1 0]\n",
      "instance 3, ep 20, state [1 0 0 0]\n",
      "instance 3, ep 21, state [0 1 1 0]\n",
      "instance 3, ep 22, state [1 0 1 1]\n",
      "instance 3, ep 23, state [1 0 1 1]\n",
      "instance 3, ep 24, state [0 0 1 1]\n",
      "instance 3, ep 25, state [1 1 1 0]\n",
      "instance 3, ep 26, state [0 0 1 0]\n",
      "instance 3, ep 27, state [1 1 1 0]\n",
      "instance 3, ep 28, state [1 0 1 0]\n",
      "instance 3, ep 29, state [0 1 0 0]\n",
      "first state [0 1 0 1]\n",
      "instance 4, ep 1, state [0 0 0 0]\n",
      "instance 4, ep 2, state [1 0 1 0]\n",
      "instance 4, ep 3, state [1 0 0 1]\n",
      "instance 4, ep 4, state [0 0 1 1]\n",
      "instance 4, ep 5, state [0 0 1 0]\n",
      "instance 4, ep 6, state [0 0 1 1]\n",
      "instance 4, ep 7, state [0 0 0 1]\n",
      "instance 4, ep 8, state [0 0 1 0]\n",
      "instance 4, ep 9, state [1 0 0 0]\n",
      "instance 4, ep 10, state [1 1 1 0]\n",
      "instance 4, ep 11, state [1 0 0 1]\n",
      "instance 4, ep 12, state [0 0 0 0]\n",
      "instance 4, ep 13, state [0 1 0 1]\n",
      "instance 4, ep 14, state [1 0 0 0]\n",
      "instance 4, ep 15, state [1 0 1 0]\n",
      "instance 4, ep 16, state [1 0 0 1]\n",
      "instance 4, ep 17, state [1 0 1 0]\n",
      "instance 4, ep 18, state [1 1 0 0]\n",
      "instance 4, ep 19, state [0 1 1 0]\n",
      "instance 4, ep 20, state [0 1 1 1]\n",
      "instance 4, ep 21, state [0 0 0 1]\n",
      "instance 4, ep 22, state [0 1 0 1]\n",
      "instance 4, ep 23, state [1 1 0 0]\n",
      "instance 4, ep 24, state [0 1 1 1]\n",
      "instance 4, ep 25, state [1 1 0 1]\n",
      "instance 4, ep 26, state [0 0 1 0]\n",
      "instance 4, ep 27, state [0 1 0 1]\n",
      "instance 4, ep 28, state [0 0 0 0]\n",
      "instance 4, ep 29, state [1 0 1 0]\n",
      "first state [0 1 1 1]\n",
      "instance 5, ep 1, state [0 0 1 0]\n",
      "instance 5, ep 2, state [1 1 1 1]\n",
      "instance 5, ep 3, state [1 0 1 0]\n",
      "instance 5, ep 4, state [0 1 1 1]\n",
      "instance 5, ep 5, state [1 0 0 1]\n",
      "instance 5, ep 6, state [0 0 0 0]\n",
      "instance 5, ep 7, state [0 0 0 0]\n",
      "instance 5, ep 8, state [1 0 0 1]\n",
      "instance 5, ep 9, state [0 1 1 0]\n",
      "instance 5, ep 10, state [0 1 1 0]\n",
      "instance 5, ep 11, state [1 0 1 0]\n",
      "instance 5, ep 12, state [1 1 1 1]\n",
      "instance 5, ep 13, state [0 0 0 0]\n",
      "instance 5, ep 14, state [1 0 0 1]\n",
      "instance 5, ep 15, state [1 1 1 0]\n",
      "instance 5, ep 16, state [0 1 1 0]\n",
      "instance 5, ep 17, state [1 0 0 1]\n",
      "instance 5, ep 18, state [1 1 0 1]\n",
      "instance 5, ep 19, state [0 0 1 1]\n",
      "instance 5, ep 20, state [1 1 1 1]\n",
      "instance 5, ep 21, state [0 0 0 0]\n",
      "instance 5, ep 22, state [1 0 0 0]\n",
      "instance 5, ep 23, state [1 0 1 0]\n",
      "instance 5, ep 24, state [0 1 1 0]\n",
      "instance 5, ep 25, state [1 1 0 1]\n",
      "instance 5, ep 26, state [1 1 1 1]\n",
      "instance 5, ep 27, state [1 1 1 1]\n",
      "instance 5, ep 28, state [1 1 0 1]\n",
      "instance 5, ep 29, state [1 0 1 0]\n",
      "first state [0 0 1 0]\n",
      "instance 6, ep 1, state [1 0 1 0]\n",
      "instance 6, ep 2, state [1 1 1 1]\n",
      "instance 6, ep 3, state [1 1 0 0]\n",
      "instance 6, ep 4, state [1 1 1 0]\n",
      "instance 6, ep 5, state [0 0 1 0]\n",
      "instance 6, ep 6, state [0 0 0 1]\n",
      "instance 6, ep 7, state [0 1 0 0]\n",
      "instance 6, ep 8, state [0 0 0 0]\n",
      "instance 6, ep 9, state [1 0 1 1]\n",
      "instance 6, ep 10, state [1 0 0 0]\n",
      "instance 6, ep 11, state [0 1 0 0]\n",
      "instance 6, ep 12, state [1 1 1 0]\n",
      "instance 6, ep 13, state [0 1 0 0]\n",
      "instance 6, ep 14, state [0 0 0 0]\n",
      "instance 6, ep 15, state [1 1 1 0]\n",
      "instance 6, ep 16, state [0 0 1 1]\n",
      "instance 6, ep 17, state [0 1 0 1]\n",
      "instance 6, ep 18, state [1 1 1 1]\n",
      "instance 6, ep 19, state [0 1 0 1]\n",
      "instance 6, ep 20, state [1 1 0 1]\n",
      "instance 6, ep 21, state [1 1 0 0]\n",
      "instance 6, ep 22, state [0 0 1 0]\n",
      "instance 6, ep 23, state [1 0 0 1]\n",
      "instance 6, ep 24, state [1 0 1 1]\n",
      "instance 6, ep 25, state [0 1 1 1]\n",
      "instance 6, ep 26, state [0 1 0 0]\n",
      "instance 6, ep 27, state [0 0 1 1]\n",
      "instance 6, ep 28, state [1 0 0 0]\n",
      "instance 6, ep 29, state [1 0 1 1]\n",
      "first state [1 0 1 0]\n",
      "instance 7, ep 1, state [1 0 0 0]\n",
      "instance 7, ep 2, state [1 0 1 1]\n",
      "instance 7, ep 3, state [0 1 0 1]\n",
      "instance 7, ep 4, state [0 1 1 1]\n",
      "instance 7, ep 5, state [1 0 1 1]\n",
      "instance 7, ep 6, state [1 0 1 1]\n",
      "instance 7, ep 7, state [1 0 1 0]\n",
      "instance 7, ep 8, state [1 0 1 1]\n",
      "instance 7, ep 9, state [0 1 0 1]\n",
      "instance 7, ep 10, state [1 1 1 1]\n",
      "instance 7, ep 11, state [0 0 1 1]\n",
      "instance 7, ep 12, state [1 1 0 1]\n",
      "instance 7, ep 13, state [0 1 0 0]\n",
      "instance 7, ep 14, state [0 0 1 0]\n",
      "instance 7, ep 15, state [0 0 0 0]\n",
      "instance 7, ep 16, state [0 1 1 1]\n",
      "instance 7, ep 17, state [0 0 1 1]\n",
      "instance 7, ep 18, state [0 0 0 0]\n",
      "instance 7, ep 19, state [0 1 1 1]\n",
      "instance 7, ep 20, state [1 1 1 1]\n",
      "instance 7, ep 21, state [0 0 0 1]\n",
      "instance 7, ep 22, state [1 0 1 0]\n",
      "instance 7, ep 23, state [1 0 0 0]\n",
      "instance 7, ep 24, state [0 0 0 1]\n",
      "instance 7, ep 25, state [1 0 1 1]\n",
      "instance 7, ep 26, state [0 0 0 0]\n",
      "instance 7, ep 27, state [1 0 1 1]\n",
      "instance 7, ep 28, state [0 1 0 1]\n",
      "instance 7, ep 29, state [0 1 1 0]\n",
      "first state [0 0 1 1]\n",
      "instance 8, ep 1, state [0 1 0 1]\n",
      "instance 8, ep 2, state [0 0 1 0]\n",
      "instance 8, ep 3, state [1 1 1 0]\n",
      "instance 8, ep 4, state [0 0 1 1]\n",
      "instance 8, ep 5, state [1 1 1 1]\n",
      "instance 8, ep 6, state [0 1 0 1]\n",
      "instance 8, ep 7, state [1 1 0 0]\n",
      "instance 8, ep 8, state [0 0 0 1]\n",
      "instance 8, ep 9, state [1 0 0 0]\n",
      "instance 8, ep 10, state [1 1 1 0]\n",
      "instance 8, ep 11, state [1 1 0 1]\n",
      "instance 8, ep 12, state [0 1 0 1]\n",
      "instance 8, ep 13, state [1 1 1 0]\n",
      "instance 8, ep 14, state [0 0 0 1]\n",
      "instance 8, ep 15, state [0 1 1 1]\n",
      "instance 8, ep 16, state [0 1 1 0]\n",
      "instance 8, ep 17, state [1 1 0 1]\n",
      "instance 8, ep 18, state [0 0 0 0]\n",
      "instance 8, ep 19, state [0 0 1 1]\n",
      "instance 8, ep 20, state [1 0 0 1]\n",
      "instance 8, ep 21, state [0 0 1 0]\n",
      "instance 8, ep 22, state [1 1 0 0]\n",
      "instance 8, ep 23, state [1 0 0 1]\n",
      "instance 8, ep 24, state [0 1 1 0]\n",
      "instance 8, ep 25, state [0 0 0 0]\n",
      "instance 8, ep 26, state [1 0 1 1]\n",
      "instance 8, ep 27, state [1 1 0 1]\n",
      "instance 8, ep 28, state [1 0 0 1]\n",
      "instance 8, ep 29, state [0 0 0 0]\n",
      "first state [1 1 1 0]\n",
      "instance 9, ep 1, state [1 1 0 0]\n",
      "instance 9, ep 2, state [0 0 1 0]\n",
      "instance 9, ep 3, state [1 0 0 0]\n",
      "instance 9, ep 4, state [0 0 1 1]\n",
      "instance 9, ep 5, state [1 0 0 0]\n",
      "instance 9, ep 6, state [1 0 0 1]\n",
      "instance 9, ep 7, state [0 0 0 1]\n",
      "instance 9, ep 8, state [1 0 0 1]\n",
      "instance 9, ep 9, state [1 0 1 0]\n",
      "instance 9, ep 10, state [1 1 0 1]\n",
      "instance 9, ep 11, state [1 1 0 0]\n",
      "instance 9, ep 12, state [0 1 0 1]\n",
      "instance 9, ep 13, state [1 0 1 0]\n",
      "instance 9, ep 14, state [1 0 0 0]\n",
      "instance 9, ep 15, state [0 1 1 1]\n",
      "instance 9, ep 16, state [0 0 0 1]\n",
      "instance 9, ep 17, state [1 0 0 1]\n",
      "instance 9, ep 18, state [1 1 1 0]\n",
      "instance 9, ep 19, state [0 1 1 0]\n",
      "instance 9, ep 20, state [1 1 1 1]\n",
      "instance 9, ep 21, state [0 1 1 1]\n",
      "instance 9, ep 22, state [1 1 0 1]\n",
      "instance 9, ep 23, state [1 1 1 1]\n",
      "instance 9, ep 24, state [0 1 0 0]\n",
      "instance 9, ep 25, state [1 1 0 0]\n",
      "instance 9, ep 26, state [1 0 0 0]\n",
      "instance 9, ep 27, state [0 0 0 0]\n",
      "instance 9, ep 28, state [1 1 1 0]\n",
      "instance 9, ep 29, state [0 1 0 0]\n"
     ]
    }
   ],
   "source": [
    "# Seed both RNG sources (Python's random module and NumPy) before this run.\n",
    "random.seed(seed)\n",
    "np.random.seed(seed)\n",
    "\n",
    "# The final positional argument is -1 here; presumably a sentinel meaning an\n",
    "# unbounded (infinite-step) lookahead -- TODO confirm against rmab.baselines.\n",
    "infinite_step_rewards = myopic_match_n_step(\n",
    "    simulator, n_episodes, n_epochs, discount, -1\n",
    ")\n",
    "\n",
    "# Active rate: simulator.total_active divided by (reward entries * n_arms).\n",
    "# NOTE(review): assumes total_active covers only this run -- confirm that the\n",
    "# simulator counter is reset between policy evaluations.\n",
    "infinite_step_active_rate = simulator.total_active / (\n",
    "    infinite_step_rewards.size * n_arms\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "first state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.54 0.52] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "instance 0, ep 1, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.54 0.52] sorted [0 2 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.35 0.52 0.54 0.52] sorted [2 3 1]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "instance 0, ep 2, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "instance 0, ep 3, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.54 0.52] sorted [0 2 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "instance 0, ep 4, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "instance 0, ep 5, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.54 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.54 1.  ] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "instance 0, ep 6, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "instance 0, ep 7, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.54 1.  ] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.54 0.52] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.54 0.52] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "instance 0, ep 8, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.54 0.52] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.35 0.52 0.54 0.52] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "instance 0, ep 9, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.54 0.52] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.54 0.52] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "instance 0, ep 10, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.35 0.52 0.54 0.52] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "instance 0, ep 11, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.54 0.52] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "instance 0, ep 12, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [0 0 0 0] state_WI [0.35 0.52 0.54 0.52] sorted [2 3 1]\n",
      "instance 0, ep 13, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.35 0.52 0.54 0.52] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "instance 0, ep 14, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.54 0.52] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.54 0.52] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "instance 0, ep 15, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "instance 0, ep 16, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.35 0.52 0.54 0.52] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "instance 0, ep 17, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.54 1.  ] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "instance 0, ep 18, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.54 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.54 0.52] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "instance 0, ep 19, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [0 0 0 0] state_WI [0.35 0.52 0.54 0.52] sorted [2 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.54 0.52] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "instance 0, ep 20, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.54 0.52] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "instance 0, ep 21, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.54 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "instance 0, ep 22, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.54 0.52] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "instance 0, ep 23, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "instance 0, ep 24, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.54 0.52] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.54 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.54 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.54 1.  ] sorted [3 0 2]\n",
      "instance 0, ep 25, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [0 0 0 0] state_WI [0.35 0.52 0.54 0.52] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.54 0.52] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "instance 0, ep 26, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.52] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "instance 0, ep 27, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.52] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "instance 0, ep 28, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 0 0 1] state_WI [0.35 0.52 0.54 1.  ] sorted [3 2 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.54 1.  ] sorted [3 0 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 0 0 0] state_WI [0.35 0.52 0.54 0.52] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.54 0.52] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.54 0.52] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.54 1.  ] sorted [1 3 0]\n",
      "instance 0, ep 29, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 1 0 0] state_WI [0.35 1.   0.54 0.52] sorted [1 2 3]\n",
      "   state [0 0 1 0] state_WI [0.35 0.52 1.   0.52] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.35 1.   1.   0.52] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.35 1.   0.54 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.35 0.52 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.35 1.   1.   1.  ] sorted [2 1 3]\n",
      "first state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.45 1.   0.57] sorted [0 2 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.45 1.   0.57] sorted [0 2 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.45 1.   0.57] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "instance 1, ep 1, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "instance 1, ep 2, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.44 0.45 0.38 0.57] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "instance 1, ep 3, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.45 1.   0.57] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 1 1 0] state_WI [0.44 1.   1.   0.57] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.44 1.   1.   0.57] sorted [1 2 3]\n",
      "   state [0 0 0 0] state_WI [0.44 0.45 0.38 0.57] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.44 0.45 0.38 0.57] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "instance 1, ep 4, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.57] sorted [0 1 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.45 1.   0.57] sorted [0 2 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "instance 1, ep 5, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "instance 1, ep 6, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 0 1 0] state_WI [0.44 0.45 1.   0.57] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.45 1.   0.57] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "instance 1, ep 7, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.57] sorted [0 1 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.57] sorted [0 1 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "instance 1, ep 8, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.44 0.45 1.   0.57] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 0 1 0] state_WI [0.44 0.45 1.   0.57] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "instance 1, ep 9, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.44 1.   1.   0.57] sorted [1 2 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [0 1 3]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 0] state_WI [0.44 0.45 0.38 0.57] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.57] sorted [0 1 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "instance 1, ep 10, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.44 0.45 1.   0.57] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "instance 1, ep 11, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.44 0.45 1.   0.57] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.44 1.   1.   0.57] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "instance 1, ep 12, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "instance 1, ep 13, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "instance 1, ep 14, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.45 1.   0.57] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 0 0 0] state_WI [0.44 0.45 0.38 0.57] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.57] sorted [0 1 2]\n",
      "instance 1, ep 15, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "instance 1, ep 16, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.44 0.45 0.38 0.57] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "instance 1, ep 17, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 1 0] state_WI [0.44 1.   1.   0.57] sorted [1 2 3]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "instance 1, ep 18, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.57] sorted [0 1 2]\n",
      "   state [0 0 0 0] state_WI [0.44 0.45 0.38 0.57] sorted [3 1 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.57] sorted [0 1 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "instance 1, ep 19, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.44 1.   1.   0.57] sorted [1 2 3]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [0 1 1 0] state_WI [0.44 1.   1.   0.57] sorted [1 2 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.57] sorted [0 1 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "instance 1, ep 20, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.57] sorted [0 1 2]\n",
      "   state [0 1 1 0] state_WI [0.44 1.   1.   0.57] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.44 1.   1.   0.57] sorted [1 2 3]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.57] sorted [0 1 2]\n",
      "instance 1, ep 21, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "instance 1, ep 22, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 0] state_WI [0.44 0.45 0.38 0.57] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 0 0 0] state_WI [0.44 0.45 0.38 0.57] sorted [3 1 0]\n",
      "instance 1, ep 23, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.44 1.   1.   0.57] sorted [1 2 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "instance 1, ep 24, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.57] sorted [0 1 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.45 1.   0.57] sorted [0 2 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [0 1 1 0] state_WI [0.44 1.   1.   0.57] sorted [1 2 3]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "instance 1, ep 25, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.44 0.45 0.38 0.57] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 0 0 0] state_WI [0.44 0.45 0.38 0.57] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "instance 1, ep 26, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.45 1.   0.57] sorted [0 2 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "instance 1, ep 27, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.44 1.   1.   0.57] sorted [1 2 3]\n",
      "   state [0 0 0 0] state_WI [0.44 0.45 0.38 0.57] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "instance 1, ep 28, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.45 1.   0.57] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [0 0 1 1] state_WI [0.44 0.45 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.44 0.45 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.45 1.   1.  ] sorted [0 3 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.45 0.38 0.57] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "instance 1, ep 29, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.44 1.   1.   0.57] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.44 1.   1.   0.57] sorted [1 2 3]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.44 1.   0.38 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.57] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.44 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.57] sorted [0 1 2]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.44 0.45 0.38 0.57] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.44 1.   0.38 0.57] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.45 0.38 1.  ] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [0 1 3]\n",
      "first state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [0 1 0 0] state_WI [0.49 1.   0.66 0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "instance 2, ep 1, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 0] state_WI [0.49 1.   0.66 0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 1 0 0] state_WI [0.49 1.   0.66 0.55] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "instance 2, ep 2, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "instance 2, ep 3, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 0] state_WI [0.49 1.   0.66 0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 0 0] state_WI [0.49 0.5  0.66 0.55] sorted [2 3 1]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "instance 2, ep 4, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.5  0.66 0.55] sorted [0 2 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "instance 2, ep 5, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.66 0.55] sorted [0 1 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "instance 2, ep 6, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "instance 2, ep 7, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.49 0.5  0.66 0.55] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 0] state_WI [0.49 0.5  0.66 0.55] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "instance 2, ep 8, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "instance 2, ep 9, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "instance 2, ep 10, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "instance 2, ep 11, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "instance 2, ep 12, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.66 0.55] sorted [0 1 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "instance 2, ep 13, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "instance 2, ep 14, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "instance 2, ep 15, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.5  0.66 0.55] sorted [0 2 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.5  0.66 0.55] sorted [0 2 3]\n",
      "instance 2, ep 16, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "instance 2, ep 17, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.66 0.55] sorted [0 1 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.5  0.66 0.55] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "instance 2, ep 18, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.5  0.66 0.55] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "instance 2, ep 19, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "instance 2, ep 20, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.66 0.55] sorted [0 1 2]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "instance 2, ep 21, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "instance 2, ep 22, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.66 0.55] sorted [0 1 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.66 0.55] sorted [0 1 2]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.66 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 0] state_WI [0.49 1.   0.66 0.55] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "instance 2, ep 23, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "instance 2, ep 24, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.5  0.66 0.55] sorted [0 2 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.49 1.   0.66 0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 0] state_WI [0.49 1.   0.66 0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "instance 2, ep 25, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.49 1.   0.66 0.55] sorted [1 2 3]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 0] state_WI [0.49 1.   0.66 0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.66 0.55] sorted [0 1 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "instance 2, ep 26, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 0] state_WI [0.49 1.   0.66 0.55] sorted [1 2 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "instance 2, ep 27, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "   state [0 1 0 0] state_WI [0.49 1.   0.66 0.55] sorted [1 2 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.49 1.   1.   0.55] sorted [1 2 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "instance 2, ep 28, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.49 1.   0.66 0.55] sorted [1 2 3]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 0] state_WI [0.49 0.5  1.   0.55] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.55] sorted [0 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "instance 2, ep 29, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.49 1.   0.66 0.55] sorted [1 2 3]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.49 0.5  1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.49 1.   0.66 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.49 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.49 0.5  0.66 1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.49 1.   0.66 0.55] sorted [1 2 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.5 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.5  1.   0.55] sorted [0 2 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.5  0.66 1.  ] sorted [3 0 2]\n",
      "first state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "instance 3, ep 1, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.49 0.53] sorted [0 1 3]\n",
      "   state [0 0 0 0] state_WI [0.63 0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "instance 3, ep 2, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.63 0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 1 1 1] state_WI [0.63 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "instance 3, ep 3, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "instance 3, ep 4, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.63 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.63 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "instance 3, ep 5, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.63 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.63 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "instance 3, ep 6, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "instance 3, ep 7, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.63 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "instance 3, ep 8, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.63 0.4  0.49 1.  ] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.63 0.4  0.49 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "instance 3, ep 9, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [0 0 0 0] state_WI [0.63 0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [0 0 0 1] state_WI [0.63 0.4  0.49 1.  ] sorted [3 0 2]\n",
      "instance 3, ep 10, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "instance 3, ep 11, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.63 0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [0 0 0 1] state_WI [0.63 0.4  0.49 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "instance 3, ep 12, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 0 1] state_WI [0.63 0.4  0.49 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "instance 3, ep 13, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "instance 3, ep 14, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.63 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.63 1.   0.49 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 1 0 0] state_WI [0.63 1.   0.49 0.53] sorted [1 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "instance 3, ep 15, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "instance 3, ep 16, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.63 1.   0.49 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "instance 3, ep 17, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "instance 3, ep 18, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "instance 3, ep 19, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.49 0.53] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "instance 3, ep 20, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "instance 3, ep 21, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 0 1] state_WI [0.63 0.4  0.49 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "instance 3, ep 22, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.49 0.53] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [0 0 0 0] state_WI [0.63 0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "instance 3, ep 23, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.63 1.   0.49 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [0 0 0 1] state_WI [0.63 0.4  0.49 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "instance 3, ep 24, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 1 1 1] state_WI [0.63 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.63 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.63 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "instance 3, ep 25, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "instance 3, ep 26, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.63 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.63 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.63 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.49 0.53] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.63 1.   1.   0.53] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "instance 3, ep 27, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.49 0.53] sorted [0 1 3]\n",
      "instance 3, ep 28, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 1 0 1] state_WI [0.63 1.   0.49 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.49 0.53] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.49 0.53] sorted [0 3 2]\n",
      "   state [0 0 1 0] state_WI [0.63 0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "instance 3, ep 29, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.63 1.   0.49 0.53] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.53] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [0 1 1 1] state_WI [0.63 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.63 1.   0.49 1.  ] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.63 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.49 1.  ] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.49 1.  ] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.53] sorted [2 0 1]\n",
      "first state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.22 1.   0.26 1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.38 0.26 0.03] sorted [0 1 2]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.38 0.26 0.03] sorted [0 1 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 1, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.38 0.26 0.03] sorted [0 1 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.38 1.   1.  ] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 2, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 3, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.38 0.26 1.  ] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.38 0.26 0.03] sorted [0 1 2]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "instance 4, ep 4, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.22 0.38 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "instance 4, ep 5, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 6, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.22 0.38 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.38 0.26 0.03] sorted [0 1 2]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "instance 4, ep 7, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.22 0.38 0.26 1.  ] sorted [3 1 2]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 8, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 9, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.38 0.26 0.03] sorted [0 1 2]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "instance 4, ep 10, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "instance 4, ep 11, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.38 0.26 1.  ] sorted [0 3 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 1] state_WI [0.22 0.38 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 12, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.38 0.26 0.03] sorted [0 1 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.38 0.26 0.03] sorted [0 1 2]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "instance 4, ep 13, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.22 1.   0.26 1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.22 1.   0.26 1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.38 0.26 0.03] sorted [0 1 2]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "instance 4, ep 14, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.38 0.26 0.03] sorted [0 1 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.38 0.26 0.03] sorted [0 1 2]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.38 1.   1.  ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 15, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 16, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.38 0.26 1.  ] sorted [0 3 1]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 1 1] state_WI [0.22 0.38 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.22 0.38 1.   1.  ] sorted [2 3 1]\n",
      "instance 4, ep 17, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.38 1.   1.  ] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 18, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.38 1.   1.  ] sorted [2 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 19, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.38 0.26 0.03] sorted [0 1 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.22 0.38 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 20, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 1] state_WI [0.22 0.38 0.26 1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.38 0.26 0.03] sorted [0 1 2]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 21, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.22 0.38 0.26 1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.22 0.38 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 22, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.22 1.   0.26 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "instance 4, ep 23, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.38 0.26 0.03] sorted [0 1 2]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 0 1] state_WI [0.22 1.   0.26 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 0]\n",
      "instance 4, ep 24, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.38 0.26 0.03] sorted [0 1 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 25, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.26 1.  ] sorted [1 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "instance 4, ep 26, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.38 1.   1.  ] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "instance 4, ep 27, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.22 1.   0.26 1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.38 0.26 1.  ] sorted [0 3 1]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.22 0.38 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 1] state_WI [0.22 0.38 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 28, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 1] state_WI [0.22 0.38 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "instance 4, ep 29, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.22 0.38 1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.38 1.   0.03] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.22 1.   1.   1.  ] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.22 0.38 0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [0 1 0 0] state_WI [0.22 1.   0.26 0.03] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.03] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.26 0.03] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.22 1.   1.   0.03] sorted [2 1 0]\n",
      "first state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 1, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "instance 5, ep 2, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [0.32 0.41 0.58 1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 3, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 4, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "instance 5, ep 5, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.41 0.58 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.58 0.36] sorted [1 0 2]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 6, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "instance 5, ep 7, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "instance 5, ep 8, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.41 0.58 1.  ] sorted [3 0 2]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.41 0.58 1.  ] sorted [3 0 2]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [0.32 0.41 0.58 1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.41 0.58 0.36] sorted [0 2 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.58 1.  ] sorted [3 1 0]\n",
      "instance 5, ep 9, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "instance 5, ep 10, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 1] state_WI [0.32 0.41 0.58 1.  ] sorted [3 2 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [0.32 0.41 0.58 1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 11, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 12, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.58 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 13, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.41 0.58 0.36] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 14, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.41 0.58 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.41 0.58 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.41 0.58 1.  ] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.32 0.41 0.58 1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "instance 5, ep 15, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 16, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "instance 5, ep 17, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.41 0.58 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.41 0.58 1.  ] sorted [3 0 2]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 18, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.58 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.58 1.  ] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 19, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 1] state_WI [0.32 0.41 0.58 1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.58 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.41 0.58 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 20, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 21, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.58 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [0.32 0.41 0.58 1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 1] state_WI [0.32 0.41 0.58 1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 22, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.41 0.58 0.36] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.58 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.58 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 23, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.58 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.58 0.36] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.58 1.  ] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "instance 5, ep 24, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 1] state_WI [0.32 0.41 0.58 1.  ] sorted [3 2 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.58 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.58 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.41 0.58 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 1] state_WI [0.32 0.41 0.58 1.  ] sorted [3 2 1]\n",
      "instance 5, ep 25, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.58 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 26, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.36] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 1] state_WI [0.32 0.41 0.58 1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 27, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [0.32 0.41 0.58 1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.41 1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "instance 5, ep 28, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.58 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.58 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "instance 5, ep 29, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.41 1.   0.36] sorted [2 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.41 0.58 0.36] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.32 1.   1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.32 0.41 0.58 0.36] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 1 0 0] state_WI [0.32 1.   0.58 0.36] sorted [1 2 3]\n",
      "   state [0 0 1 0] state_WI [0.32 0.41 1.   0.36] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.32 0.41 1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.32 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.32 1.   0.58 1.  ] sorted [3 1 2]\n",
      "first state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.48 0.4  1.   0.41] sorted [2 0 3]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "instance 6, ep 1, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.41] sorted [0 2 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.41] sorted [0 2 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.41] sorted [0 2 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.48 1.   1.   1.  ] sorted [3 1 2]\n",
      "instance 6, ep 2, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.48 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.48 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "instance 6, ep 3, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "instance 6, ep 4, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "instance 6, ep 5, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.48 0.4  1.   0.41] sorted [2 0 3]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 1 0] state_WI [0.48 1.   1.   0.41] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "instance 6, ep 6, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 1 1 0] state_WI [0.48 1.   1.   0.41] sorted [1 2 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.48 1.   1.   0.41] sorted [1 2 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "instance 6, ep 7, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "instance 6, ep 8, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "instance 6, ep 9, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "instance 6, ep 10, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.48 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.48 0.4  1.   1.  ] sorted [3 2 0]\n",
      "   state [0 0 1 1] state_WI [0.48 0.4  1.   1.  ] sorted [3 2 0]\n",
      "   state [0 0 1 1] state_WI [0.48 0.4  1.   1.  ] sorted [3 2 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "instance 6, ep 11, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 1 0] state_WI [0.48 0.4  1.   0.41] sorted [2 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [0 0 1 1] state_WI [0.48 0.4  1.   1.  ] sorted [3 2 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "instance 6, ep 12, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 1 1] state_WI [0.48 0.4  1.   1.  ] sorted [3 2 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "instance 6, ep 13, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "instance 6, ep 14, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 1 1] state_WI [0.48 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "instance 6, ep 15, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "instance 6, ep 16, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.48 0.4  1.   1.  ] sorted [3 2 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.48 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "instance 6, ep 17, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.41] sorted [0 2 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "instance 6, ep 18, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.48 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "instance 6, ep 19, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [0.48 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.48 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.48 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "instance 6, ep 20, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "instance 6, ep 21, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.41] sorted [0 2 3]\n",
      "   state [0 0 1 0] state_WI [0.48 0.4  1.   0.41] sorted [2 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 1 1] state_WI [0.48 0.4  1.   1.  ] sorted [3 2 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "instance 6, ep 22, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.48 0.4  1.   0.41] sorted [2 0 3]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "instance 6, ep 23, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "instance 6, ep 24, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "instance 6, ep 25, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.48 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "instance 6, ep 26, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "instance 6, ep 27, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.48 0.4  1.   1.  ] sorted [3 2 0]\n",
      "   state [0 0 1 1] state_WI [0.48 0.4  1.   1.  ] sorted [3 2 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 0 0 0] state_WI [0.48 0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "instance 6, ep 28, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [0 1 1 0] state_WI [0.48 1.   1.   0.41] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.48 1.   1.   0.41] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.48 1.   1.   0.41] sorted [1 2 0]\n",
      "   state [0 1 1 0] state_WI [0.48 1.   1.   0.41] sorted [1 2 0]\n",
      "   state [0 1 0 1] state_WI [0.48 1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.48 1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [0 0 1 0] state_WI [0.48 0.4  1.   0.41] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.48 0.4  1.   1.  ] sorted [3 2 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "instance 6, ep 29, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [0 0 1 1] state_WI [0.48 0.4  1.   1.  ] sorted [3 2 0]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.22 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [3 0 2]\n",
      "   state [0 0 1 0] state_WI [0.48 0.4  1.   0.41] sorted [2 0 3]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 1 1] state_WI [0.48 0.4  1.   1.  ] sorted [3 2 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.48 0.4  0.22 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.22 0.41] sorted [0 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.22 0.41] sorted [1 0 3]\n",
      "first state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.45] sorted [0 2 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "instance 7, ep 1, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "instance 7, ep 2, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 0] state_WI [0.37 0.52 1.   0.45] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 0 1 0] state_WI [0.37 0.52 1.   0.45] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "instance 7, ep 3, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "instance 7, ep 4, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "instance 7, ep 5, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.45] sorted [0 2 1]\n",
      "   state [0 0 1 0] state_WI [0.37 0.52 1.   0.45] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "instance 7, ep 6, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "instance 7, ep 7, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.45] sorted [0 2 1]\n",
      "   state [0 0 1 0] state_WI [0.37 0.52 1.   0.45] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.37 0.52 1.   0.45] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.37 0.52 1.   0.45] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "instance 7, ep 8, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "instance 7, ep 9, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "instance 7, ep 10, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "instance 7, ep 11, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [0 0 1 0] state_WI [0.37 0.52 1.   0.45] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0] state_WI [0.37 0.52 1.   0.45] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "instance 7, ep 12, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "instance 7, ep 13, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "instance 7, ep 14, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.37 0.52 1.   0.45] sorted [2 1 3]\n",
      "   state [0 0 1 0] state_WI [0.37 0.52 1.   0.45] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "instance 7, ep 15, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "instance 7, ep 16, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "instance 7, ep 17, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "instance 7, ep 18, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "instance 7, ep 19, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [0 0 1 0] state_WI [0.37 0.52 1.   0.45] sorted [2 1 3]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "instance 7, ep 20, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "instance 7, ep 21, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "instance 7, ep 22, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.45] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "instance 7, ep 23, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.45] sorted [0 2 1]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "instance 7, ep 24, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.52 1.   0.45] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "instance 7, ep 25, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "instance 7, ep 26, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "instance 7, ep 27, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 0] state_WI [0.37 0.52 1.   0.45] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.37 0.52 0.32 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.37 0.52 0.32 0.45] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "instance 7, ep 28, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 0 1 0] state_WI [0.37 0.52 1.   0.45] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.37 1.   0.32 0.45] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.52 0.32 0.45] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "instance 7, ep 29, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [0 0 1 1] state_WI [0.37 0.52 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 0] state_WI [0.37 1.   1.   0.45] sorted [1 2 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.32 0.45] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.45] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 1 1] state_WI [0.37 1.   1.   1.  ] sorted [1 3 2]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.   0.52 1.   1.  ] sorted [3 0 2]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.37 1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.32 1.  ] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.52 0.32 1.  ] sorted [3 0 1]\n",
      "first state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.52 0.61] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.61 0.4  1.   0.61] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 0] state_WI [0.61 0.4  1.   0.61] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "instance 8, ep 1, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.61 1.   1.   0.61] sorted [2 1 3]\n",
      "   state [0 1 1 0] state_WI [0.61 1.   1.   0.61] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.61 0.4  1.   0.61] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "instance 8, ep 2, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.61 0.4  1.   0.61] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 0 0] state_WI [0.61 0.4  0.52 0.61] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "instance 8, ep 3, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [0 0 1 0] state_WI [0.61 0.4  1.   0.61] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "instance 8, ep 4, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.61 0.4  1.   0.61] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.61 0.4  0.52 0.61] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "instance 8, ep 5, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.61 1.   1.   0.61] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.61 0.4  1.   0.61] sorted [2 3 0]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "instance 8, ep 6, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.52 0.61] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "instance 8, ep 7, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.61 1.   1.   0.61] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.52 0.61] sorted [0 3 2]\n",
      "instance 8, ep 8, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.61 1.   1.   0.61] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.61 0.4  1.   0.61] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "instance 8, ep 9, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.52 0.61] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 0 0] state_WI [0.61 1.   0.52 0.61] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.61 1.   0.52 0.61] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 0 0 0] state_WI [0.61 0.4  0.52 0.61] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "instance 8, ep 10, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.61 1.   1.   0.61] sorted [2 1 3]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 0 1 0] state_WI [0.61 0.4  1.   0.61] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "instance 8, ep 11, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.52 0.61] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "instance 8, ep 12, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "instance 8, ep 13, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.61 0.4  1.   0.61] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "instance 8, ep 14, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.52 0.61] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.52 0.61] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.52 0.61] sorted [0 3 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "instance 8, ep 15, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 0] state_WI [0.61 1.   1.   0.61] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "instance 8, ep 16, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.61 1.   1.   0.61] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 0] state_WI [0.61 0.4  1.   0.61] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 1 1 0] state_WI [0.61 1.   1.   0.61] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "instance 8, ep 17, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "instance 8, ep 18, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.61 0.4  0.52 0.61] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.52 0.61] sorted [0 3 2]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [0 1 1 0] state_WI [0.61 1.   1.   0.61] sorted [2 1 3]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "instance 8, ep 19, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "instance 8, ep 20, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.52 0.61] sorted [0 3 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "instance 8, ep 21, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.61 0.4  1.   0.61] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.61 0.4  0.52 0.61] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "instance 8, ep 22, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "instance 8, ep 23, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [0 0 1 0] state_WI [0.61 0.4  1.   0.61] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 0 0] state_WI [0.61 0.4  0.52 0.61] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 0 1] state_WI [0.61 1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "instance 8, ep 24, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.61 1.   1.   0.61] sorted [2 1 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.61 0.4  0.52 0.61] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "instance 8, ep 25, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.61 0.4  0.52 0.61] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 0 0] state_WI [0.61 1.   0.52 0.61] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.61 1.   0.52 0.61] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.61 1.   0.52 0.61] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "instance 8, ep 26, state [1 0 1 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "   state [0 0 0 0] state_WI [0.61 0.4  0.52 0.61] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.61] sorted [2 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.52 0.61] sorted [1 0 3]\n",
      "instance 8, ep 27, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "instance 8, ep 28, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 0] state_WI [1.   0.4  0.52 0.61] sorted [0 3 2]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 0] state_WI [0.61 0.4  1.   0.61] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.4  1.   0.61] sorted [2 0 3]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.52 1.  ] sorted [3 1 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "instance 8, ep 29, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.61 0.4  0.52 0.61] sorted [3 0 2]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 1 1 1] state_WI [0.61 1.   1.   1.  ] sorted [2 3 1]\n",
      "   state [0 0 0 1] state_WI [0.61 0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 0 1 1] state_WI [1.  0.4 1.  1. ] sorted [2 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [2 3 1]\n",
      "   state [0 0 1 1] state_WI [0.61 0.4  1.   1.  ] sorted [2 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.4  0.52 1.  ] sorted [3 0 2]\n",
      "first state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "instance 9, ep 1, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "instance 9, ep 2, state [0 0 1 0]\n",
      "   state [0 0 1 0] state_WI [0.39 0.66 1.   0.41] sorted [2 1 3]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "instance 9, ep 3, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "instance 9, ep 4, state [0 0 1 1]\n",
      "   state [0 0 1 1] state_WI [0.39 0.66 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.66 1.   0.41] sorted [0 2 1]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "instance 9, ep 5, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.39 0.66 0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.66 1.   0.41] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 0 1 0] state_WI [1.   0.66 1.   0.41] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "instance 9, ep 6, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.66 1.   1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 0 1 1] state_WI [1.   0.66 1.   1.  ] sorted [3 0 2]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.66 1.   0.41] sorted [0 2 1]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "instance 9, ep 7, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "instance 9, ep 8, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "instance 9, ep 9, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.66 1.   0.41] sorted [0 2 1]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 0 0 0] state_WI [0.39 0.66 0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "instance 9, ep 10, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "instance 9, ep 11, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 0] state_WI [0.39 0.66 0.38 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "instance 9, ep 12, state [0 1 0 1]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "instance 9, ep 13, state [1 0 1 0]\n",
      "   state [1 0 1 0] state_WI [1.   0.66 1.   0.41] sorted [0 2 1]\n",
      "   state [1 0 1 0] state_WI [1.   0.66 1.   0.41] sorted [0 2 1]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "instance 9, ep 14, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "instance 9, ep 15, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.39 0.66 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "instance 9, ep 16, state [0 0 0 1]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "instance 9, ep 17, state [1 0 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.39 0.66 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "instance 9, ep 18, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "instance 9, ep 19, state [0 1 1 0]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "instance 9, ep 20, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "instance 9, ep 21, state [0 1 1 1]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "instance 9, ep 22, state [1 1 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "instance 9, ep 23, state [1 1 1 1]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "instance 9, ep 24, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "instance 9, ep 25, state [1 1 0 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "instance 9, ep 26, state [1 0 0 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "instance 9, ep 27, state [0 0 0 0]\n",
      "   state [0 0 0 0] state_WI [0.39 0.66 0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "instance 9, ep 28, state [1 1 1 0]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 0 0 0] state_WI [0.39 0.66 0.38 0.41] sorted [1 3 0]\n",
      "instance 9, ep 29, state [0 1 0 0]\n",
      "   state [0 1 0 0] state_WI [0.39 1.   0.38 0.41] sorted [1 3 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [0 1 0 1] state_WI [0.39 1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [0 1 1 0] state_WI [0.39 1.   1.   0.41] sorted [1 2 3]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [1 1 1 0] state_WI [1.   1.   1.   0.41] sorted [1 0 2]\n",
      "   state [1 1 1 1] state_WI [1. 1. 1. 1.] sorted [3 1 0]\n",
      "   state [0 1 1 1] state_WI [0.39 1.   1.   1.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1] state_WI [0.39 0.66 1.   1.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1] state_WI [0.39 0.66 0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 0 0 1] state_WI [1.   0.66 0.38 1.  ] sorted [3 0 1]\n",
      "   state [1 1 0 1] state_WI [1.   1.   0.38 1.  ] sorted [3 1 0]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 1 0 0] state_WI [1.   1.   0.38 0.41] sorted [1 0 3]\n",
      "   state [1 0 0 0] state_WI [1.   0.66 0.38 0.41] sorted [0 1 3]\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "0.7449583333333333"
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.random.seed(seed)\n",
    "random.seed(seed)\n",
    "whittle_approximate_rewards = optimal_whittle(simulator, n_episodes, n_epochs, discount,reward_function='matching')\n",
    "whittle_approximate_active_rate = simulator.total_active/(whittle_approximate_rewards.size*n_arms)\n",
    "np.mean(whittle_approximate_rewards)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [],
   "source": [
    "mean_rewards = {'random_rewards': np.mean(random_rewards), \n",
    " 'optimal_rewards': np.mean(optimal_reward), \n",
    " 'zero_step_rewards': np.mean(zero_step_rewards),\n",
    " 'one_step_rewards': np.mean(one_step_rewards),\n",
    " 'infinite_step_rewards': np.mean(infinite_step_rewards),\n",
    " 'whittle_approximate_rewards': np.mean(whittle_approximate_rewards)}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [],
   "source": [
    "active_rates = {'random_rewards': np.mean(random_active_rate), \n",
    " 'optimal_rewards': np.mean(optimal_active_rate), \n",
    " 'zero_step_rewards': np.mean(zero_step_active_rate),\n",
    " 'one_step_rewards': np.mean(one_step_active_rate),\n",
    " 'infinite_step_rewards': np.mean(infinite_step_active_rate),\n",
    " 'whittle_approximate_rewards': np.mean(whittle_approximate_active_rate)}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [],
   "source": [
    "std_rewards = {'random_rewards': np.std(random_rewards), \n",
    " 'optimal_rewards': np.std(optimal_reward), \n",
    " 'zero_step_rewards': np.std(zero_step_rewards),\n",
    " 'one_step_rewards': np.std(one_step_rewards),\n",
    " 'infinite_step_rewards': np.std(infinite_step_rewards),\n",
    " 'whittle_approximate_rewards': np.std(whittle_approximate_rewards), \n",
    " }"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "first state [0 1 1 1]\n",
      "instance 0, ep 1, state [1 1 1 1]\n",
      "instance 0, ep 2, state [0 0 0 1]\n",
      "instance 0, ep 3, state [1 1 0 1]\n",
      "instance 0, ep 4, state [0 1 1 1]\n",
      "instance 0, ep 5, state [0 0 0 1]\n",
      "instance 0, ep 6, state [0 0 0 1]\n",
      "instance 0, ep 7, state [0 1 1 0]\n",
      "instance 0, ep 8, state [1 1 0 1]\n",
      "instance 0, ep 9, state [1 1 1 1]\n",
      "instance 0, ep 10, state [0 0 0 0]\n",
      "instance 0, ep 11, state [0 1 0 0]\n",
      "instance 0, ep 12, state [0 1 0 1]\n",
      "instance 0, ep 13, state [0 0 0 0]\n",
      "instance 0, ep 14, state [1 0 1 0]\n",
      "instance 0, ep 15, state [0 0 0 1]\n",
      "instance 0, ep 16, state [0 0 0 0]\n",
      "instance 0, ep 17, state [1 1 0 1]\n",
      "instance 0, ep 18, state [0 1 0 0]\n",
      "instance 0, ep 19, state [0 1 1 1]\n",
      "instance 0, ep 20, state [0 1 1 0]\n",
      "instance 0, ep 21, state [0 0 1 0]\n",
      "instance 0, ep 22, state [1 0 1 1]\n",
      "instance 0, ep 23, state [0 1 1 1]\n",
      "instance 0, ep 24, state [0 0 1 1]\n",
      "instance 0, ep 25, state [0 0 1 0]\n",
      "instance 0, ep 26, state [1 1 1 1]\n",
      "instance 0, ep 27, state [0 1 1 0]\n",
      "instance 0, ep 28, state [0 1 1 0]\n",
      "instance 0, ep 29, state [1 1 1 1]\n",
      "first state [1 0 0 0]\n",
      "instance 1, ep 1, state [1 0 0 1]\n",
      "instance 1, ep 2, state [0 0 0 0]\n",
      "instance 1, ep 3, state [1 0 1 0]\n",
      "instance 1, ep 4, state [1 0 0 1]\n",
      "instance 1, ep 5, state [1 1 0 0]\n",
      "instance 1, ep 6, state [0 1 0 1]\n",
      "instance 1, ep 7, state [0 1 0 1]\n",
      "instance 1, ep 8, state [0 0 1 0]\n",
      "instance 1, ep 9, state [0 1 1 0]\n",
      "instance 1, ep 10, state [0 0 1 0]\n",
      "instance 1, ep 11, state [0 0 0 1]\n",
      "instance 1, ep 12, state [0 1 0 0]\n",
      "instance 1, ep 13, state [0 0 1 1]\n",
      "instance 1, ep 14, state [1 1 0 1]\n",
      "instance 1, ep 15, state [0 1 0 0]\n",
      "instance 1, ep 16, state [0 0 0 0]\n",
      "instance 1, ep 17, state [1 0 0 1]\n",
      "instance 1, ep 18, state [1 0 0 1]\n",
      "instance 1, ep 19, state [0 1 1 0]\n",
      "instance 1, ep 20, state [0 1 1 1]\n",
      "instance 1, ep 21, state [1 1 1 1]\n",
      "instance 1, ep 22, state [1 1 1 1]\n",
      "instance 1, ep 23, state [1 0 1 1]\n",
      "instance 1, ep 24, state [1 1 1 0]\n",
      "instance 1, ep 25, state [0 0 0 0]\n",
      "instance 1, ep 26, state [1 0 1 0]\n",
      "instance 1, ep 27, state [1 0 0 0]\n",
      "instance 1, ep 28, state [1 0 1 0]\n",
      "instance 1, ep 29, state [0 1 1 0]\n",
      "first state [1 0 0 1]\n",
      "instance 2, ep 1, state [0 1 0 1]\n",
      "instance 2, ep 2, state [0 1 1 1]\n",
      "instance 2, ep 3, state [0 1 1 1]\n",
      "instance 2, ep 4, state [1 1 0 1]\n",
      "instance 2, ep 5, state [1 1 0 0]\n",
      "instance 2, ep 6, state [1 1 0 1]\n",
      "instance 2, ep 7, state [0 0 0 0]\n",
      "instance 2, ep 8, state [1 0 1 1]\n",
      "instance 2, ep 9, state [1 1 0 1]\n",
      "instance 2, ep 10, state [1 0 1 1]\n",
      "instance 2, ep 11, state [1 1 1 0]\n",
      "instance 2, ep 12, state [1 1 0 0]\n",
      "instance 2, ep 13, state [0 1 1 0]\n",
      "instance 2, ep 14, state [1 0 1 1]\n",
      "instance 2, ep 15, state [1 0 0 0]\n",
      "instance 2, ep 16, state [0 1 1 1]\n",
      "instance 2, ep 17, state [1 1 1 1]\n",
      "instance 2, ep 18, state [1 0 0 0]\n",
      "instance 2, ep 19, state [1 1 0 1]\n",
      "instance 2, ep 20, state [1 0 0 1]\n",
      "instance 2, ep 21, state [1 1 1 1]\n",
      "instance 2, ep 22, state [1 1 1 0]\n",
      "instance 2, ep 23, state [0 0 1 1]\n",
      "instance 2, ep 24, state [1 0 0 0]\n",
      "instance 2, ep 25, state [0 1 0 0]\n",
      "instance 2, ep 26, state [1 0 1 1]\n",
      "instance 2, ep 27, state [0 1 1 1]\n",
      "instance 2, ep 28, state [0 1 0 0]\n",
      "instance 2, ep 29, state [0 1 0 0]\n",
      "first state [0 1 1 0]\n",
      "instance 3, ep 1, state [1 1 0 0]\n",
      "instance 3, ep 2, state [0 0 0 0]\n",
      "instance 3, ep 3, state [0 0 1 0]\n",
      "instance 3, ep 4, state [1 0 1 0]\n",
      "instance 3, ep 5, state [0 1 1 1]\n",
      "instance 3, ep 6, state [0 0 1 1]\n",
      "instance 3, ep 7, state [1 1 0 1]\n",
      "instance 3, ep 8, state [0 0 0 1]\n",
      "instance 3, ep 9, state [0 0 1 0]\n",
      "instance 3, ep 10, state [1 0 0 1]\n",
      "instance 3, ep 11, state [0 0 0 0]\n",
      "instance 3, ep 12, state [1 0 1 0]\n",
      "instance 3, ep 13, state [1 1 1 0]\n",
      "instance 3, ep 14, state [0 0 1 1]\n",
      "instance 3, ep 15, state [1 0 1 1]\n",
      "instance 3, ep 16, state [0 0 1 1]\n",
      "instance 3, ep 17, state [1 0 1 0]\n",
      "instance 3, ep 18, state [0 0 1 1]\n",
      "instance 3, ep 19, state [1 0 1 0]\n",
      "instance 3, ep 20, state [1 0 0 0]\n",
      "instance 3, ep 21, state [0 1 1 0]\n",
      "instance 3, ep 22, state [1 0 1 1]\n",
      "instance 3, ep 23, state [1 0 1 1]\n",
      "instance 3, ep 24, state [0 0 1 1]\n",
      "instance 3, ep 25, state [1 1 1 0]\n",
      "instance 3, ep 26, state [0 0 1 0]\n",
      "instance 3, ep 27, state [1 1 1 0]\n",
      "instance 3, ep 28, state [1 0 1 0]\n",
      "instance 3, ep 29, state [0 1 0 0]\n",
      "first state [0 1 0 1]\n",
      "instance 4, ep 1, state [0 0 0 0]\n",
      "instance 4, ep 2, state [1 0 1 0]\n",
      "instance 4, ep 3, state [1 0 0 1]\n",
      "instance 4, ep 4, state [0 0 1 1]\n",
      "instance 4, ep 5, state [0 0 1 0]\n",
      "instance 4, ep 6, state [0 0 1 1]\n",
      "instance 4, ep 7, state [0 0 0 1]\n",
      "instance 4, ep 8, state [0 0 1 0]\n",
      "instance 4, ep 9, state [1 0 0 0]\n",
      "instance 4, ep 10, state [1 1 1 0]\n",
      "instance 4, ep 11, state [1 0 0 1]\n",
      "instance 4, ep 12, state [0 0 0 0]\n",
      "instance 4, ep 13, state [0 1 0 1]\n",
      "instance 4, ep 14, state [1 0 0 0]\n",
      "instance 4, ep 15, state [1 0 1 0]\n",
      "instance 4, ep 16, state [1 0 0 1]\n",
      "instance 4, ep 17, state [1 0 1 0]\n",
      "instance 4, ep 18, state [1 1 0 0]\n",
      "instance 4, ep 19, state [0 1 1 0]\n",
      "instance 4, ep 20, state [0 1 1 1]\n",
      "instance 4, ep 21, state [0 0 0 1]\n",
      "instance 4, ep 22, state [0 1 0 1]\n",
      "instance 4, ep 23, state [1 1 0 0]\n",
      "instance 4, ep 24, state [0 1 1 1]\n",
      "instance 4, ep 25, state [1 1 0 1]\n",
      "instance 4, ep 26, state [0 0 1 0]\n",
      "instance 4, ep 27, state [0 1 0 1]\n",
      "instance 4, ep 28, state [0 0 0 0]\n",
      "instance 4, ep 29, state [1 0 1 0]\n",
      "first state [0 1 1 1]\n",
      "instance 5, ep 1, state [0 0 1 0]\n",
      "instance 5, ep 2, state [1 1 1 1]\n",
      "instance 5, ep 3, state [1 0 1 0]\n",
      "instance 5, ep 4, state [0 1 1 1]\n",
      "instance 5, ep 5, state [1 0 0 1]\n",
      "instance 5, ep 6, state [0 0 0 0]\n",
      "instance 5, ep 7, state [0 0 0 0]\n",
      "instance 5, ep 8, state [1 0 0 1]\n",
      "instance 5, ep 9, state [0 1 1 0]\n",
      "instance 5, ep 10, state [0 1 1 0]\n",
      "instance 5, ep 11, state [1 0 1 0]\n",
      "instance 5, ep 12, state [1 1 1 1]\n",
      "instance 5, ep 13, state [0 0 0 0]\n",
      "instance 5, ep 14, state [1 0 0 1]\n",
      "instance 5, ep 15, state [1 1 1 0]\n",
      "instance 5, ep 16, state [0 1 1 0]\n",
      "instance 5, ep 17, state [1 0 0 1]\n",
      "instance 5, ep 18, state [1 1 0 1]\n",
      "instance 5, ep 19, state [0 0 1 1]\n",
      "instance 5, ep 20, state [1 1 1 1]\n",
      "instance 5, ep 21, state [0 0 0 0]\n",
      "instance 5, ep 22, state [1 0 0 0]\n",
      "instance 5, ep 23, state [1 0 1 0]\n",
      "instance 5, ep 24, state [0 1 1 0]\n",
      "instance 5, ep 25, state [1 1 0 1]\n",
      "instance 5, ep 26, state [1 1 1 1]\n",
      "instance 5, ep 27, state [1 1 1 1]\n",
      "instance 5, ep 28, state [1 1 0 1]\n",
      "instance 5, ep 29, state [1 0 1 0]\n",
      "first state [0 0 1 0]\n",
      "instance 6, ep 1, state [1 0 1 0]\n",
      "instance 6, ep 2, state [1 1 1 1]\n",
      "instance 6, ep 3, state [1 1 0 0]\n",
      "instance 6, ep 4, state [1 1 1 0]\n",
      "instance 6, ep 5, state [0 0 1 0]\n",
      "instance 6, ep 6, state [0 0 0 1]\n",
      "instance 6, ep 7, state [0 1 0 0]\n",
      "instance 6, ep 8, state [0 0 0 0]\n",
      "instance 6, ep 9, state [1 0 1 1]\n",
      "instance 6, ep 10, state [1 0 0 0]\n",
      "instance 6, ep 11, state [0 1 0 0]\n",
      "instance 6, ep 12, state [1 1 1 0]\n",
      "instance 6, ep 13, state [0 1 0 0]\n",
      "instance 6, ep 14, state [0 0 0 0]\n",
      "instance 6, ep 15, state [1 1 1 0]\n",
      "instance 6, ep 16, state [0 0 1 1]\n",
      "instance 6, ep 17, state [0 1 0 1]\n",
      "instance 6, ep 18, state [1 1 1 1]\n",
      "instance 6, ep 19, state [0 1 0 1]\n",
      "instance 6, ep 20, state [1 1 0 1]\n",
      "instance 6, ep 21, state [1 1 0 0]\n",
      "instance 6, ep 22, state [0 0 1 0]\n",
      "instance 6, ep 23, state [1 0 0 1]\n",
      "instance 6, ep 24, state [1 0 1 1]\n",
      "instance 6, ep 25, state [0 1 1 1]\n",
      "instance 6, ep 26, state [0 1 0 0]\n",
      "instance 6, ep 27, state [0 0 1 1]\n",
      "instance 6, ep 28, state [1 0 0 0]\n",
      "instance 6, ep 29, state [1 0 1 1]\n",
      "first state [1 0 1 0]\n",
      "instance 7, ep 1, state [1 0 0 0]\n",
      "instance 7, ep 2, state [1 0 1 1]\n",
      "instance 7, ep 3, state [0 1 0 1]\n",
      "instance 7, ep 4, state [0 1 1 1]\n",
      "instance 7, ep 5, state [1 0 1 1]\n",
      "instance 7, ep 6, state [1 0 1 1]\n",
      "instance 7, ep 7, state [1 0 1 0]\n",
      "instance 7, ep 8, state [1 0 1 1]\n",
      "instance 7, ep 9, state [0 1 0 1]\n",
      "instance 7, ep 10, state [1 1 1 1]\n",
      "instance 7, ep 11, state [0 0 1 1]\n",
      "instance 7, ep 12, state [1 1 0 1]\n",
      "instance 7, ep 13, state [0 1 0 0]\n",
      "instance 7, ep 14, state [0 0 1 0]\n",
      "instance 7, ep 15, state [0 0 0 0]\n",
      "instance 7, ep 16, state [0 1 1 1]\n",
      "instance 7, ep 17, state [0 0 1 1]\n",
      "instance 7, ep 18, state [0 0 0 0]\n",
      "instance 7, ep 19, state [0 1 1 1]\n",
      "instance 7, ep 20, state [1 1 1 1]\n",
      "instance 7, ep 21, state [0 0 0 1]\n",
      "instance 7, ep 22, state [1 0 1 0]\n",
      "instance 7, ep 23, state [1 0 0 0]\n",
      "instance 7, ep 24, state [0 0 0 1]\n",
      "instance 7, ep 25, state [1 0 1 1]\n",
      "instance 7, ep 26, state [0 0 0 0]\n",
      "instance 7, ep 27, state [1 0 1 1]\n",
      "instance 7, ep 28, state [0 1 0 1]\n",
      "instance 7, ep 29, state [0 1 1 0]\n",
      "first state [0 0 1 1]\n",
      "instance 8, ep 1, state [0 1 0 1]\n",
      "instance 8, ep 2, state [0 0 1 0]\n",
      "instance 8, ep 3, state [1 1 1 0]\n",
      "instance 8, ep 4, state [0 0 1 1]\n",
      "instance 8, ep 5, state [1 1 1 1]\n",
      "instance 8, ep 6, state [0 1 0 1]\n",
      "instance 8, ep 7, state [1 1 0 0]\n",
      "instance 8, ep 8, state [0 0 0 1]\n",
      "instance 8, ep 9, state [1 0 0 0]\n",
      "instance 8, ep 10, state [1 1 1 0]\n",
      "instance 8, ep 11, state [1 1 0 1]\n",
      "instance 8, ep 12, state [0 1 0 1]\n",
      "instance 8, ep 13, state [1 1 1 0]\n",
      "instance 8, ep 14, state [0 0 0 1]\n",
      "instance 8, ep 15, state [0 1 1 1]\n",
      "instance 8, ep 16, state [0 1 1 0]\n",
      "instance 8, ep 17, state [1 1 0 1]\n",
      "instance 8, ep 18, state [0 0 0 0]\n",
      "instance 8, ep 19, state [0 0 1 1]\n",
      "instance 8, ep 20, state [1 0 0 1]\n",
      "instance 8, ep 21, state [0 0 1 0]\n",
      "instance 8, ep 22, state [1 1 0 0]\n",
      "instance 8, ep 23, state [1 0 0 1]\n",
      "instance 8, ep 24, state [0 1 1 0]\n",
      "instance 8, ep 25, state [0 0 0 0]\n",
      "instance 8, ep 26, state [1 0 1 1]\n",
      "instance 8, ep 27, state [1 1 0 1]\n",
      "instance 8, ep 28, state [1 0 0 1]\n",
      "instance 8, ep 29, state [0 0 0 0]\n",
      "first state [1 1 1 0]\n",
      "instance 9, ep 1, state [1 1 0 0]\n",
      "instance 9, ep 2, state [0 0 1 0]\n",
      "instance 9, ep 3, state [1 0 0 0]\n",
      "instance 9, ep 4, state [0 0 1 1]\n",
      "instance 9, ep 5, state [1 0 0 0]\n",
      "instance 9, ep 6, state [1 0 0 1]\n",
      "instance 9, ep 7, state [0 0 0 1]\n",
      "instance 9, ep 8, state [1 0 0 1]\n",
      "instance 9, ep 9, state [1 0 1 0]\n",
      "instance 9, ep 10, state [1 1 0 1]\n",
      "instance 9, ep 11, state [1 1 0 0]\n",
      "instance 9, ep 12, state [0 1 0 1]\n",
      "instance 9, ep 13, state [1 0 1 0]\n",
      "instance 9, ep 14, state [1 0 0 0]\n",
      "instance 9, ep 15, state [0 1 1 1]\n",
      "instance 9, ep 16, state [0 0 0 1]\n",
      "instance 9, ep 17, state [1 0 0 1]\n",
      "instance 9, ep 18, state [1 1 1 0]\n",
      "instance 9, ep 19, state [0 1 1 0]\n",
      "instance 9, ep 20, state [1 1 1 1]\n",
      "instance 9, ep 21, state [0 1 1 1]\n",
      "instance 9, ep 22, state [1 1 0 1]\n",
      "instance 9, ep 23, state [1 1 1 1]\n",
      "instance 9, ep 24, state [0 1 0 0]\n",
      "instance 9, ep 25, state [1 1 0 0]\n",
      "instance 9, ep 26, state [1 0 0 0]\n",
      "instance 9, ep 27, state [0 0 0 0]\n",
      "instance 9, ep 28, state [1 1 1 0]\n",
      "instance 9, ep 29, state [0 1 0 0]\n"
     ]
    }
   ],
   "source": [
    "if n_arms <= 6:\n",
    "    np.random.seed(seed)\n",
    "    random.seed(seed)\n",
    "    optimal_match_rewards = optimal_q_iteration(simulator, n_episodes, n_epochs, discount,reward_function='matching')\n",
    "    optimal_match_active_rate = simulator.total_active/(optimal_match_rewards.size*n_arms)\n",
    "\n",
    "    mean_rewards['optimal_match_rewards'] = np.mean(optimal_match_rewards)\n",
    "    active_rates['optimal_match_rewards'] = np.mean(optimal_match_active_rate)\n",
    "    std_rewards['optimal_match_rewards'] = np.std(optimal_match_rewards)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'random_rewards': 0.6314791666666667,\n",
       " 'optimal_rewards': 0.6417291666666667,\n",
       " 'zero_step_rewards': 0.7406666666666667,\n",
       " 'one_step_rewards': 0.7450625,\n",
       " 'infinite_step_rewards': 0.733625,\n",
       " 'whittle_approximate_rewards': 0.7437916666666666,\n",
       " 'optimal_match_rewards': 0.7490833333333333}"
      ]
     },
     "execution_count": 26,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "mean_rewards"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {},
   "outputs": [],
   "source": [
    "data = {\n",
    "    'mean_reward': mean_rewards, \n",
    "    'std_reward': std_rewards,\n",
    "    'active_rate': active_rates, \n",
    "    'parameters': \n",
    "        {'seed'      : seed,\n",
    "        'n_arms'    : n_arms,\n",
    "        'budget'    : budget,\n",
    "        'discount'  : discount, \n",
    "        'alpha'     : alpha, \n",
    "        'n_episodes': n_episodes, \n",
    "        'episode_len': episode_len, \n",
    "        'n_epochs'  : n_epochs, \n",
    "        'match_prob': match_prob} \n",
    "}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 85,
   "metadata": {},
   "outputs": [],
   "source": [
    "save_path = get_save_path('matching_baseline',save_name,seed,use_date=save_with_date)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 86,
   "metadata": {},
   "outputs": [],
   "source": [
    "delete_duplicate_results('matching_baseline',save_name,data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 87,
   "metadata": {},
   "outputs": [],
   "source": [
    "json.dump(data,open('../results/'+save_path,'w'))"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "food",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.12"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
