{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Improved Uncertain Activity Bandits"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Improve Uncertain (non-Oracle) Activity Bandits (from their baseline) with unknown transition functions. We improve these by imporving the way they learn the transition function using a normal approximation (Wilson score) along with fixing some bugs in their code"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "%load_ext autoreload\n",
    "%autoreload 2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import random \n",
    "import matplotlib.pyplot as plt\n",
    "import json \n",
    "import argparse \n",
    "import sys\n",
    "from scipy.stats import norm"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "from rmab.simulator import RMABSimulator, random_valid_transition\n",
    "from rmab.uc_whittle import UCWhittleBuggy, UCWhittle, UCWhittleOracle \n",
    "\n",
    "from rmab.baselines import optimal_whittle, random_policy, WIQL\n",
    "from rmab.fr_dynamics import get_all_transitions\n",
    "from rmab.utils import get_save_path, delete_duplicate_results\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "is_jupyter = 'ipykernel' in sys.modules"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "if is_jupyter: \n",
    "    seed        = 42\n",
    "    n_arms      = 8\n",
    "    budget      = 3\n",
    "    discount    = 0.9\n",
    "    alpha       = 3 \n",
    "    n_episodes  = 30\n",
    "    episode_len = 20\n",
    "    n_epochs    = 10\n",
    "    save_name = 'normal_confidence'\n",
    "    save_with_date = False \n",
    "    dataset = 'fr'\n",
    "else:\n",
    "    parser = argparse.ArgumentParser()\n",
    "    parser.add_argument('--n_arms',         '-N', help='num beneficiaries (arms)', type=int, default=8)\n",
    "    parser.add_argument('--episode_len',    '-H', help='episode length', type=int, default=20)\n",
    "    parser.add_argument('--n_episodes',     '-T', help='num episodes', type=int, default=30)\n",
    "    parser.add_argument('--budget',         '-B', help='budget', type=int, default=3)\n",
    "    parser.add_argument('--n_epochs',       '-E', help='number of epochs (num_repeats)', type=int, default=10)\n",
    "    parser.add_argument('--discount',       '-d', help='discount factor', type=float, default=0.9)\n",
    "    parser.add_argument('--alpha',          '-a', help='alpha: for conf radius', type=float, default=3)\n",
    "    parser.add_argument('--seed',           '-s', help='random seed', type=int, default=42)\n",
    "    parser.add_argument('--save_name',      '-n', help='save name', type=str, default='results')\n",
    "    parser.add_argument('--dataset',      '-ds', help='which dataset', type=str, default='fr')\n",
    "    parser.add_argument('--use_date', action='store_true')\n",
    "\n",
    "    args = parser.parse_args()\n",
    "\n",
    "    n_arms      = args.n_arms\n",
    "    budget      = args.budget\n",
    "    discount    = args.discount\n",
    "    alpha       = args.alpha \n",
    "    seed        = args.seed\n",
    "    n_episodes  = args.n_episodes\n",
    "    episode_len = args.episode_len\n",
    "    n_epochs    = args.n_epochs\n",
    "    save_name   = args.save_name \n",
    "    save_with_date = args.use_date \n",
    "    dataset = args.dataset \n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "n_states = 2\n",
    "n_actions = 2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_population_size = 100 # number of random arms to generate\n",
    "\n",
    "if dataset == 'fr':\n",
    "    all_transitions = get_all_transitions(all_population_size)\n",
    "elif dataset == 'synthetic':\n",
    "    all_transitions = random_valid_transition(all_population_size, n_states, n_actions)\n",
    "else:\n",
    "    raise Exception(\"Dataset {} is not found\".format(dataset))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_features = np.arange(all_population_size)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "acting should always be good! 0.000 < 0.044\n",
      "acting should always be good! 0.000 < 0.162\n",
      "acting should always be good! 0.108 < 0.183\n",
      "good start state should always be good! 0.380 < 0.508\n",
      "good start state should always be good! 0.506 < 0.760\n",
      "cohort [83 53 70 45 44 39 22 80]\n",
      "cohort [45 80  5 29 78 35 86 14]\n",
      "cohort [42 28 84 76 68 46 97 15]\n",
      "cohort [51 29 14 74 15  3 31 87]\n",
      "cohort [55  0 94  4 72 26 38  3]\n",
      "cohort [69 66 55 63 30 61 42 29]\n",
      "cohort [83 68 66 27 99 32 35 23]\n",
      "cohort [31  1 98 11 36  4 84 58]\n",
      "cohort [ 5 41 86 49 97 13 58 42]\n",
      "cohort [22 71 78 83 30 48 34 29]\n"
     ]
    }
   ],
   "source": [
    "np.random.seed(seed)\n",
    "random.seed(seed)\n",
    "simulator = RMABSimulator(all_population_size, all_features, all_transitions,\n",
    "            n_arms, episode_len, n_epochs, n_episodes, budget, number_states=n_states)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "solving UCWhittle using method: UCB\n",
      "first state [0 1 1 1 1 1 1 1]\n",
      "---------------------------------------------------\n",
      "0 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 1 0 0 1 0 1]  | r  7    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 0, ep 1, state [0 0 0 1 1 1 0 1]\n",
      "instance 0, ep 2, state [0 1 1 1 0 0 0 1]\n",
      "instance 0, ep 3, state [0 0 0 1 0 1 1 0]\n",
      "instance 0, ep 4, state [1 1 0 1 1 1 1 1]\n",
      "instance 0, ep 5, state [0 0 0 0 0 1 0 0]\n",
      "---------------------------------------------------\n",
      "0 100  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 0 0 0 1 0 0]  | r  1    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 0, ep 6, state [0 1 0 1 0 0 0 0]\n",
      "instance 0, ep 7, state [1 0 1 0 0 0 0 1]\n",
      "instance 0, ep 8, state [0 0 0 0 1 1 0 1]\n",
      "instance 0, ep 9, state [0 1 0 0 0 1 1 1]\n",
      "instance 0, ep 10, state [0 1 1 0 0 0 1 0]\n",
      "---------------------------------------------------\n",
      "0 200  | a  [0 0 0 0 0 1 1 1]  | s'  [1 1 1 0 0 1 1 0]  | r  3    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 0, ep 11, state [1 0 1 1 0 1 1 1]\n",
      "instance 0, ep 12, state [0 0 1 1 0 0 1 0]\n",
      "instance 0, ep 13, state [1 1 1 1 0 1 1 0]\n",
      "instance 0, ep 14, state [0 1 1 0 1 1 1 1]\n",
      "instance 0, ep 15, state [0 0 1 1 1 0 1 1]\n",
      "---------------------------------------------------\n",
      "0 300  | a  [0 0 0 0 0 1 1 1]  | s'  [0 1 0 1 1 1 1 1]  | r  5    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 0, ep 16, state [1 1 1 1 0 1 1 0]\n",
      "instance 0, ep 17, state [0 0 0 1 0 0 0 0]\n",
      "instance 0, ep 18, state [0 1 1 0 1 1 1 0]\n",
      "instance 0, ep 19, state [1 1 0 1 0 0 1 1]\n",
      "instance 0, ep 20, state [1 0 0 1 1 0 1 0]\n",
      "---------------------------------------------------\n",
      "0 400  | a  [0 1 1 0 0 1 0 0]  | s'  [0 1 1 0 0 0 1 0]  | r  4    | WI  [-0.     0.015  0.016 -0.    -0.     0.013 -0.    -0.   ]\n",
      "instance 0, ep 21, state [0 1 1 1 0 1 1 1]\n",
      "instance 0, ep 22, state [0 0 0 0 0 0 0 1]\n",
      "instance 0, ep 23, state [1 0 0 1 0 0 0 0]\n",
      "instance 0, ep 24, state [1 0 1 1 0 0 0 1]\n",
      "instance 0, ep 25, state [0 0 1 0 0 0 0 1]\n",
      "---------------------------------------------------\n",
      "0 500  | a  [1 0 0 0 1 1 0 0]  | s'  [1 0 1 0 0 1 0 1]  | r  2    | WI  [  0.047   0.046  -0.      0.044   0.048   0.048 -10.    -10.   ]\n",
      "instance 0, ep 26, state [0 1 0 1 0 0 1 1]\n",
      "instance 0, ep 27, state [1 0 0 0 1 0 1 0]\n",
      "instance 0, ep 28, state [1 0 1 0 0 1 0 0]\n",
      "instance 0, ep 29, state [1 1 0 0 0 1 0 0]\n",
      "first state [1 1 1 0 0 1 1 1]\n",
      "---------------------------------------------------\n",
      "1 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 1 1 0 1 1 1 0]  | r  6    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 1, ep 1, state [0 1 1 0 0 1 0 0]\n",
      "instance 1, ep 2, state [0 0 0 1 1 0 1 1]\n",
      "instance 1, ep 3, state [0 0 0 0 1 1 0 1]\n",
      "instance 1, ep 4, state [1 0 1 1 1 0 1 1]\n",
      "instance 1, ep 5, state [1 1 1 1 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "1 100  | a  [0 0 0 0 0 1 1 1]  | s'  [1 0 0 0 1 1 0 0]  | r  6    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 1, ep 6, state [0 1 0 1 0 1 1 1]\n",
      "instance 1, ep 7, state [0 1 1 0 1 0 0 1]\n",
      "instance 1, ep 8, state [0 0 0 0 0 1 1 1]\n",
      "instance 1, ep 9, state [1 1 1 0 0 0 0 1]\n",
      "instance 1, ep 10, state [0 1 1 1 0 0 1 1]\n",
      "---------------------------------------------------\n",
      "1 200  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 0 0 1 0 1 1]  | r  5    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 1, ep 11, state [0 1 0 0 0 0 1 1]\n",
      "instance 1, ep 12, state [0 1 1 1 0 0 0 0]\n",
      "instance 1, ep 13, state [0 1 0 0 0 0 0 0]\n",
      "instance 1, ep 14, state [0 0 0 1 0 0 0 1]\n",
      "instance 1, ep 15, state [0 1 1 0 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "1 300  | a  [1 0 0 1 0 0 0 1]  | s'  [0 0 0 1 1 0 0 0]  | r  4    | WI  [ 0.005 -0.    -0.     0.001 -0.    -0.    -0.    -0.   ]\n",
      "instance 1, ep 16, state [1 0 1 0 1 0 1 1]\n",
      "instance 1, ep 17, state [0 0 0 0 0 1 1 1]\n",
      "instance 1, ep 18, state [1 1 1 1 0 0 0 0]\n",
      "instance 1, ep 19, state [0 0 1 1 0 0 0 0]\n",
      "instance 1, ep 20, state [0 1 0 1 1 0 1 1]\n",
      "---------------------------------------------------\n",
      "1 400  | a  [1 0 1 0 0 1 0 0]  | s'  [0 0 1 1 1 0 0 0]  | r  5    | WI  [ 0.003 -0.     0.003 -0.    -0.     0.014 -0.    -0.   ]\n",
      "instance 1, ep 21, state [0 0 1 1 1 1 1 1]\n",
      "instance 1, ep 22, state [1 1 1 0 1 1 0 1]\n",
      "instance 1, ep 23, state [0 1 1 1 0 1 1 0]\n",
      "instance 1, ep 24, state [0 1 0 0 1 0 1 0]\n",
      "instance 1, ep 25, state [1 0 1 0 1 0 1 1]\n",
      "---------------------------------------------------\n",
      "1 500  | a  [0 1 0 1 0 1 0 0]  | s'  [1 0 0 0 0 1 1 1]  | r  5    | WI  [-0.     0.017 -0.     0.018 -0.     0.02  -0.    -0.   ]\n",
      "instance 1, ep 26, state [1 1 0 1 0 0 0 1]\n",
      "instance 1, ep 27, state [1 0 1 0 0 0 0 0]\n",
      "instance 1, ep 28, state [1 1 0 0 0 1 0 1]\n",
      "instance 1, ep 29, state [1 1 1 0 1 1 1 0]\n",
      "first state [1 1 0 1 0 0 1 1]\n",
      "---------------------------------------------------\n",
      "2 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 1 1 0 1 1 1]  | r  5    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 2, ep 1, state [0 1 0 0 0 0 0 1]\n",
      "instance 2, ep 2, state [1 0 1 1 0 1 1 0]\n",
      "instance 2, ep 3, state [0 1 1 0 1 1 1 1]\n",
      "instance 2, ep 4, state [1 0 0 1 1 0 1 1]\n",
      "instance 2, ep 5, state [0 1 1 1 1 0 1 0]\n",
      "---------------------------------------------------\n",
      "2 100  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 1 1 0 1 1 0]  | r  5    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 2, ep 6, state [0 1 0 0 1 0 0 1]\n",
      "instance 2, ep 7, state [1 0 1 0 1 1 1 1]\n",
      "instance 2, ep 8, state [1 1 0 0 1 0 1 0]\n",
      "instance 2, ep 9, state [1 0 0 1 1 1 0 0]\n",
      "instance 2, ep 10, state [1 0 1 1 1 1 1 1]\n",
      "---------------------------------------------------\n",
      "2 200  | a  [0 0 0 0 0 1 1 1]  | s'  [1 0 1 1 1 1 1 1]  | r  7    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 2, ep 11, state [0 0 0 0 1 1 0 0]\n",
      "instance 2, ep 12, state [0 1 1 0 1 1 0 1]\n",
      "instance 2, ep 13, state [1 0 0 0 0 1 1 0]\n",
      "instance 2, ep 14, state [0 0 0 1 0 0 0 1]\n",
      "instance 2, ep 15, state [0 1 0 1 1 0 0 1]\n",
      "---------------------------------------------------\n",
      "2 300  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 0 1 1 1 1 1]  | r  4    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 2, ep 16, state [1 0 0 1 1 0 1 0]\n",
      "instance 2, ep 17, state [1 0 0 0 1 0 0 0]\n",
      "instance 2, ep 18, state [1 1 0 1 1 1 0 0]\n",
      "instance 2, ep 19, state [0 0 0 1 0 0 1 0]\n",
      "instance 2, ep 20, state [1 1 0 1 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "2 400  | a  [0 0 0 0 0 1 1 1]  | s'  [1 0 1 1 1 1 1 0]  | r  5    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 2, ep 21, state [1 0 0 0 1 0 1 1]\n",
      "instance 2, ep 22, state [1 1 1 1 0 1 0 0]\n",
      "instance 2, ep 23, state [1 1 0 1 1 1 1 1]\n",
      "instance 2, ep 24, state [1 1 1 1 1 0 0 0]\n",
      "instance 2, ep 25, state [0 1 1 1 0 1 1 1]\n",
      "---------------------------------------------------\n",
      "2 500  | a  [1 0 0 0 0 0 1 1]  | s'  [1 0 1 1 0 0 1 0]  | r  6    | WI  [ 0.001 -0.    -0.    -0.    -0.    -0.    -0.    -0.   ]\n",
      "instance 2, ep 26, state [1 1 0 1 0 0 1 0]\n",
      "instance 2, ep 27, state [1 0 1 0 1 1 0 1]\n",
      "instance 2, ep 28, state [1 0 0 0 1 1 1 0]\n",
      "instance 2, ep 29, state [0 1 0 0 1 1 1 1]\n",
      "first state [1 1 1 1 1 1 1 0]\n",
      "---------------------------------------------------\n",
      "3 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 0 1 1 0 1 1]  | r  7    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 3, ep 1, state [1 0 1 1 1 0 0 0]\n",
      "instance 3, ep 2, state [1 0 0 0 1 1 0 0]\n",
      "instance 3, ep 3, state [1 1 1 0 1 0 1 1]\n",
      "instance 3, ep 4, state [0 0 1 1 1 1 1 1]\n",
      "instance 3, ep 5, state [0 1 0 0 1 0 0 0]\n",
      "---------------------------------------------------\n",
      "3 100  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 0 0 0 0 1 1]  | r  2    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 3, ep 6, state [1 0 0 0 0 0 0 1]\n",
      "instance 3, ep 7, state [0 0 0 0 1 1 0 0]\n",
      "instance 3, ep 8, state [0 1 1 1 0 1 0 0]\n",
      "instance 3, ep 9, state [0 0 1 1 0 1 1 1]\n",
      "instance 3, ep 10, state [1 1 1 1 0 0 1 0]\n",
      "---------------------------------------------------\n",
      "3 200  | a  [0 0 0 0 0 1 1 1]  | s'  [0 1 0 1 0 0 1 1]  | r  5    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 3, ep 11, state [1 0 0 0 0 1 1 1]\n",
      "instance 3, ep 12, state [1 0 1 1 1 0 1 0]\n",
      "instance 3, ep 13, state [1 1 0 1 1 0 1 1]\n",
      "instance 3, ep 14, state [0 0 0 0 0 1 0 0]\n",
      "instance 3, ep 15, state [1 1 0 0 0 1 0 1]\n",
      "---------------------------------------------------\n",
      "3 300  | a  [0 0 1 1 1 0 0 0]  | s'  [1 0 0 1 0 0 0 1]  | r  4    | WI  [ -0.     -0.      0.02    0.018   0.023 -10.     -0.     -0.   ]\n",
      "instance 3, ep 16, state [1 0 1 1 0 1 1 1]\n",
      "instance 3, ep 17, state [1 1 1 1 1 1 1 0]\n",
      "instance 3, ep 18, state [0 0 0 0 1 0 1 0]\n",
      "instance 3, ep 19, state [1 1 0 1 0 1 0 1]\n",
      "instance 3, ep 20, state [0 1 1 0 0 0 0 1]\n",
      "---------------------------------------------------\n",
      "3 400  | a  [1 0 0 1 1 0 0 0]  | s'  [1 0 0 1 1 0 0 1]  | r  3    | WI  [  0.047  -0.     -0.      0.047   0.047 -10.    -10.     -0.   ]\n",
      "instance 3, ep 21, state [0 0 0 1 0 0 0 0]\n",
      "instance 3, ep 22, state [1 0 0 1 1 0 1 1]\n",
      "instance 3, ep 23, state [0 1 1 0 0 0 1 1]\n",
      "instance 3, ep 24, state [1 0 1 1 0 0 1 0]\n",
      "instance 3, ep 25, state [1 0 0 0 0 1 0 1]\n",
      "---------------------------------------------------\n",
      "3 500  | a  [0 0 1 0 1 0 1 0]  | s'  [0 0 1 0 1 1 0 0]  | r  3    | WI  [ -0.      0.086   0.086   0.085   0.086 -10.      0.087  -0.   ]\n",
      "instance 3, ep 26, state [1 1 0 1 1 0 0 1]\n",
      "instance 3, ep 27, state [1 0 1 1 1 1 1 0]\n",
      "instance 3, ep 28, state [0 0 1 1 0 1 1 1]\n",
      "instance 3, ep 29, state [0 1 0 0 0 0 0 1]\n",
      "first state [1 1 1 0 1 1 1 0]\n",
      "---------------------------------------------------\n",
      "4 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 0 0 1 1 1 0]  | r  6    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 4, ep 1, state [0 0 0 1 0 1 0 0]\n",
      "instance 4, ep 2, state [1 1 0 1 1 0 1 1]\n",
      "instance 4, ep 3, state [1 0 1 0 0 0 0 1]\n",
      "instance 4, ep 4, state [1 1 0 0 0 1 0 1]\n",
      "instance 4, ep 5, state [1 0 1 0 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "4 100  | a  [0 0 0 0 0 1 1 1]  | s'  [1 0 1 0 1 1 0 0]  | r  4    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 4, ep 6, state [1 1 0 1 1 1 0 1]\n",
      "instance 4, ep 7, state [1 0 0 1 0 1 0 0]\n",
      "instance 4, ep 8, state [1 0 1 0 1 0 0 1]\n",
      "instance 4, ep 9, state [0 1 0 1 0 1 0 0]\n",
      "instance 4, ep 10, state [0 0 1 0 1 0 0 1]\n",
      "---------------------------------------------------\n",
      "4 200  | a  [0 1 0 1 0 0 0 1]  | s'  [0 0 0 1 0 0 1 0]  | r  3    | WI  [-0.     0.005 -0.     0.001 -0.    -0.    -0.    -0.   ]\n",
      "instance 4, ep 11, state [1 0 0 0 1 1 0 1]\n",
      "instance 4, ep 12, state [1 1 1 0 0 0 0 1]\n",
      "instance 4, ep 13, state [1 0 0 0 1 0 1 0]\n",
      "instance 4, ep 14, state [0 1 1 0 1 1 1 0]\n",
      "instance 4, ep 15, state [1 0 1 0 0 0 1 0]\n",
      "---------------------------------------------------\n",
      "4 300  | a  [0 1 0 1 0 0 0 1]  | s'  [1 0 1 0 0 0 0 0]  | r  3    | WI  [-0.e+00  3.e-03 -0.e+00  5.e-03 -1.e+01 -0.e+00 -0.e+00  2.e-03]\n",
      "instance 4, ep 16, state [1 1 0 1 0 1 0 1]\n",
      "instance 4, ep 17, state [1 1 1 0 1 1 1 0]\n",
      "instance 4, ep 18, state [1 1 1 0 1 0 1 0]\n",
      "instance 4, ep 19, state [1 1 0 1 0 1 1 1]\n",
      "instance 4, ep 20, state [1 1 0 0 1 1 1 1]\n",
      "---------------------------------------------------\n",
      "4 400  | a  [0 0 0 1 0 0 1 1]  | s'  [1 0 0 0 1 1 1 1]  | r  6    | WI  [ -0.    -0.   -10.     0.03  -0.    -0.    -0.    -0.  ]\n",
      "instance 4, ep 21, state [0 1 0 1 0 0 0 0]\n",
      "instance 4, ep 22, state [1 0 0 0 0 0 0 1]\n",
      "instance 4, ep 23, state [1 1 0 0 1 1 0 0]\n",
      "instance 4, ep 24, state [0 0 0 1 1 1 1 1]\n",
      "instance 4, ep 25, state [1 1 0 0 0 1 1 0]\n",
      "---------------------------------------------------\n",
      "4 500  | a  [0 0 1 1 0 0 0 1]  | s'  [1 0 1 0 0 0 0 0]  | r  4    | WI  [-10.     -0.      0.075   0.076 -10.     -0.     -0.      0.075]\n",
      "instance 4, ep 26, state [1 0 1 0 0 0 0 0]\n",
      "instance 4, ep 27, state [0 1 1 0 1 1 0 0]\n",
      "instance 4, ep 28, state [0 0 1 0 1 1 0 1]\n",
      "instance 4, ep 29, state [0 1 0 1 1 0 1 1]\n",
      "first state [0 0 1 1 0 1 0 1]\n",
      "---------------------------------------------------\n",
      "5 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 1 0 0 0 1 1 1]  | r  4    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 5, ep 1, state [0 0 1 0 1 1 1 0]\n",
      "instance 5, ep 2, state [0 0 1 1 1 1 1 1]\n",
      "instance 5, ep 3, state [0 1 0 1 1 1 0 0]\n",
      "instance 5, ep 4, state [0 0 0 1 1 0 0 0]\n",
      "instance 5, ep 5, state [1 1 1 0 1 1 0 1]\n",
      "---------------------------------------------------\n",
      "5 100  | a  [0 0 0 0 0 1 1 1]  | s'  [1 0 1 0 0 1 0 1]  | r  6    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 5, ep 6, state [0 1 0 1 1 1 1 0]\n",
      "instance 5, ep 7, state [0 0 0 1 0 1 1 1]\n",
      "instance 5, ep 8, state [0 1 1 0 1 1 0 1]\n",
      "instance 5, ep 9, state [0 0 0 0 0 0 1 1]\n",
      "instance 5, ep 10, state [1 0 0 1 0 0 1 0]\n",
      "---------------------------------------------------\n",
      "5 200  | a  [0 0 0 0 0 1 1 1]  | s'  [1 1 0 0 0 1 1 1]  | r  3    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 5, ep 11, state [1 1 0 0 1 0 0 1]\n",
      "instance 5, ep 12, state [0 1 1 0 0 0 0 0]\n",
      "instance 5, ep 13, state [1 0 1 1 1 1 0 1]\n",
      "instance 5, ep 14, state [1 0 0 1 0 0 0 0]\n",
      "instance 5, ep 15, state [1 1 1 0 0 0 0 0]\n",
      "---------------------------------------------------\n",
      "5 300  | a  [0 0 0 1 1 0 0 1]  | s'  [1 0 0 0 1 0 0 1]  | r  3    | WI  [-0.    -0.    -0.     0.004  0.001 -0.    -0.    -0.   ]\n",
      "instance 5, ep 16, state [1 0 1 0 0 0 1 1]\n",
      "instance 5, ep 17, state [1 0 0 1 0 1 0 0]\n",
      "instance 5, ep 18, state [0 0 1 0 0 0 0 1]\n",
      "instance 5, ep 19, state [1 1 1 0 1 0 0 1]\n",
      "instance 5, ep 20, state [0 1 0 1 1 1 1 1]\n",
      "---------------------------------------------------\n",
      "5 400  | a  [1 0 1 0 0 0 0 1]  | s'  [0 1 0 0 0 1 1 1]  | r  6    | WI  [ 0.019 -0.     0.016 -0.    -0.    -0.    -0.    -0.   ]\n",
      "instance 5, ep 21, state [0 1 0 1 1 1 0 0]\n",
      "instance 5, ep 22, state [1 0 0 0 1 1 0 0]\n",
      "instance 5, ep 23, state [0 1 1 0 0 0 1 1]\n",
      "instance 5, ep 24, state [0 0 0 1 0 1 1 0]\n",
      "instance 5, ep 25, state [0 0 1 1 1 1 0 1]\n",
      "---------------------------------------------------\n",
      "5 500  | a  [1 1 0 0 0 0 1 0]  | s'  [1 1 1 0 0 1 0 1]  | r  5    | WI  [  0.043   0.04   -0.    -10.     -0.    -10.      0.039  -0.   ]\n",
      "instance 5, ep 26, state [1 0 1 1 1 1 1 1]\n",
      "instance 5, ep 27, state [0 0 1 0 0 0 0 1]\n",
      "instance 5, ep 28, state [1 0 0 0 1 1 0 1]\n",
      "instance 5, ep 29, state [1 1 1 0 1 0 1 1]\n",
      "first state [0 1 0 1 0 1 0 1]\n",
      "---------------------------------------------------\n",
      "6 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 0 0 0 0 1 0]  | r  4    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 6, ep 1, state [1 1 1 1 1 0 1 0]\n",
      "instance 6, ep 2, state [0 0 0 1 1 1 1 0]\n",
      "instance 6, ep 3, state [0 0 0 0 0 1 1 1]\n",
      "instance 6, ep 4, state [1 1 0 1 1 0 0 1]\n",
      "instance 6, ep 5, state [0 1 1 0 0 0 0 0]\n",
      "---------------------------------------------------\n",
      "6 100  | a  [0 0 0 0 0 1 1 1]  | s'  [1 0 0 0 0 1 1 0]  | r  2    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 6, ep 6, state [1 0 1 0 1 0 0 1]\n",
      "instance 6, ep 7, state [1 0 1 0 0 0 0 1]\n",
      "instance 6, ep 8, state [0 0 1 1 0 1 0 1]\n",
      "instance 6, ep 9, state [1 1 0 0 0 0 0 1]\n",
      "instance 6, ep 10, state [0 0 1 0 1 0 0 0]\n",
      "---------------------------------------------------\n",
      "6 200  | a  [0 0 0 0 0 1 1 1]  | s'  [1 0 1 0 1 0 0 0]  | r  2    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 6, ep 11, state [0 1 0 1 0 0 1 0]\n",
      "instance 6, ep 12, state [1 1 1 1 0 0 0 1]\n",
      "instance 6, ep 13, state [1 0 1 0 1 0 1 1]\n",
      "instance 6, ep 14, state [0 0 0 0 0 1 1 1]\n",
      "instance 6, ep 15, state [0 1 1 0 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "6 300  | a  [0 0 0 1 0 0 1 1]  | s'  [1 0 1 1 1 1 0 1]  | r  4    | WI  [-1.e+01 -0.e+00 -0.e+00  1.e-03 -0.e+00 -0.e+00 -0.e+00 -0.e+00]\n",
      "instance 6, ep 16, state [0 0 1 1 1 0 0 1]\n",
      "instance 6, ep 17, state [1 0 1 1 0 0 1 0]\n",
      "instance 6, ep 18, state [0 0 0 1 1 0 1 1]\n",
      "instance 6, ep 19, state [1 0 0 1 1 0 0 0]\n",
      "instance 6, ep 20, state [1 1 0 0 1 1 0 1]\n",
      "---------------------------------------------------\n",
      "6 400  | a  [0 0 1 1 0 0 0 1]  | s'  [1 0 1 1 0 1 0 1]  | r  5    | WI  [-0.    -0.     0.007  0.007 -0.    -0.    -0.    -0.   ]\n",
      "instance 6, ep 21, state [1 0 1 0 1 1 1 1]\n",
      "instance 6, ep 22, state [0 1 1 0 1 1 0 1]\n",
      "instance 6, ep 23, state [1 0 1 0 0 0 1 1]\n",
      "instance 6, ep 24, state [0 0 1 0 1 1 1 1]\n",
      "instance 6, ep 25, state [0 1 1 1 0 1 0 0]\n",
      "---------------------------------------------------\n",
      "6 500  | a  [1 0 0 0 1 0 1 0]  | s'  [0 0 0 0 1 1 0 0]  | r  4    | WI  [  0.018  -0.    -10.     -0.      0.024  -0.      0.024  -0.   ]\n",
      "instance 6, ep 26, state [0 1 1 1 1 0 1 0]\n",
      "instance 6, ep 27, state [1 1 1 1 0 0 1 0]\n",
      "instance 6, ep 28, state [0 0 1 0 0 1 1 0]\n",
      "instance 6, ep 29, state [0 0 0 0 1 1 1 0]\n",
      "first state [1 0 1 1 1 1 1 0]\n",
      "---------------------------------------------------\n",
      "7 0  | a  [0 0 0 0 0 1 1 1]  | s'  [1 0 1 1 1 0 1 0]  | r  6    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 7, ep 1, state [0 0 1 0 1 1 1 1]\n",
      "instance 7, ep 2, state [0 1 1 0 0 1 1 1]\n",
      "instance 7, ep 3, state [1 1 1 0 0 0 1 1]\n",
      "instance 7, ep 4, state [1 0 1 1 1 1 0 1]\n",
      "instance 7, ep 5, state [0 0 0 1 1 1 1 1]\n",
      "---------------------------------------------------\n",
      "7 100  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 0 0 0 1 0 0]  | r  5    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 7, ep 6, state [1 0 0 0 0 0 0 0]\n",
      "instance 7, ep 7, state [1 0 0 0 1 0 0 1]\n",
      "instance 7, ep 8, state [0 0 0 0 0 0 1 1]\n",
      "instance 7, ep 9, state [1 0 1 0 0 1 0 0]\n",
      "instance 7, ep 10, state [1 1 0 1 1 0 0 0]\n",
      "---------------------------------------------------\n",
      "7 200  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 0 0 1 1 1 1]  | r  4    | WI  [ -0.  -0. -10.  -0.  -0.  -0.  -0.  -0.]\n",
      "instance 7, ep 11, state [0 0 1 1 1 0 1 1]\n",
      "instance 7, ep 12, state [1 0 1 0 0 0 1 1]\n",
      "instance 7, ep 13, state [0 0 0 0 0 0 1 0]\n",
      "instance 7, ep 14, state [0 0 1 1 1 0 1 0]\n",
      "instance 7, ep 15, state [1 1 1 1 1 0 1 0]\n",
      "---------------------------------------------------\n",
      "7 300  | a  [0 0 0 0 0 1 1 1]  | s'  [1 0 1 0 1 0 1 0]  | r  6    | WI  [ -0.     -0.     -0.    -10.     -0.      0.028  -0.     -0.   ]\n",
      "instance 7, ep 16, state [1 0 0 0 0 0 1 0]\n",
      "instance 7, ep 17, state [0 1 0 1 1 1 1 0]\n",
      "instance 7, ep 18, state [1 0 0 1 0 1 1 1]\n",
      "instance 7, ep 19, state [1 0 0 1 0 1 1 1]\n",
      "instance 7, ep 20, state [0 0 0 0 1 0 0 0]\n",
      "---------------------------------------------------\n",
      "7 400  | a  [1 0 1 1 0 0 0 0]  | s'  [1 0 1 0 1 0 1 0]  | r  1    | WI  [ 2.3e-02  3.0e-03  1.9e-02  1.8e-02 -0.0e+00 -1.0e+01 -0.0e+00 -0.0e+00]\n",
      "instance 7, ep 21, state [1 1 0 0 0 0 1 1]\n",
      "instance 7, ep 22, state [0 0 1 0 1 0 0 0]\n",
      "instance 7, ep 23, state [1 1 0 0 0 0 0 0]\n",
      "instance 7, ep 24, state [1 0 0 1 0 1 0 1]\n",
      "instance 7, ep 25, state [1 1 1 0 1 0 0 0]\n",
      "---------------------------------------------------\n",
      "7 500  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 0 0 0 0 1 1]  | r  4    | WI  [-10.     -0.     -0.    -10.     -0.      0.034  -0.      0.03 ]\n",
      "instance 7, ep 26, state [1 0 1 1 1 1 0 0]\n",
      "instance 7, ep 27, state [0 0 0 0 0 1 1 0]\n",
      "instance 7, ep 28, state [1 0 0 1 0 0 1 1]\n",
      "instance 7, ep 29, state [1 1 1 0 0 0 0 1]\n",
      "first state [1 0 0 1 0 1 0 0]\n",
      "---------------------------------------------------\n",
      "8 0  | a  [0 0 0 0 0 1 1 1]  | s'  [1 0 0 1 0 1 0 1]  | r  3    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 8, ep 1, state [1 1 1 1 0 0 1 1]\n",
      "instance 8, ep 2, state [0 1 0 0 0 1 1 0]\n",
      "instance 8, ep 3, state [1 0 0 0 0 0 1 1]\n",
      "instance 8, ep 4, state [1 0 0 0 0 1 0 1]\n",
      "instance 8, ep 5, state [1 0 1 1 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "8 100  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 1 0 1 1 0 0]  | r  5    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 8, ep 6, state [0 0 1 0 1 1 0 0]\n",
      "instance 8, ep 7, state [1 1 1 0 0 0 0 1]\n",
      "instance 8, ep 8, state [1 1 1 1 0 0 1 0]\n",
      "instance 8, ep 9, state [1 1 0 1 1 1 1 1]\n",
      "instance 8, ep 10, state [0 0 1 1 0 0 1 1]\n",
      "---------------------------------------------------\n",
      "8 200  | a  [0 1 0 0 1 0 0 1]  | s'  [0 1 0 1 1 0 0 1]  | r  4    | WI  [-0.     0.001 -0.    -0.     0.003 -0.    -0.    -0.   ]\n",
      "instance 8, ep 11, state [1 1 0 0 1 0 0 0]\n",
      "instance 8, ep 12, state [1 1 0 0 1 1 0 0]\n",
      "instance 8, ep 13, state [0 1 0 0 1 1 0 1]\n",
      "instance 8, ep 14, state [0 1 0 1 0 1 1 1]\n",
      "instance 8, ep 15, state [1 1 0 0 1 0 1 1]\n",
      "---------------------------------------------------\n",
      "8 300  | a  [0 0 1 1 0 1 0 0]  | s'  [0 0 1 1 0 0 1 0]  | r  5    | WI  [-0.    -0.     0.009  0.008 -0.     0.006 -0.    -0.   ]\n",
      "instance 8, ep 16, state [0 1 0 1 0 0 1 1]\n",
      "instance 8, ep 17, state [1 1 0 1 0 1 1 1]\n",
      "instance 8, ep 18, state [1 0 1 0 1 0 1 1]\n",
      "instance 8, ep 19, state [0 0 1 0 0 0 0 1]\n",
      "instance 8, ep 20, state [1 0 0 0 0 0 0 0]\n",
      "---------------------------------------------------\n",
      "8 400  | a  [0 1 1 0 0 0 0 1]  | s'  [0 0 1 0 0 0 0 1]  | r  1    | WI  [ -0.      0.03    0.032   0.027 -10.    -10.      0.027   0.029]\n",
      "instance 8, ep 21, state [1 0 1 1 1 1 1 1]\n",
      "instance 8, ep 22, state [1 1 1 1 0 0 0 1]\n",
      "instance 8, ep 23, state [1 1 1 0 0 1 1 1]\n",
      "instance 8, ep 24, state [0 1 1 1 1 1 0 1]\n",
      "instance 8, ep 25, state [1 1 1 0 0 1 1 1]\n",
      "---------------------------------------------------\n",
      "8 500  | a  [0 0 0 1 1 0 0 1]  | s'  [0 1 1 1 0 1 0 0]  | r  6    | WI  [ -0.     -0.    -10.      0.089   0.092  -0.     -0.     -0.   ]\n",
      "instance 8, ep 26, state [0 1 1 1 0 1 1 0]\n",
      "instance 8, ep 27, state [1 1 1 0 0 0 0 0]\n",
      "instance 8, ep 28, state [1 0 1 1 1 1 1 1]\n",
      "instance 8, ep 29, state [0 0 1 1 0 1 1 0]\n",
      "first state [0 1 0 0 0 0 1 0]\n",
      "---------------------------------------------------\n",
      "9 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 1 0 0 1 0 1]  | r  2    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 9, ep 1, state [1 1 0 1 1 1 0 0]\n",
      "instance 9, ep 2, state [1 1 1 0 1 0 0 0]\n",
      "instance 9, ep 3, state [1 0 0 1 0 0 0 1]\n",
      "instance 9, ep 4, state [1 0 1 1 0 1 1 1]\n",
      "instance 9, ep 5, state [0 1 1 0 0 0 0 1]\n",
      "---------------------------------------------------\n",
      "9 100  | a  [0 0 0 0 0 1 1 1]  | s'  [1 1 1 0 0 1 1 1]  | r  3    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 9, ep 6, state [0 0 1 0 1 0 0 0]\n",
      "instance 9, ep 7, state [0 0 1 1 0 1 1 1]\n",
      "instance 9, ep 8, state [0 0 0 1 1 0 0 1]\n",
      "instance 9, ep 9, state [1 1 1 0 1 1 0 1]\n",
      "instance 9, ep 10, state [1 0 1 1 1 0 0 1]\n",
      "---------------------------------------------------\n",
      "9 200  | a  [0 0 0 0 0 1 1 1]  | s'  [0 1 1 1 0 0 1 1]  | r  5    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 9, ep 11, state [0 1 1 0 1 1 0 1]\n",
      "instance 9, ep 12, state [1 1 1 0 1 1 1 1]\n",
      "instance 9, ep 13, state [0 1 0 0 0 1 1 1]\n",
      "instance 9, ep 14, state [1 1 1 0 0 0 1 1]\n",
      "instance 9, ep 15, state [0 0 1 0 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "9 300  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 1 0 1 1 0 1]  | r  3    | WI  [ -0.  -0.  -0. -10.  -0.  -0.  -0.  -0.]\n",
      "instance 9, ep 16, state [1 1 1 1 0 1 1 1]\n",
      "instance 9, ep 17, state [0 1 1 0 0 1 0 0]\n",
      "instance 9, ep 18, state [0 1 1 1 0 1 1 1]\n",
      "instance 9, ep 19, state [1 0 1 0 1 0 0 0]\n",
      "instance 9, ep 20, state [1 0 1 0 0 1 0 0]\n",
      "---------------------------------------------------\n",
      "9 400  | a  [0 0 0 1 0 0 1 1]  | s'  [1 0 0 1 0 1 0 0]  | r  3    | WI  [-0.e+00 -0.e+00 -0.e+00  1.e-03 -1.e+01 -0.e+00 -0.e+00 -0.e+00]\n",
      "instance 9, ep 21, state [1 0 0 0 1 1 1 1]\n",
      "instance 9, ep 22, state [0 0 1 0 0 0 0 1]\n",
      "instance 9, ep 23, state [0 1 0 1 0 0 1 1]\n",
      "instance 9, ep 24, state [0 0 0 0 0 0 0 0]\n",
      "instance 9, ep 25, state [1 1 1 0 0 1 0 0]\n",
      "---------------------------------------------------\n",
      "9 500  | a  [0 0 0 1 1 0 1 0]  | s'  [0 0 1 1 1 1 0 0]  | r  4    | WI  [-0.0e+00 -0.0e+00 -0.0e+00  9.0e-03  1.1e-02 -1.0e+01  1.1e-02 -0.0e+00]\n",
      "instance 9, ep 26, state [1 1 1 0 0 1 0 1]\n",
      "instance 9, ep 27, state [1 1 0 0 1 1 1 0]\n",
      "instance 9, ep 28, state [0 1 1 1 0 1 1 1]\n",
      "instance 9, ep 29, state [0 0 1 0 0 1 0 1]\n"
     ]
    }
   ],
   "source": [
    "# Run UCWhittle (UCB method) with norm_confidence switched off.\n",
    "# Python's and NumPy's global RNGs are both reset to `seed` right before the\n",
    "# call, the same way the norm_confidence=True cell does, so the two runs start\n",
    "# from an identical random state.\n",
    "random.seed(seed)\n",
    "np.random.seed(seed)\n",
    "rewards_without_norm = UCWhittle(\n",
    "    simulator,\n",
    "    n_episodes,\n",
    "    n_epochs,\n",
    "    discount,\n",
    "    alpha=alpha,\n",
    "    method='UCB',\n",
    "    norm_confidence=False,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "solving UCWhittle using method: UCB\n",
      "first state [0 1 1 1 1 1 1 1]\n",
      "---------------------------------------------------\n",
      "0 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 1 0 0 1 0 1]  | r  7    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 0, ep 1, state [0 0 0 1 1 1 0 1]\n",
      "instance 0, ep 2, state [0 1 1 1 0 0 0 1]\n",
      "instance 0, ep 3, state [0 0 0 1 0 1 1 0]\n",
      "instance 0, ep 4, state [1 1 0 1 1 1 1 1]\n",
      "instance 0, ep 5, state [0 0 0 0 0 1 0 0]\n",
      "---------------------------------------------------\n",
      "0 100  | a  [0 1 1 0 0 0 0 1]  | s'  [0 0 0 0 0 0 0 1]  | r  1    | WI  [  0.283   0.648   0.578   0.398 -10.      0.422   0.47    0.55 ]\n",
      "instance 0, ep 6, state [0 1 0 1 0 0 0 0]\n",
      "instance 0, ep 7, state [1 0 1 0 0 0 0 1]\n",
      "instance 0, ep 8, state [0 0 0 0 1 1 0 1]\n",
      "instance 0, ep 9, state [0 1 0 0 0 1 1 1]\n",
      "instance 0, ep 10, state [0 1 1 0 0 0 1 0]\n",
      "---------------------------------------------------\n",
      "0 200  | a  [1 0 0 1 0 0 0 1]  | s'  [1 0 1 1 0 0 0 0]  | r  3    | WI  [  0.639   0.505   0.207   0.54  -10.    -10.    -10.      0.528]\n",
      "instance 0, ep 11, state [1 0 1 1 0 1 1 1]\n",
      "instance 0, ep 12, state [0 0 1 1 0 0 1 0]\n",
      "instance 0, ep 13, state [1 1 1 1 0 1 1 0]\n",
      "instance 0, ep 14, state [0 1 1 0 1 1 1 1]\n",
      "instance 0, ep 15, state [0 0 1 1 1 0 1 1]\n",
      "---------------------------------------------------\n",
      "0 300  | a  [1 1 0 0 0 1 0 0]  | s'  [1 1 1 0 0 1 0 1]  | r  5    | WI  [  0.497   0.566   0.277   0.364   0.472   0.528 -10.    -10.   ]\n",
      "instance 0, ep 16, state [1 1 1 1 0 1 1 0]\n",
      "instance 0, ep 17, state [0 0 0 1 0 0 0 0]\n",
      "instance 0, ep 18, state [0 1 1 0 1 1 1 0]\n",
      "instance 0, ep 19, state [1 1 0 1 0 0 1 1]\n",
      "instance 0, ep 20, state [1 0 0 1 1 0 1 0]\n",
      "---------------------------------------------------\n",
      "0 400  | a  [0 1 1 0 0 0 0 1]  | s'  [1 0 0 0 1 0 0 0]  | r  4    | WI  [  0.408   0.545   0.562   0.397   0.437   0.52  -10.      0.581]\n",
      "instance 0, ep 21, state [0 1 1 1 0 1 1 1]\n",
      "instance 0, ep 22, state [0 0 0 0 0 0 0 1]\n",
      "instance 0, ep 23, state [1 0 0 1 0 0 0 0]\n",
      "instance 0, ep 24, state [1 0 1 1 0 0 0 1]\n",
      "instance 0, ep 25, state [0 0 1 0 0 0 0 1]\n",
      "---------------------------------------------------\n",
      "0 500  | a  [0 1 0 1 1 0 0 0]  | s'  [0 1 0 0 1 0 0 1]  | r  2    | WI  [  0.532   0.564   0.363   0.581   0.562 -10.    -10.    -10.   ]\n",
      "instance 0, ep 26, state [0 1 0 1 0 0 1 1]\n",
      "instance 0, ep 27, state [1 0 0 0 1 0 1 0]\n",
      "instance 0, ep 28, state [1 0 1 0 0 1 0 0]\n",
      "instance 0, ep 29, state [1 1 0 0 0 1 0 0]\n",
      "first state [1 1 1 0 0 1 1 1]\n",
      "---------------------------------------------------\n",
      "1 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 1 0 0 1 1 1]  | r  6    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 1, ep 1, state [0 1 1 0 0 1 0 0]\n",
      "instance 1, ep 2, state [0 0 0 1 1 0 1 1]\n",
      "instance 1, ep 3, state [0 0 0 0 1 1 0 1]\n",
      "instance 1, ep 4, state [1 0 1 1 1 0 1 1]\n",
      "instance 1, ep 5, state [1 1 1 1 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "1 100  | a  [1 0 0 0 0 1 0 1]  | s'  [1 0 0 1 1 1 0 0]  | r  6    | WI  [  0.35    0.162   0.02    0.152 -10.      0.377   0.183   0.759]\n",
      "instance 1, ep 6, state [0 1 0 1 0 1 1 1]\n",
      "instance 1, ep 7, state [0 1 1 0 1 0 0 1]\n",
      "instance 1, ep 8, state [0 0 0 0 0 1 1 1]\n",
      "instance 1, ep 9, state [1 1 1 0 0 0 0 1]\n",
      "instance 1, ep 10, state [0 1 1 1 0 0 1 1]\n",
      "---------------------------------------------------\n",
      "1 200  | a  [1 0 0 0 1 1 0 0]  | s'  [0 0 0 0 1 0 0 1]  | r  5    | WI  [  0.682   0.231   0.02    0.192   0.694   0.524 -10.    -10.   ]\n",
      "instance 1, ep 11, state [0 1 0 0 0 0 1 1]\n",
      "instance 1, ep 12, state [0 1 1 1 0 0 0 0]\n",
      "instance 1, ep 13, state [0 1 0 0 0 0 0 0]\n",
      "instance 1, ep 14, state [0 0 0 1 0 0 0 1]\n",
      "instance 1, ep 15, state [0 1 1 0 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "1 300  | a  [1 0 0 1 0 0 0 1]  | s'  [1 1 0 1 1 0 0 1]  | r  4    | WI  [  0.681   0.288   0.03    0.49  -10.      0.39  -10.      0.525]\n",
      "instance 1, ep 16, state [1 0 1 0 1 0 1 1]\n",
      "instance 1, ep 17, state [0 0 0 0 0 1 1 1]\n",
      "instance 1, ep 18, state [1 1 1 1 0 0 0 0]\n",
      "instance 1, ep 19, state [0 0 1 1 0 0 0 0]\n",
      "instance 1, ep 20, state [0 1 0 1 1 0 1 1]\n",
      "---------------------------------------------------\n",
      "1 400  | a  [1 0 0 0 0 1 1 0]  | s'  [1 0 0 0 1 0 0 0]  | r  5    | WI  [  0.718   0.344   0.332   0.254 -10.      0.504   0.478 -10.   ]\n",
      "instance 1, ep 21, state [0 0 1 1 1 1 1 1]\n",
      "instance 1, ep 22, state [1 1 1 0 1 1 0 1]\n",
      "instance 1, ep 23, state [0 1 1 1 0 1 1 0]\n",
      "instance 1, ep 24, state [0 1 0 0 1 0 1 0]\n",
      "instance 1, ep 25, state [1 0 1 0 1 0 1 1]\n",
      "---------------------------------------------------\n",
      "1 500  | a  [0 1 0 1 0 1 0 0]  | s'  [0 0 1 0 1 1 0 0]  | r  5    | WI  [  0.293   0.867   0.045   0.491   0.314   0.503 -10.    -10.   ]\n",
      "instance 1, ep 26, state [1 1 0 1 0 0 0 1]\n",
      "instance 1, ep 27, state [1 0 1 0 0 0 0 0]\n",
      "instance 1, ep 28, state [1 1 0 0 0 1 0 1]\n",
      "instance 1, ep 29, state [1 1 1 0 1 1 1 0]\n",
      "first state [1 1 0 1 0 0 1 1]\n",
      "---------------------------------------------------\n",
      "2 0  | a  [0 0 0 0 0 1 1 1]  | s'  [1 1 0 1 0 1 1 1]  | r  5    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 2, ep 1, state [0 1 0 0 0 0 0 1]\n",
      "instance 2, ep 2, state [1 0 1 1 0 1 1 0]\n",
      "instance 2, ep 3, state [0 1 1 0 1 1 1 1]\n",
      "instance 2, ep 4, state [1 0 0 1 1 0 1 1]\n",
      "instance 2, ep 5, state [0 1 1 1 1 0 1 0]\n",
      "---------------------------------------------------\n",
      "2 100  | a  [1 0 0 0 0 1 0 1]  | s'  [0 0 1 1 0 1 0 0]  | r  5    | WI  [0.754 0.293 0.32  0.127 0.315 0.425 0.353 0.486]\n",
      "instance 2, ep 6, state [0 1 0 0 1 0 0 1]\n",
      "instance 2, ep 7, state [1 0 1 0 1 1 1 1]\n",
      "instance 2, ep 8, state [1 1 0 0 1 0 1 0]\n",
      "instance 2, ep 9, state [1 0 0 1 1 1 0 0]\n",
      "instance 2, ep 10, state [1 0 1 1 1 1 1 1]\n",
      "---------------------------------------------------\n",
      "2 200  | a  [0 1 0 0 0 0 1 1]  | s'  [0 0 0 1 1 1 1 0]  | r  7    | WI  [  0.275   0.626   0.335   0.236   0.382 -10.      0.395   0.466]\n",
      "instance 2, ep 11, state [0 0 0 0 1 1 0 0]\n",
      "instance 2, ep 12, state [0 1 1 0 1 1 0 1]\n",
      "instance 2, ep 13, state [1 0 0 0 0 1 1 0]\n",
      "instance 2, ep 14, state [0 0 0 1 0 0 0 1]\n",
      "instance 2, ep 15, state [0 1 0 1 1 0 0 1]\n",
      "---------------------------------------------------\n",
      "2 300  | a  [0 0 0 0 0 1 1 1]  | s'  [0 1 0 0 0 0 1 1]  | r  4    | WI  [0.405 0.408 0.296 0.247 0.425 0.446 0.58  0.488]\n",
      "instance 2, ep 16, state [1 0 0 1 1 0 1 0]\n",
      "instance 2, ep 17, state [1 0 0 0 1 0 0 0]\n",
      "instance 2, ep 18, state [1 1 0 1 1 1 0 0]\n",
      "instance 2, ep 19, state [0 0 0 1 0 0 1 0]\n",
      "instance 2, ep 20, state [1 1 0 1 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "2 400  | a  [0 1 0 0 0 0 1 1]  | s'  [1 1 1 1 0 0 1 1]  | r  5    | WI  [  0.35    0.452   0.316   0.254   0.4   -10.      0.558   0.438]\n",
      "instance 2, ep 21, state [1 0 0 0 1 0 1 1]\n",
      "instance 2, ep 22, state [1 1 1 1 0 1 0 0]\n",
      "instance 2, ep 23, state [1 1 0 1 1 1 1 1]\n",
      "instance 2, ep 24, state [1 1 1 1 1 0 0 0]\n",
      "instance 2, ep 25, state [0 1 1 1 0 1 1 1]\n",
      "---------------------------------------------------\n",
      "2 500  | a  [0 0 0 0 1 0 1 1]  | s'  [0 1 0 1 1 0 1 0]  | r  6    | WI  [  0.423   0.468   0.391   0.278   0.576 -10.      0.496   0.485]\n",
      "instance 2, ep 26, state [1 1 0 1 0 0 1 0]\n",
      "instance 2, ep 27, state [1 0 1 0 1 1 0 1]\n",
      "instance 2, ep 28, state [1 0 0 0 1 1 1 0]\n",
      "instance 2, ep 29, state [0 1 0 0 1 1 1 1]\n",
      "first state [1 1 1 1 1 1 1 0]\n",
      "---------------------------------------------------\n",
      "3 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 0 1 0 1 1 1]  | r  7    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 3, ep 1, state [1 0 1 1 1 0 0 0]\n",
      "instance 3, ep 2, state [1 0 0 0 1 1 0 0]\n",
      "instance 3, ep 3, state [1 1 1 0 1 0 1 1]\n",
      "instance 3, ep 4, state [0 0 1 1 1 1 1 1]\n",
      "instance 3, ep 5, state [0 1 0 0 1 0 0 0]\n",
      "---------------------------------------------------\n",
      "3 100  | a  [0 0 0 1 0 0 1 1]  | s'  [0 1 1 1 0 0 1 1]  | r  2    | WI  [0.098 0.251 0.596 0.764 0.262 0.327 0.694 0.792]\n",
      "instance 3, ep 6, state [1 0 0 0 0 0 0 1]\n",
      "instance 3, ep 7, state [0 0 0 0 1 1 0 0]\n",
      "instance 3, ep 8, state [0 1 1 1 0 1 0 0]\n",
      "instance 3, ep 9, state [0 0 1 1 0 1 1 1]\n",
      "instance 3, ep 10, state [1 1 1 1 0 0 1 0]\n",
      "---------------------------------------------------\n",
      "3 200  | a  [1 0 0 0 1 0 0 1]  | s'  [1 1 1 1 1 0 0 1]  | r  5    | WI  [  0.455   0.274 -10.    -10.      0.616   0.285   0.315   0.606]\n",
      "instance 3, ep 11, state [1 0 0 0 0 1 1 1]\n",
      "instance 3, ep 12, state [1 0 1 1 1 0 1 0]\n",
      "instance 3, ep 13, state [1 1 0 1 1 0 1 1]\n",
      "instance 3, ep 14, state [0 0 0 0 0 1 0 0]\n",
      "instance 3, ep 15, state [1 1 0 0 0 1 0 1]\n",
      "---------------------------------------------------\n",
      "3 300  | a  [0 0 1 1 0 0 1 0]  | s'  [1 1 0 0 0 0 0 0]  | r  4    | WI  [  0.498   0.344   0.591   0.618 -10.    -10.      0.676 -10.   ]\n",
      "instance 3, ep 16, state [1 0 1 1 0 1 1 1]\n",
      "instance 3, ep 17, state [1 1 1 1 1 1 1 0]\n",
      "instance 3, ep 18, state [0 0 0 0 1 0 1 0]\n",
      "instance 3, ep 19, state [1 1 0 1 0 1 0 1]\n",
      "instance 3, ep 20, state [0 1 1 0 0 0 0 1]\n",
      "---------------------------------------------------\n",
      "3 400  | a  [0 0 0 1 1 0 1 0]  | s'  [0 1 1 1 0 0 1 1]  | r  3    | WI  [  0.254   0.314 -10.      0.562   0.503 -10.      0.601 -10.   ]\n",
      "instance 3, ep 21, state [0 0 0 1 0 0 0 0]\n",
      "instance 3, ep 22, state [1 0 0 1 1 0 1 1]\n",
      "instance 3, ep 23, state [0 1 1 0 0 0 1 1]\n",
      "instance 3, ep 24, state [1 0 1 1 0 0 1 0]\n",
      "instance 3, ep 25, state [1 0 0 0 0 1 0 1]\n",
      "---------------------------------------------------\n",
      "3 500  | a  [0 1 0 1 0 0 1 0]  | s'  [1 0 0 1 0 0 0 1]  | r  3    | WI  [  0.456   0.585   0.53    0.602 -10.    -10.      0.593   0.45 ]\n",
      "instance 3, ep 26, state [1 1 0 1 1 0 0 1]\n",
      "instance 3, ep 27, state [1 0 1 1 1 1 1 0]\n",
      "instance 3, ep 28, state [0 0 1 1 0 1 1 1]\n",
      "instance 3, ep 29, state [0 1 0 0 0 0 0 1]\n",
      "first state [1 1 1 0 1 1 1 0]\n",
      "---------------------------------------------------\n",
      "4 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 0 0 0 1 0 0]  | r  6    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 4, ep 1, state [0 0 0 1 0 1 0 0]\n",
      "instance 4, ep 2, state [1 1 0 1 1 0 1 1]\n",
      "instance 4, ep 3, state [1 0 1 0 0 0 0 1]\n",
      "instance 4, ep 4, state [1 1 0 0 0 1 0 1]\n",
      "instance 4, ep 5, state [1 0 1 0 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "4 100  | a  [0 0 0 0 1 1 0 1]  | s'  [0 0 1 0 1 1 0 0]  | r  4    | WI  [-10.      0.274   0.263   0.196   0.464   0.335 -10.      0.461]\n",
      "instance 4, ep 6, state [1 1 0 1 1 1 0 1]\n",
      "instance 4, ep 7, state [1 0 0 1 0 1 0 0]\n",
      "instance 4, ep 8, state [1 0 1 0 1 0 0 1]\n",
      "instance 4, ep 9, state [0 1 0 1 0 1 0 0]\n",
      "instance 4, ep 10, state [0 0 1 0 1 0 0 1]\n",
      "---------------------------------------------------\n",
      "4 200  | a  [0 0 0 0 1 1 1 0]  | s'  [0 0 1 0 0 0 0 0]  | r  3    | WI  [  0.438   0.292   0.296   0.349   0.44    0.492   0.604 -10.   ]\n",
      "instance 4, ep 11, state [1 0 0 0 1 1 0 1]\n",
      "instance 4, ep 12, state [1 1 1 0 0 0 0 1]\n",
      "instance 4, ep 13, state [1 0 0 0 1 0 1 0]\n",
      "instance 4, ep 14, state [0 1 1 0 1 1 1 0]\n",
      "instance 4, ep 15, state [1 0 1 0 0 0 1 0]\n",
      "---------------------------------------------------\n",
      "4 300  | a  [0 0 0 1 1 1 0 0]  | s'  [0 0 0 0 1 0 1 0]  | r  3    | WI  [-10.      0.299   0.282   0.32    0.439   0.459 -10.    -10.   ]\n",
      "instance 4, ep 16, state [1 1 0 1 0 1 0 1]\n",
      "instance 4, ep 17, state [1 1 1 0 1 1 1 0]\n",
      "instance 4, ep 18, state [1 1 1 0 1 0 1 0]\n",
      "instance 4, ep 19, state [1 1 0 1 0 1 1 1]\n",
      "instance 4, ep 20, state [1 1 0 0 1 1 1 1]\n",
      "---------------------------------------------------\n",
      "4 400  | a  [0 0 1 0 1 1 0 0]  | s'  [1 0 1 1 1 0 0 0]  | r  6    | WI  [-10.      0.186   0.44    0.352   0.468   0.XXXX-5 -10.    -10.   ]\n",
      "instance 4, ep 21, state [0 1 0 1 0 0 0 0]\n",
      "instance 4, ep 22, state [1 0 0 0 0 0 0 1]\n",
      "instance 4, ep 23, state [1 1 0 0 1 1 0 0]\n",
      "instance 4, ep 24, state [0 0 0 1 1 1 1 1]\n",
      "instance 4, ep 25, state [1 1 0 0 0 1 1 0]\n",
      "---------------------------------------------------\n",
      "4 500  | a  [0 0 1 0 1 1 0 0]  | s'  [1 0 0 0 0 1 1 0]  | r  4    | WI  [-10.      0.221   0.418   0.3     0.419   0.38  -10.    -10.   ]\n",
      "instance 4, ep 26, state [1 0 1 0 0 0 0 0]\n",
      "instance 4, ep 27, state [0 1 1 0 1 1 0 0]\n",
      "instance 4, ep 28, state [0 0 1 0 1 1 0 1]\n",
      "instance 4, ep 29, state [0 1 0 1 1 0 1 1]\n",
      "first state [0 0 1 1 0 1 0 1]\n",
      "---------------------------------------------------\n",
      "5 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 1 1 0 1 1 0]  | r  4    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 5, ep 1, state [0 0 1 0 1 1 1 0]\n",
      "instance 5, ep 2, state [0 0 1 1 1 1 1 1]\n",
      "instance 5, ep 3, state [0 1 0 1 1 1 0 0]\n",
      "instance 5, ep 4, state [0 0 0 1 1 0 0 0]\n",
      "instance 5, ep 5, state [1 1 1 0 1 1 0 1]\n",
      "---------------------------------------------------\n",
      "5 100  | a  [0 0 0 0 1 1 1 0]  | s'  [1 1 0 0 1 0 0 0]  | r  6    | WI  [  0.171   0.182   0.11    0.11    0.3     0.238   0.713 -10.   ]\n",
      "instance 5, ep 6, state [0 1 0 1 1 1 1 0]\n",
      "instance 5, ep 7, state [0 0 0 1 0 1 1 1]\n",
      "instance 5, ep 8, state [0 1 1 0 1 1 0 1]\n",
      "instance 5, ep 9, state [0 0 0 0 0 0 1 1]\n",
      "instance 5, ep 10, state [1 0 0 1 0 0 1 0]\n",
      "---------------------------------------------------\n",
      "5 200  | a  [0 0 0 0 1 1 0 1]  | s'  [0 1 0 0 0 0 1 0]  | r  3    | WI  [0.279 0.475 0.205 0.449 0.608 0.703 0.348 0.617]\n",
      "instance 5, ep 11, state [1 1 0 0 1 0 0 1]\n",
      "instance 5, ep 12, state [0 1 1 0 0 0 0 0]\n",
      "instance 5, ep 13, state [1 0 1 1 1 1 0 1]\n",
      "instance 5, ep 14, state [1 0 0 1 0 0 0 0]\n",
      "instance 5, ep 15, state [1 1 1 0 0 0 0 0]\n",
      "---------------------------------------------------\n",
      "5 300  | a  [0 0 0 0 0 1 1 1]  | s'  [0 1 1 0 0 1 1 1]  | r  3    | WI  [0.333 0.417 0.26  0.314 0.XXXX-5 0.616 0.554 0.515]\n",
      "instance 5, ep 16, state [1 0 1 0 0 0 1 1]\n",
      "instance 5, ep 17, state [1 0 0 1 0 1 0 0]\n",
      "instance 5, ep 18, state [0 0 1 0 0 0 0 1]\n",
      "instance 5, ep 19, state [1 1 1 0 1 0 0 1]\n",
      "instance 5, ep 20, state [0 1 0 1 1 1 1 1]\n",
      "---------------------------------------------------\n",
      "5 400  | a  [1 1 1 0 0 0 0 0]  | s'  [1 1 0 0 0 0 0 1]  | r  6    | WI  [  0.531   0.435   0.563   0.427 -10.    -10.    -10.    -10.   ]\n",
      "instance 5, ep 21, state [0 1 0 1 1 1 0 0]\n",
      "instance 5, ep 22, state [1 0 0 0 1 1 0 0]\n",
      "instance 5, ep 23, state [0 1 1 0 0 0 1 1]\n",
      "instance 5, ep 24, state [0 0 0 1 0 1 1 0]\n",
      "instance 5, ep 25, state [0 0 1 1 1 1 0 1]\n",
      "---------------------------------------------------\n",
      "5 500  | a  [1 0 0 1 0 0 1 0]  | s'  [0 0 1 1 0 0 1 1]  | r  5    | WI  [  0.544   0.361   0.306   0.454   0.425 -10.      0.562 -10.   ]\n",
      "instance 5, ep 26, state [1 0 1 1 1 1 1 1]\n",
      "instance 5, ep 27, state [0 0 1 0 0 0 0 1]\n",
      "instance 5, ep 28, state [1 0 0 0 1 1 0 1]\n",
      "instance 5, ep 29, state [1 1 1 0 1 0 1 1]\n",
      "first state [0 1 0 1 0 1 0 1]\n",
      "---------------------------------------------------\n",
      "6 0  | a  [0 0 0 0 0 1 1 1]  | s'  [1 1 0 1 0 1 1 1]  | r  4    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 6, ep 1, state [1 1 1 1 1 0 1 0]\n",
      "instance 6, ep 2, state [0 0 0 1 1 1 1 0]\n",
      "instance 6, ep 3, state [0 0 0 0 0 1 1 1]\n",
      "instance 6, ep 4, state [1 1 0 1 1 0 0 1]\n",
      "instance 6, ep 5, state [0 1 1 0 0 0 0 0]\n",
      "---------------------------------------------------\n",
      "6 100  | a  [0 0 0 1 1 1 0 0]  | s'  [1 0 1 1 1 0 1 0]  | r  2    | WI  [  0.589   0.152 -10.      0.608   0.666   0.826 -10.    -10.   ]\n",
      "instance 6, ep 6, state [1 0 1 0 1 0 0 1]\n",
      "instance 6, ep 7, state [1 0 1 0 0 0 0 1]\n",
      "instance 6, ep 8, state [0 0 1 1 0 1 0 1]\n",
      "instance 6, ep 9, state [1 1 0 0 0 0 0 1]\n",
      "instance 6, ep 10, state [0 0 1 0 1 0 0 0]\n",
      "---------------------------------------------------\n",
      "6 200  | a  [1 1 0 0 0 1 0 0]  | s'  [1 1 0 0 0 0 0 0]  | r  2    | WI  [  0.579   0.596 -10.      0.558 -10.      0.563 -10.    -10.   ]\n",
      "instance 6, ep 11, state [0 1 0 1 0 0 1 0]\n",
      "instance 6, ep 12, state [1 1 1 1 0 0 0 1]\n",
      "instance 6, ep 13, state [1 0 1 0 1 0 1 1]\n",
      "instance 6, ep 14, state [0 0 0 0 0 1 1 1]\n",
      "instance 6, ep 15, state [0 1 1 0 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "6 300  | a  [1 0 0 1 0 1 0 0]  | s'  [1 0 1 1 1 1 0 1]  | r  4    | WI  [  0.544   0.31  -10.      0.551   0.451   0.533 -10.    -10.   ]\n",
      "instance 6, ep 16, state [0 0 1 1 1 0 0 1]\n",
      "instance 6, ep 17, state [1 0 1 1 0 0 1 0]\n",
      "instance 6, ep 18, state [0 0 0 1 1 0 1 1]\n",
      "instance 6, ep 19, state [1 0 0 1 1 0 0 0]\n",
      "instance 6, ep 20, state [1 1 0 0 1 1 0 1]\n",
      "---------------------------------------------------\n",
      "6 400  | a  [0 0 0 1 0 1 1 0]  | s'  [1 0 0 0 0 1 0 0]  | r  5    | WI  [  0.328   0.337   0.432   0.541   0.498   0.547   0.543 -10.   ]\n",
      "instance 6, ep 21, state [1 0 1 0 1 1 1 1]\n",
      "instance 6, ep 22, state [0 1 1 0 1 1 0 1]\n",
      "instance 6, ep 23, state [1 0 1 0 0 0 1 1]\n",
      "instance 6, ep 24, state [0 0 1 0 1 1 1 1]\n",
      "instance 6, ep 25, state [0 1 1 1 0 1 0 0]\n",
      "---------------------------------------------------\n",
      "6 500  | a  [0 0 0 1 1 1 0 0]  | s'  [1 1 0 0 1 1 0 0]  | r  4    | WI  [  0.515   0.343 -10.      0.545   0.569   0.527 -10.    -10.   ]\n",
      "instance 6, ep 26, state [0 1 1 1 1 0 1 0]\n",
      "instance 6, ep 27, state [1 1 1 1 0 0 1 0]\n",
      "instance 6, ep 28, state [0 0 1 0 0 1 1 0]\n",
      "instance 6, ep 29, state [0 0 0 0 1 1 1 0]\n",
      "first state [1 0 1 1 1 1 1 0]\n",
      "---------------------------------------------------\n",
      "7 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 0 0 0 0 0 1]  | r  6    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 7, ep 1, state [0 0 1 0 1 1 1 1]\n",
      "instance 7, ep 2, state [0 1 1 0 0 1 1 1]\n",
      "instance 7, ep 3, state [1 1 1 0 0 0 1 1]\n",
      "instance 7, ep 4, state [1 0 1 1 1 1 0 1]\n",
      "instance 7, ep 5, state [0 0 0 1 1 1 1 1]\n",
      "---------------------------------------------------\n",
      "7 100  | a  [1 0 1 1 0 0 0 0]  | s'  [0 0 1 1 0 0 0 1]  | r  5    | WI  [  0.459   0.427   0.641   0.53  -10.    -10.    -10.    -10.   ]\n",
      "instance 7, ep 6, state [1 0 0 0 0 0 0 0]\n",
      "instance 7, ep 7, state [1 0 0 0 1 0 0 1]\n",
      "instance 7, ep 8, state [0 0 0 0 0 0 1 1]\n",
      "instance 7, ep 9, state [1 0 1 0 0 1 0 0]\n",
      "instance 7, ep 10, state [1 1 0 1 1 0 0 0]\n",
      "---------------------------------------------------\n",
      "7 200  | a  [1 0 1 0 0 0 0 1]  | s'  [1 0 1 0 1 0 0 0]  | r  4    | WI  [  0.624 -10.      0.571   0.455 -10.    -10.    -10.      0.575]\n",
      "instance 7, ep 11, state [0 0 1 1 1 0 1 1]\n",
      "instance 7, ep 12, state [1 0 1 0 0 0 1 1]\n",
      "instance 7, ep 13, state [0 0 0 0 0 0 1 0]\n",
      "instance 7, ep 14, state [0 0 1 1 1 0 1 0]\n",
      "instance 7, ep 15, state [1 1 1 1 1 0 1 0]\n",
      "---------------------------------------------------\n",
      "7 300  | a  [1 0 0 1 0 0 0 1]  | s'  [0 0 1 0 1 0 0 1]  | r  6    | WI  [  0.604   0.097   0.391   0.505 -10.    -10.    -10.      0.519]\n",
      "instance 7, ep 16, state [1 0 0 0 0 0 1 0]\n",
      "instance 7, ep 17, state [0 1 0 1 1 1 1 0]\n",
      "instance 7, ep 18, state [1 0 0 1 0 1 1 1]\n",
      "instance 7, ep 19, state [1 0 0 1 0 1 1 1]\n",
      "instance 7, ep 20, state [0 0 0 0 1 0 0 0]\n",
      "---------------------------------------------------\n",
      "7 400  | a  [1 0 1 0 0 0 0 1]  | s'  [0 0 0 0 1 0 1 0]  | r  1    | WI  [  0.584   0.257   0.557   0.504 -10.    -10.    -10.      0.528]\n",
      "instance 7, ep 21, state [1 1 0 0 0 0 1 1]\n",
      "instance 7, ep 22, state [0 0 1 0 1 0 0 0]\n",
      "instance 7, ep 23, state [1 1 0 0 0 0 0 0]\n",
      "instance 7, ep 24, state [1 0 0 1 0 1 0 1]\n",
      "instance 7, ep 25, state [1 1 1 0 1 0 0 0]\n",
      "---------------------------------------------------\n",
      "7 500  | a  [0 0 1 1 0 0 0 1]  | s'  [1 0 1 0 0 0 1 1]  | r  4    | WI  [  0.07    0.116   0.444   0.487   0.167   0.344 -10.      0.537]\n",
      "instance 7, ep 26, state [1 0 1 1 1 1 0 0]\n",
      "instance 7, ep 27, state [0 0 0 0 0 1 1 0]\n",
      "instance 7, ep 28, state [1 0 0 1 0 0 1 1]\n",
      "instance 7, ep 29, state [1 1 1 0 0 0 0 1]\n",
      "first state [1 0 0 1 0 1 0 0]\n",
      "---------------------------------------------------\n",
      "8 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 1 1 1 1 0 1]  | r  3    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 8, ep 1, state [1 1 1 1 0 0 1 1]\n",
      "instance 8, ep 2, state [0 1 0 0 0 1 1 0]\n",
      "instance 8, ep 3, state [1 0 0 0 0 0 1 1]\n",
      "instance 8, ep 4, state [1 0 0 0 0 1 0 1]\n",
      "instance 8, ep 5, state [1 0 1 1 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "8 100  | a  [0 0 0 0 0 1 1 1]  | s'  [0 0 0 1 0 0 1 1]  | r  5    | WI  [0.192 0.484 0.327 0.188 0.326 0.525 0.623 0.557]\n",
      "instance 8, ep 6, state [0 0 1 0 1 1 0 0]\n",
      "instance 8, ep 7, state [1 1 1 0 0 0 0 1]\n",
      "instance 8, ep 8, state [1 1 1 1 0 0 1 0]\n",
      "instance 8, ep 9, state [1 1 0 1 1 1 1 1]\n",
      "instance 8, ep 10, state [0 0 1 1 0 0 1 1]\n",
      "---------------------------------------------------\n",
      "8 200  | a  [0 1 0 0 1 1 0 0]  | s'  [0 0 0 0 0 0 1 1]  | r  4    | WI  [  0.332   0.547   0.443   0.264   0.569   0.648 -10.    -10.   ]\n",
      "instance 8, ep 11, state [1 1 0 0 1 0 0 0]\n",
      "instance 8, ep 12, state [1 1 0 0 1 1 0 0]\n",
      "instance 8, ep 13, state [0 1 0 0 1 1 0 1]\n",
      "instance 8, ep 14, state [0 1 0 1 0 1 1 1]\n",
      "instance 8, ep 15, state [1 1 0 0 1 0 1 1]\n",
      "---------------------------------------------------\n",
      "8 300  | a  [0 1 0 1 0 1 0 0]  | s'  [0 1 0 0 0 1 0 1]  | r  5    | WI  [  0.315   0.59    0.277   0.602   0.519   0.581 -10.    -10.   ]\n",
      "instance 8, ep 16, state [0 1 0 1 0 0 1 1]\n",
      "instance 8, ep 17, state [1 1 0 1 0 1 1 1]\n",
      "instance 8, ep 18, state [1 0 1 0 1 0 1 1]\n",
      "instance 8, ep 19, state [0 0 1 0 0 0 0 1]\n",
      "instance 8, ep 20, state [1 0 0 0 0 0 0 0]\n",
      "---------------------------------------------------\n",
      "8 400  | a  [0 0 0 0 1 0 1 1]  | s'  [1 0 0 0 1 0 1 0]  | r  1    | WI  [0.323 0.452 0.33  0.535 0.571 0.485 0.584 0.621]\n",
      "instance 8, ep 21, state [1 0 1 1 1 1 1 1]\n",
      "instance 8, ep 22, state [1 1 1 1 0 0 0 1]\n",
      "instance 8, ep 23, state [1 1 1 0 0 1 1 1]\n",
      "instance 8, ep 24, state [0 1 1 1 1 1 0 1]\n",
      "instance 8, ep 25, state [1 1 1 0 0 1 1 1]\n",
      "---------------------------------------------------\n",
      "8 500  | a  [0 1 0 1 1 0 0 0]  | s'  [1 1 0 1 0 0 0 1]  | r  6    | WI  [  0.348   0.539   0.467   0.568   0.553 -10.    -10.    -10.   ]\n",
      "instance 8, ep 26, state [0 1 1 1 0 1 1 0]\n",
      "instance 8, ep 27, state [1 1 1 0 0 0 0 0]\n",
      "instance 8, ep 28, state [1 0 1 1 1 1 1 1]\n",
      "instance 8, ep 29, state [0 0 1 1 0 1 1 0]\n",
      "first state [0 1 0 0 0 0 1 0]\n",
      "---------------------------------------------------\n",
      "9 0  | a  [0 0 0 0 0 1 1 1]  | s'  [0 1 0 0 0 0 1 0]  | r  2    | WI  [-0. -0. -0. -0. -0. -0. -0. -0.]\n",
      "instance 9, ep 1, state [1 1 0 1 1 1 0 0]\n",
      "instance 9, ep 2, state [1 1 1 0 1 0 0 0]\n",
      "instance 9, ep 3, state [1 0 0 1 0 0 0 1]\n",
      "instance 9, ep 4, state [1 0 1 1 0 1 1 1]\n",
      "instance 9, ep 5, state [0 1 1 0 0 0 0 1]\n",
      "---------------------------------------------------\n",
      "9 100  | a  [1 0 0 0 1 0 1 0]  | s'  [1 0 1 0 1 0 1 0]  | r  3    | WI  [  0.848   0.183   0.251   0.332   0.605   0.596   0.763 -10.   ]\n",
      "instance 9, ep 6, state [0 0 1 0 1 0 0 0]\n",
      "instance 9, ep 7, state [0 0 1 1 0 1 1 1]\n",
      "instance 9, ep 8, state [0 0 0 1 1 0 0 1]\n",
      "instance 9, ep 9, state [1 1 1 0 1 1 0 1]\n",
      "instance 9, ep 10, state [1 0 1 1 1 0 0 1]\n",
      "---------------------------------------------------\n",
      "9 200  | a  [0 1 0 0 1 0 1 0]  | s'  [1 1 1 0 0 0 1 0]  | r  5    | WI  [-10.      0.698   0.32    0.359   0.49    0.39    0.628 -10.   ]\n",
      "instance 9, ep 11, state [0 1 1 0 1 1 0 1]\n",
      "instance 9, ep 12, state [1 1 1 0 1 1 1 1]\n",
      "instance 9, ep 13, state [0 1 0 0 0 1 1 1]\n",
      "instance 9, ep 14, state [1 1 1 0 0 0 1 1]\n",
      "instance 9, ep 15, state [0 0 1 0 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "9 300  | a  [0 1 0 0 0 0 1 1]  | s'  [0 0 1 1 1 1 1 1]  | r  3    | WI  [  0.536   0.702   0.322   0.428 -10.    -10.      0.582   0.574]\n",
      "instance 9, ep 16, state [1 1 1 1 0 1 1 1]\n",
      "instance 9, ep 17, state [0 1 1 0 0 1 0 0]\n",
      "instance 9, ep 18, state [0 1 1 1 0 1 1 1]\n",
      "instance 9, ep 19, state [1 0 1 0 1 0 0 0]\n",
      "instance 9, ep 20, state [1 0 1 0 0 1 0 0]\n",
      "---------------------------------------------------\n",
      "9 400  | a  [0 1 0 0 0 0 1 1]  | s'  [0 0 0 1 0 1 1 0]  | r  3    | WI  [-10.      0.573   0.336   0.453   0.519 -10.      0.568   0.571]\n",
      "instance 9, ep 21, state [1 0 0 0 1 1 1 1]\n",
      "instance 9, ep 22, state [0 0 1 0 0 0 0 1]\n",
      "instance 9, ep 23, state [0 1 0 1 0 0 1 1]\n",
      "instance 9, ep 24, state [0 0 0 0 0 0 0 0]\n",
      "instance 9, ep 25, state [1 1 1 0 0 1 0 0]\n",
      "---------------------------------------------------\n",
      "9 500  | a  [0 0 0 1 0 0 1 1]  | s'  [0 1 0 0 0 0 1 0]  | r  4    | WI  [-10.      0.264   0.332   0.454   0.446 -10.      0.57    0.556]\n",
      "instance 9, ep 26, state [1 1 1 0 0 1 0 1]\n",
      "instance 9, ep 27, state [1 1 0 0 1 1 1 0]\n",
      "instance 9, ep 28, state [0 1 1 1 0 1 1 1]\n",
      "instance 9, ep 29, state [0 0 1 0 0 1 0 1]\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "3.5045"
      ]
     },
     "execution_count": 14,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Run UCWhittle (UCB method) with norm_confidence switched on.\n",
    "# Python's and NumPy's global RNGs are both reset to `seed` right before the\n",
    "# call, the same way the norm_confidence=False cell does, so the two runs start\n",
    "# from an identical random state.\n",
    "random.seed(seed)\n",
    "np.random.seed(seed)\n",
    "rewards_with_norm = UCWhittle(\n",
    "    simulator,\n",
    "    n_episodes,\n",
    "    n_epochs,\n",
    "    discount,\n",
    "    alpha=alpha,\n",
    "    method='UCB',\n",
    "    norm_confidence=True,\n",
    ")\n",
    "# Last expression of the cell: the mean of the returned rewards is displayed.\n",
    "np.mean(rewards_with_norm)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "solving UCWhittle using method: UCB\n",
      "first state [0 1 1 1 1 1 1 1]\n",
      "---------------------------------------------------\n",
      "0 0  | a  [0 0 1 1 0 0 0 1]  | s'  [1 0 1 1 1 0 1 1]  | r  7    | WI  [-10.      0.163   0.251   0.172 -10.    -10.    -10.      0.239]\n",
      "instance 0, ep 1, state [0 0 0 1 1 1 0 1]\n",
      "instance 0, ep 2, state [0 1 1 1 0 0 0 1]\n",
      "instance 0, ep 3, state [0 0 0 1 0 1 1 0]\n",
      "instance 0, ep 4, state [1 1 0 1 1 1 1 1]\n",
      "instance 0, ep 5, state [0 0 0 0 0 1 0 0]\n",
      "---------------------------------------------------\n",
      "0 100  | a  [0 0 1 1 0 0 0 1]  | s'  [0 0 0 1 0 0 0 1]  | r  1    | WI  [  0.292   0.543   0.58    0.737 -10.      0.322   0.498   1.   ]\n",
      "instance 0, ep 6, state [0 1 0 1 0 0 0 0]\n",
      "instance 0, ep 7, state [1 0 1 0 0 0 0 1]\n",
      "instance 0, ep 8, state [0 0 0 0 1 1 0 1]\n",
      "instance 0, ep 9, state [0 1 0 0 0 1 1 1]\n",
      "instance 0, ep 10, state [0 1 1 0 0 0 1 0]\n",
      "---------------------------------------------------\n",
      "0 200  | a  [0 0 1 1 0 0 0 1]  | s'  [1 0 0 1 0 0 0 0]  | r  3    | WI  [  0.389   0.387   0.564   0.725   0.409   0.486 -10.      1.   ]\n",
      "instance 0, ep 11, state [1 0 1 1 0 1 1 1]\n",
      "instance 0, ep 12, state [0 0 1 1 0 0 1 0]\n",
      "instance 0, ep 13, state [1 1 1 1 0 1 1 0]\n",
      "instance 0, ep 14, state [0 1 1 0 1 1 1 1]\n",
      "instance 0, ep 15, state [0 0 1 1 1 0 1 1]\n",
      "---------------------------------------------------\n",
      "0 300  | a  [0 1 0 0 0 1 0 1]  | s'  [0 1 0 1 0 1 1 1]  | r  5    | WI  [  0.387   0.684   0.493   0.177   0.527   0.646 -10.      0.544]\n",
      "instance 0, ep 16, state [1 1 1 1 0 1 1 0]\n",
      "instance 0, ep 17, state [0 0 0 1 0 0 0 0]\n",
      "instance 0, ep 18, state [0 1 1 0 1 1 1 0]\n",
      "instance 0, ep 19, state [1 1 0 1 0 0 1 1]\n",
      "instance 0, ep 20, state [1 0 0 1 1 0 1 0]\n",
      "---------------------------------------------------\n",
      "0 400  | a  [0 1 0 0 0 1 0 1]  | s'  [1 1 1 0 0 0 1 0]  | r  4    | WI  [  0.244   0.65    0.58    0.214   0.454   0.653 -10.      0.867]\n",
      "instance 0, ep 21, state [0 1 1 1 0 1 1 1]\n",
      "instance 0, ep 22, state [0 0 0 0 0 0 0 1]\n",
      "instance 0, ep 23, state [1 0 0 1 0 0 0 0]\n",
      "instance 0, ep 24, state [1 0 1 1 0 0 0 1]\n",
      "instance 0, ep 25, state [0 0 1 0 0 0 0 1]\n",
      "---------------------------------------------------\n",
      "0 500  | a  [0 1 0 1 0 1 0 0]  | s'  [0 0 1 0 0 1 0 0]  | r  2    | WI  [  0.438   0.721   0.514   0.76  -10.      0.556 -10.    -10.   ]\n",
      "instance 0, ep 26, state [0 1 0 1 0 0 1 1]\n",
      "instance 0, ep 27, state [1 0 0 0 1 0 1 0]\n",
      "instance 0, ep 28, state [1 0 1 0 0 1 0 0]\n",
      "instance 0, ep 29, state [1 1 0 0 0 1 0 0]\n",
      "first state [1 1 1 0 0 1 1 1]\n",
      "---------------------------------------------------\n",
      "1 0  | a  [1 1 0 0 1 0 0 0]  | s'  [1 1 0 0 1 1 1 0]  | r  6    | WI  [  0.172   0.239 -10.    -10.      0.174 -10.    -10.    -10.   ]\n",
      "instance 1, ep 1, state [0 1 1 0 0 1 0 0]\n",
      "instance 1, ep 2, state [0 0 0 1 1 0 1 1]\n",
      "instance 1, ep 3, state [0 0 0 0 1 1 0 1]\n",
      "instance 1, ep 4, state [1 0 1 1 1 0 1 1]\n",
      "instance 1, ep 5, state [1 1 1 1 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "1 100  | a  [0 0 0 1 0 1 0 1]  | s'  [1 1 0 1 0 1 0 1]  | r  6    | WI  [  0.239   0.111   0.12    0.274   0.181   0.304 -10.      0.296]\n",
      "instance 1, ep 6, state [0 1 0 1 0 1 1 1]\n",
      "instance 1, ep 7, state [0 1 1 0 1 0 0 1]\n",
      "instance 1, ep 8, state [0 0 0 0 0 1 1 1]\n",
      "instance 1, ep 9, state [1 1 1 0 0 0 0 1]\n",
      "instance 1, ep 10, state [0 1 1 1 0 0 1 1]\n",
      "---------------------------------------------------\n",
      "1 200  | a  [1 0 0 1 0 1 0 0]  | s'  [1 0 0 1 1 0 1 0]  | r  5    | WI  [  0.851   0.276   0.12    0.532   0.285   0.351 -10.    -10.   ]\n",
      "instance 1, ep 11, state [0 1 0 0 0 0 1 1]\n",
      "instance 1, ep 12, state [0 1 1 1 0 0 0 0]\n",
      "instance 1, ep 13, state [0 1 0 0 0 0 0 0]\n",
      "instance 1, ep 14, state [0 0 0 1 0 0 0 1]\n",
      "instance 1, ep 15, state [0 1 1 0 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "1 300  | a  [1 0 0 1 0 1 0 0]  | s'  [1 0 0 1 0 1 0 0]  | r  4    | WI  [  0.844   0.288   0.015   0.716 -10.      0.469 -10.    -10.   ]\n",
      "instance 1, ep 16, state [1 0 1 0 1 0 1 1]\n",
      "instance 1, ep 17, state [0 0 0 0 0 1 1 1]\n",
      "instance 1, ep 18, state [1 1 1 1 0 0 0 0]\n",
      "instance 1, ep 19, state [0 0 1 1 0 0 0 0]\n",
      "instance 1, ep 20, state [0 1 0 1 1 0 1 1]\n",
      "---------------------------------------------------\n",
      "1 400  | a  [1 1 0 0 0 1 0 0]  | s'  [1 1 0 1 0 1 1 1]  | r  5    | WI  [  0.923   0.298   0.16    0.24  -10.      0.416 -10.    -10.   ]\n",
      "instance 1, ep 21, state [0 0 1 1 1 1 1 1]\n",
      "instance 1, ep 22, state [1 1 1 0 1 1 0 1]\n",
      "instance 1, ep 23, state [0 1 1 1 0 1 1 0]\n",
      "instance 1, ep 24, state [0 1 0 0 1 0 1 0]\n",
      "instance 1, ep 25, state [1 0 1 0 1 0 1 1]\n",
      "---------------------------------------------------\n",
      "1 500  | a  [0 1 0 1 0 1 0 0]  | s'  [1 1 1 0 0 0 1 1]  | r  5    | WI  [  0.366   1.      0.12    0.787 -10.      0.466 -10.    -10.   ]\n",
      "instance 1, ep 26, state [1 1 0 1 0 0 0 1]\n",
      "instance 1, ep 27, state [1 0 1 0 0 0 0 0]\n",
      "instance 1, ep 28, state [1 1 0 0 0 1 0 1]\n",
      "instance 1, ep 29, state [1 1 1 0 1 1 1 0]\n",
      "first state [1 1 0 1 0 0 1 1]\n",
      "---------------------------------------------------\n",
      "2 0  | a  [1 0 1 0 0 0 1 0]  | s'  [1 1 1 1 0 0 1 1]  | r  5    | WI  [  0.176   0.099   0.253   0.137 -10.    -10.      0.236 -10.   ]\n",
      "instance 2, ep 1, state [0 1 0 0 0 0 0 1]\n",
      "instance 2, ep 2, state [1 0 1 1 0 1 1 0]\n",
      "instance 2, ep 3, state [0 1 1 0 1 1 1 1]\n",
      "instance 2, ep 4, state [1 0 0 1 1 0 1 1]\n",
      "instance 2, ep 5, state [0 1 1 1 1 0 1 0]\n",
      "---------------------------------------------------\n",
      "2 100  | a  [1 0 0 0 0 1 0 1]  | s'  [1 1 0 1 1 1 1 0]  | r  5    | WI  [  0.863   0.171   0.078   0.136   0.217   0.491 -10.      0.578]\n",
      "instance 2, ep 6, state [0 1 0 0 1 0 0 1]\n",
      "instance 2, ep 7, state [1 0 1 0 1 1 1 1]\n",
      "instance 2, ep 8, state [1 1 0 0 1 0 1 0]\n",
      "instance 2, ep 9, state [1 0 0 1 1 1 0 0]\n",
      "instance 2, ep 10, state [1 0 1 1 1 1 1 1]\n",
      "---------------------------------------------------\n",
      "2 200  | a  [1 1 0 0 0 0 0 1]  | s'  [1 1 0 0 1 0 1 1]  | r  7    | WI  [  0.353   0.816   0.078   0.184   0.256 -10.    -10.      0.324]\n",
      "instance 2, ep 11, state [0 0 0 0 1 1 0 0]\n",
      "instance 2, ep 12, state [0 1 1 0 1 1 0 1]\n",
      "instance 2, ep 13, state [1 0 0 0 0 1 1 0]\n",
      "instance 2, ep 14, state [0 0 0 1 0 0 0 1]\n",
      "instance 2, ep 15, state [0 1 0 1 1 0 0 1]\n",
      "---------------------------------------------------\n",
      "2 300  | a  [1 0 0 0 0 0 1 1]  | s'  [1 0 1 0 1 0 1 1]  | r  4    | WI  [  1.      0.187   0.35    0.184   0.228 -10.      0.506   0.413]\n",
      "instance 2, ep 16, state [1 0 0 1 1 0 1 0]\n",
      "instance 2, ep 17, state [1 0 0 0 1 0 0 0]\n",
      "instance 2, ep 18, state [1 1 0 1 1 1 0 0]\n",
      "instance 2, ep 19, state [0 0 0 1 0 0 1 0]\n",
      "instance 2, ep 20, state [1 1 0 1 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "2 400  | a  [1 0 0 0 0 0 1 1]  | s'  [1 1 0 1 0 1 1 0]  | r  5    | WI  [  0.378   0.187   0.254   0.184   0.23  -10.      0.481   0.313]\n",
      "instance 2, ep 21, state [1 0 0 0 1 0 1 1]\n",
      "instance 2, ep 22, state [1 1 1 1 0 1 0 0]\n",
      "instance 2, ep 23, state [1 1 0 1 1 1 1 1]\n",
      "instance 2, ep 24, state [1 1 1 1 1 0 0 0]\n",
      "instance 2, ep 25, state [0 1 1 1 0 1 1 1]\n",
      "---------------------------------------------------\n",
      "2 500  | a  [1 0 0 0 1 0 1 0]  | s'  [1 0 0 1 0 1 1 0]  | r  6    | WI  [  0.923   0.187   0.088   0.176   0.985 -10.      0.471 -10.   ]\n",
      "instance 2, ep 26, state [1 1 0 1 0 0 1 0]\n",
      "instance 2, ep 27, state [1 0 1 0 1 1 0 1]\n",
      "instance 2, ep 28, state [1 0 0 0 1 1 1 0]\n",
      "instance 2, ep 29, state [0 1 0 0 1 1 1 1]\n",
      "first state [1 1 1 1 1 1 1 0]\n",
      "---------------------------------------------------\n",
      "3 0  | a  [0 1 0 1 0 0 1 0]  | s'  [0 1 0 1 1 0 1 0]  | r  7    | WI  [  0.142   0.163 -10.      0.194 -10.    -10.      0.153 -10.   ]\n",
      "instance 3, ep 1, state [1 0 1 1 1 0 0 0]\n",
      "instance 3, ep 2, state [1 0 0 0 1 1 0 0]\n",
      "instance 3, ep 3, state [1 1 1 0 1 0 1 1]\n",
      "instance 3, ep 4, state [0 0 1 1 1 1 1 1]\n",
      "instance 3, ep 5, state [0 1 0 0 1 0 0 0]\n",
      "---------------------------------------------------\n",
      "3 100  | a  [0 0 1 0 0 0 1 1]  | s'  [1 1 1 1 1 0 1 0]  | r  2    | WI  [  0.499   0.276   0.639   0.446   0.33  -10.      0.946   0.996]\n",
      "instance 3, ep 6, state [1 0 0 0 0 0 0 1]\n",
      "instance 3, ep 7, state [0 0 0 0 1 1 0 0]\n",
      "instance 3, ep 8, state [0 1 1 1 0 1 0 0]\n",
      "instance 3, ep 9, state [0 0 1 1 0 1 1 1]\n",
      "instance 3, ep 10, state [1 1 1 1 0 0 1 0]\n",
      "---------------------------------------------------\n",
      "3 200  | a  [0 0 0 1 1 0 0 1]  | s'  [0 1 1 1 0 0 0 0]  | r  5    | WI  [  0.319   0.276   0.347   0.348   0.386 -10.    -10.      0.918]\n",
      "instance 3, ep 11, state [1 0 0 0 0 1 1 1]\n",
      "instance 3, ep 12, state [1 0 1 1 1 0 1 0]\n",
      "instance 3, ep 13, state [1 1 0 1 1 0 1 1]\n",
      "instance 3, ep 14, state [0 0 0 0 0 1 0 0]\n",
      "instance 3, ep 15, state [1 1 0 0 0 1 0 1]\n",
      "---------------------------------------------------\n",
      "3 300  | a  [0 0 1 1 0 0 1 0]  | s'  [0 1 1 0 0 1 1 0]  | r  4    | WI  [  0.22    0.264   0.572   0.544 -10.    -10.      0.836 -10.   ]\n",
      "instance 3, ep 16, state [1 0 1 1 0 1 1 1]\n",
      "instance 3, ep 17, state [1 1 1 1 1 1 1 0]\n",
      "instance 3, ep 18, state [0 0 0 0 1 0 1 0]\n",
      "instance 3, ep 19, state [1 1 0 1 0 1 0 1]\n",
      "instance 3, ep 20, state [0 1 1 0 0 0 0 1]\n",
      "---------------------------------------------------\n",
      "3 400  | a  [0 0 0 1 0 0 1 1]  | s'  [1 1 0 1 0 0 1 1]  | r  3    | WI  [  0.379   0.252   0.231   0.617   0.426 -10.      0.865   0.475]\n",
      "instance 3, ep 21, state [0 0 0 1 0 0 0 0]\n",
      "instance 3, ep 22, state [1 0 0 1 1 0 1 1]\n",
      "instance 3, ep 23, state [0 1 1 0 0 0 1 1]\n",
      "instance 3, ep 24, state [1 0 1 1 0 0 1 0]\n",
      "instance 3, ep 25, state [1 0 0 0 0 1 0 1]\n",
      "---------------------------------------------------\n",
      "3 500  | a  [0 1 1 0 0 0 1 0]  | s'  [1 0 1 0 0 0 1 0]  | r  3    | WI  [  0.273   0.72    0.616   0.531   0.396 -10.      0.865 -10.   ]\n",
      "instance 3, ep 26, state [1 1 0 1 1 0 0 1]\n",
      "instance 3, ep 27, state [1 0 1 1 1 1 1 0]\n",
      "instance 3, ep 28, state [0 0 1 1 0 1 1 1]\n",
      "instance 3, ep 29, state [0 1 0 0 0 0 0 1]\n",
      "first state [1 1 1 0 1 1 1 0]\n",
      "---------------------------------------------------\n",
      "4 0  | a  [0 0 1 0 1 0 1 0]  | s'  [0 0 1 0 0 0 0 0]  | r  6    | WI  [  0.125  -0.      0.204 -10.      0.16  -10.      0.132 -10.   ]\n",
      "instance 4, ep 1, state [0 0 0 1 0 1 0 0]\n",
      "instance 4, ep 2, state [1 1 0 1 1 0 1 1]\n",
      "instance 4, ep 3, state [1 0 1 0 0 0 0 1]\n",
      "instance 4, ep 4, state [1 1 0 0 0 1 0 1]\n",
      "instance 4, ep 5, state [1 0 1 0 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "4 100  | a  [0 0 0 1 1 1 0 0]  | s'  [1 0 1 0 0 1 0 0]  | r  4    | WI  [  0.225  -0.      0.271   0.297   0.32    0.619 -10.    -10.   ]\n",
      "instance 4, ep 6, state [1 1 0 1 1 1 0 1]\n",
      "instance 4, ep 7, state [1 0 0 1 0 1 0 0]\n",
      "instance 4, ep 8, state [1 0 1 0 1 0 0 1]\n",
      "instance 4, ep 9, state [0 1 0 1 0 1 0 0]\n",
      "instance 4, ep 10, state [0 0 1 0 1 0 0 1]\n",
      "---------------------------------------------------\n",
      "4 200  | a  [1 0 0 0 0 1 1 0]  | s'  [1 0 0 0 1 1 0 0]  | r  3    | WI  [  0.518  -0.      0.266   0.192   0.32    0.521   0.384 -10.   ]\n",
      "instance 4, ep 11, state [1 0 0 0 1 1 0 1]\n",
      "instance 4, ep 12, state [1 1 1 0 0 0 0 1]\n",
      "instance 4, ep 13, state [1 0 0 0 1 0 1 0]\n",
      "instance 4, ep 14, state [0 1 1 0 1 1 1 0]\n",
      "instance 4, ep 15, state [1 0 1 0 0 0 1 0]\n",
      "---------------------------------------------------\n",
      "4 300  | a  [0 0 0 1 1 1 0 0]  | s'  [1 0 1 0 0 0 0 0]  | r  3    | WI  [  0.225  -0.      0.276   0.277   0.532   0.51  -10.    -10.   ]\n",
      "instance 4, ep 16, state [1 1 0 1 0 1 0 1]\n",
      "instance 4, ep 17, state [1 1 1 0 1 1 1 0]\n",
      "instance 4, ep 18, state [1 1 1 0 1 0 1 0]\n",
      "instance 4, ep 19, state [1 1 0 1 0 1 1 1]\n",
      "instance 4, ep 20, state [1 1 0 0 1 1 1 1]\n",
      "---------------------------------------------------\n",
      "4 400  | a  [0 0 1 0 0 1 1 0]  | s'  [1 0 0 0 0 1 0 0]  | r  6    | WI  [  0.22   -0.      0.551   0.225   0.294   0.398   0.471 -10.   ]\n",
      "instance 4, ep 21, state [0 1 0 1 0 0 0 0]\n",
      "instance 4, ep 22, state [1 0 0 0 0 0 0 1]\n",
      "instance 4, ep 23, state [1 1 0 0 1 1 0 0]\n",
      "instance 4, ep 24, state [0 0 0 1 1 1 1 1]\n",
      "instance 4, ep 25, state [1 1 0 0 0 1 1 0]\n",
      "---------------------------------------------------\n",
      "4 500  | a  [0 0 1 0 1 0 1 0]  | s'  [1 0 0 0 1 1 1 0]  | r  4    | WI  [  0.225  -0.      0.551   0.225   0.514   0.415   0.462 -10.   ]\n",
      "instance 4, ep 26, state [1 0 1 0 0 0 0 0]\n",
      "instance 4, ep 27, state [0 1 1 0 1 1 0 0]\n",
      "instance 4, ep 28, state [0 0 1 0 1 1 0 1]\n",
      "instance 4, ep 29, state [0 1 0 1 1 0 1 1]\n",
      "first state [0 0 1 1 0 1 0 1]\n",
      "---------------------------------------------------\n",
      "5 0  | a  [0 0 0 1 0 1 0 1]  | s'  [0 1 0 1 0 0 0 0]  | r  4    | WI  [-10.    -10.      0.125   0.134  -0.432   0.205 -10.      0.163]\n",
      "instance 5, ep 1, state [0 0 1 0 1 1 1 0]\n",
      "instance 5, ep 2, state [0 0 1 1 1 1 1 1]\n",
      "instance 5, ep 3, state [0 1 0 1 1 1 0 0]\n",
      "instance 5, ep 4, state [0 0 0 1 1 0 0 0]\n",
      "instance 5, ep 5, state [1 1 1 0 1 1 0 1]\n",
      "---------------------------------------------------\n",
      "5 100  | a  [1 0 0 1 0 0 1 0]  | s'  [1 1 1 0 0 1 0 1]  | r  6    | WI  [  0.607   0.133   0.225   0.921   0.415 -10.      0.457 -10.   ]\n",
      "instance 5, ep 6, state [0 1 0 1 1 1 1 0]\n",
      "instance 5, ep 7, state [0 0 0 1 0 1 1 1]\n",
      "instance 5, ep 8, state [0 1 1 0 1 1 0 1]\n",
      "instance 5, ep 9, state [0 0 0 0 0 0 1 1]\n",
      "instance 5, ep 10, state [1 0 0 1 0 0 1 0]\n",
      "---------------------------------------------------\n",
      "5 200  | a  [0 0 1 0 0 1 0 1]  | s'  [0 1 1 1 0 1 0 0]  | r  3    | WI  [  0.382   0.406   0.507   0.313 -10.      0.908 -10.      0.494]\n",
      "instance 5, ep 11, state [1 1 0 0 1 0 0 1]\n",
      "instance 5, ep 12, state [0 1 1 0 0 0 0 0]\n",
      "instance 5, ep 13, state [1 0 1 1 1 1 0 1]\n",
      "instance 5, ep 14, state [1 0 0 1 0 0 0 0]\n",
      "instance 5, ep 15, state [1 1 1 0 0 0 0 0]\n",
      "---------------------------------------------------\n",
      "5 300  | a  [0 0 0 1 0 1 1 0]  | s'  [1 0 1 0 0 1 1 0]  | r  3    | WI  [  0.335   0.452   0.212   0.505   0.47    0.908   0.772 -10.   ]\n",
      "instance 5, ep 16, state [1 0 1 0 0 0 1 1]\n",
      "instance 5, ep 17, state [1 0 0 1 0 1 0 0]\n",
      "instance 5, ep 18, state [0 0 1 0 0 0 0 1]\n",
      "instance 5, ep 19, state [1 1 1 0 1 0 0 1]\n",
      "instance 5, ep 20, state [0 1 0 1 1 1 1 1]\n",
      "---------------------------------------------------\n",
      "5 400  | a  [1 0 1 1 0 0 0 0]  | s'  [0 1 0 1 1 0 1 1]  | r  6    | WI  [  0.841   0.319   0.565   0.451   0.415 -10.    -10.    -10.   ]\n",
      "instance 5, ep 21, state [0 1 0 1 1 1 0 0]\n",
      "instance 5, ep 22, state [1 0 0 0 1 1 0 0]\n",
      "instance 5, ep 23, state [0 1 1 0 0 0 1 1]\n",
      "instance 5, ep 24, state [0 0 0 1 0 1 1 0]\n",
      "instance 5, ep 25, state [0 0 1 1 1 1 0 1]\n",
      "---------------------------------------------------\n",
      "5 500  | a  [1 0 0 1 0 0 1 0]  | s'  [1 1 1 1 0 0 1 0]  | r  5    | WI  [  0.841   0.274   0.211   0.464   0.379 -10.      0.772 -10.   ]\n",
      "instance 5, ep 26, state [1 0 1 1 1 1 1 1]\n",
      "instance 5, ep 27, state [0 0 1 0 0 0 0 1]\n",
      "instance 5, ep 28, state [1 0 0 0 1 1 0 1]\n",
      "instance 5, ep 29, state [1 1 1 0 1 0 1 1]\n",
      "first state [0 1 0 1 0 1 0 1]\n",
      "---------------------------------------------------\n",
      "6 0  | a  [0 1 0 1 0 1 0 0]  | s'  [0 1 0 1 0 1 0 0]  | r  4    | WI  [-10.      0.204 -10.      0.116  -0.15    0.106 -10.    -10.   ]\n",
      "instance 6, ep 1, state [1 1 1 1 1 0 1 0]\n",
      "instance 6, ep 2, state [0 0 0 1 1 1 1 0]\n",
      "instance 6, ep 3, state [0 0 0 0 0 1 1 1]\n",
      "instance 6, ep 4, state [1 1 0 1 1 0 0 1]\n",
      "instance 6, ep 5, state [0 1 1 0 0 0 0 0]\n",
      "---------------------------------------------------\n",
      "6 100  | a  [0 0 0 1 1 0 1 0]  | s'  [0 1 1 1 1 0 1 0]  | r  2    | WI  [  0.541   0.196   0.326   0.576   1.    -10.      0.714 -10.   ]\n",
      "instance 6, ep 6, state [1 0 1 0 1 0 0 1]\n",
      "instance 6, ep 7, state [1 0 1 0 0 0 0 1]\n",
      "instance 6, ep 8, state [0 0 1 1 0 1 0 1]\n",
      "instance 6, ep 9, state [1 1 0 0 0 0 0 1]\n",
      "instance 6, ep 10, state [0 0 1 0 1 0 0 0]\n",
      "---------------------------------------------------\n",
      "6 200  | a  [1 1 0 0 0 0 1 0]  | s'  [1 1 1 0 0 0 1 0]  | r  2    | WI  [  0.498   1.      0.327   0.477   0.471 -10.      0.736 -10.   ]\n",
      "instance 6, ep 11, state [0 1 0 1 0 0 1 0]\n",
      "instance 6, ep 12, state [1 1 1 1 0 0 0 1]\n",
      "instance 6, ep 13, state [1 0 1 0 1 0 1 1]\n",
      "instance 6, ep 14, state [0 0 0 0 0 1 1 1]\n",
      "instance 6, ep 15, state [0 1 1 0 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "6 300  | a  [1 0 0 1 0 0 1 0]  | s'  [0 0 1 1 1 0 1 0]  | r  4    | WI  [0.531 0.132 0.328 0.482 0.466 0.395 0.957 0.394]\n",
      "instance 6, ep 16, state [0 0 1 1 1 0 0 1]\n",
      "instance 6, ep 17, state [1 0 1 1 0 0 1 0]\n",
      "instance 6, ep 18, state [0 0 0 1 1 0 1 1]\n",
      "instance 6, ep 19, state [1 0 0 1 1 0 0 0]\n",
      "instance 6, ep 20, state [1 1 0 0 1 1 0 1]\n",
      "---------------------------------------------------\n",
      "6 400  | a  [0 0 0 1 0 0 1 1]  | s'  [1 0 0 1 1 0 0 0]  | r  5    | WI  [  0.238   0.183   0.37    0.511   0.374 -10.      0.597   0.381]\n",
      "instance 6, ep 21, state [1 0 1 0 1 1 1 1]\n",
      "instance 6, ep 22, state [0 1 1 0 1 1 0 1]\n",
      "instance 6, ep 23, state [1 0 1 0 0 0 1 1]\n",
      "instance 6, ep 24, state [0 0 1 0 1 1 1 1]\n",
      "instance 6, ep 25, state [0 1 1 1 0 1 0 0]\n",
      "---------------------------------------------------\n",
      "6 500  | a  [1 0 0 0 1 0 1 0]  | s'  [1 1 0 0 0 0 0 0]  | r  4    | WI  [  0.469   0.196   0.318   0.276   1.    -10.      0.555 -10.   ]\n",
      "instance 6, ep 26, state [0 1 1 1 1 0 1 0]\n",
      "instance 6, ep 27, state [1 1 1 1 0 0 1 0]\n",
      "instance 6, ep 28, state [0 0 1 0 0 1 1 0]\n",
      "instance 6, ep 29, state [0 0 0 0 1 1 1 0]\n",
      "first state [1 0 1 1 1 1 1 0]\n",
      "---------------------------------------------------\n",
      "7 0  | a  [1 0 1 0 1 0 0 0]  | s'  [1 0 1 1 1 1 0 0]  | r  6    | WI  [  0.153   0.04    0.243 -10.      0.162 -10.    -10.    -10.   ]\n",
      "instance 7, ep 1, state [0 0 1 0 1 1 1 1]\n",
      "instance 7, ep 2, state [0 1 1 0 0 1 1 1]\n",
      "instance 7, ep 3, state [1 1 1 0 0 0 1 1]\n",
      "instance 7, ep 4, state [1 0 1 1 1 1 0 1]\n",
      "instance 7, ep 5, state [0 0 0 1 1 1 1 1]\n",
      "---------------------------------------------------\n",
      "7 100  | a  [1 0 1 0 1 0 0 0]  | s'  [1 0 0 0 1 0 0 1]  | r  5    | WI  [  0.914 -10.      0.59  -10.      0.315 -10.    -10.      0.296]\n",
      "instance 7, ep 6, state [1 0 0 0 0 0 0 0]\n",
      "instance 7, ep 7, state [1 0 0 0 1 0 0 1]\n",
      "instance 7, ep 8, state [0 0 0 0 0 0 1 1]\n",
      "instance 7, ep 9, state [1 0 1 0 0 1 0 0]\n",
      "instance 7, ep 10, state [1 1 0 1 1 0 0 0]\n",
      "---------------------------------------------------\n",
      "7 200  | a  [0 0 1 0 1 0 0 1]  | s'  [1 0 1 0 1 0 1 0]  | r  4    | WI  [  0.127 -10.      0.801 -10.      0.321 -10.    -10.      0.444]\n",
      "instance 7, ep 11, state [0 0 1 1 1 0 1 1]\n",
      "instance 7, ep 12, state [1 0 1 0 0 0 1 1]\n",
      "instance 7, ep 13, state [0 0 0 0 0 0 1 0]\n",
      "instance 7, ep 14, state [0 0 1 1 1 0 1 0]\n",
      "instance 7, ep 15, state [1 1 1 1 1 0 1 0]\n",
      "---------------------------------------------------\n",
      "7 300  | a  [0 0 1 0 1 0 0 1]  | s'  [0 0 1 0 1 0 0 0]  | r  6    | WI  [  0.072 -10.      0.208   0.05    0.307 -10.    -10.      0.427]\n",
      "instance 7, ep 16, state [1 0 0 0 0 0 1 0]\n",
      "instance 7, ep 17, state [0 1 0 1 1 1 1 0]\n",
      "instance 7, ep 18, state [1 0 0 1 0 1 1 1]\n",
      "instance 7, ep 19, state [1 0 0 1 0 1 1 1]\n",
      "instance 7, ep 20, state [0 0 0 0 1 0 0 0]\n",
      "---------------------------------------------------\n",
      "7 400  | a  [1 0 1 0 0 0 0 1]  | s'  [0 0 0 0 0 1 1 1]  | r  1    | WI  [  0.986 -10.      0.674   0.407 -10.    -10.    -10.      0.462]\n",
      "instance 7, ep 21, state [1 1 0 0 0 0 1 1]\n",
      "instance 7, ep 22, state [0 0 1 0 1 0 0 0]\n",
      "instance 7, ep 23, state [1 1 0 0 0 0 0 0]\n",
      "instance 7, ep 24, state [1 0 0 1 0 1 0 1]\n",
      "instance 7, ep 25, state [1 1 1 0 1 0 0 0]\n",
      "---------------------------------------------------\n",
      "7 500  | a  [0 0 0 1 1 0 0 1]  | s'  [1 0 0 0 1 0 0 0]  | r  4    | WI  [  0.131 -10.      0.332   0.367   0.335 -10.    -10.      0.443]\n",
      "instance 7, ep 26, state [1 0 1 1 1 1 0 0]\n",
      "instance 7, ep 27, state [0 0 0 0 0 1 1 0]\n",
      "instance 7, ep 28, state [1 0 0 1 0 0 1 1]\n",
      "instance 7, ep 29, state [1 1 1 0 0 0 0 1]\n",
      "first state [1 0 0 1 0 1 0 0]\n",
      "---------------------------------------------------\n",
      "8 0  | a  [0 0 0 1 0 1 0 1]  | s'  [0 0 0 1 0 0 0 1]  | r  3    | WI  [-10.    -10.    -10.      0.193 -10.     -0.038 -10.    -10.   ]\n",
      "instance 8, ep 1, state [1 1 1 1 0 0 1 1]\n",
      "instance 8, ep 2, state [0 1 0 0 0 1 1 0]\n",
      "instance 8, ep 3, state [1 0 0 0 0 0 1 1]\n",
      "instance 8, ep 4, state [1 0 0 0 0 1 0 1]\n",
      "instance 8, ep 5, state [1 0 1 1 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "8 100  | a  [0 1 0 0 0 0 1 1]  | s'  [0 1 1 0 0 1 1 1]  | r  5    | WI  [  0.117   0.441   0.119   0.192 -10.      0.266   0.614   1.   ]\n",
      "instance 8, ep 6, state [0 0 1 0 1 1 0 0]\n",
      "instance 8, ep 7, state [1 1 1 0 0 0 0 1]\n",
      "instance 8, ep 8, state [1 1 1 1 0 0 1 0]\n",
      "instance 8, ep 9, state [1 1 0 1 1 1 1 1]\n",
      "instance 8, ep 10, state [0 0 1 1 0 0 1 1]\n",
      "---------------------------------------------------\n",
      "8 200  | a  [0 1 0 0 1 1 0 0]  | s'  [0 0 1 0 0 0 0 1]  | r  4    | WI  [  0.137   0.441   0.203   0.305   0.846   0.318 -10.    -10.   ]\n",
      "instance 8, ep 11, state [1 1 0 0 1 0 0 0]\n",
      "instance 8, ep 12, state [1 1 0 0 1 1 0 0]\n",
      "instance 8, ep 13, state [0 1 0 0 1 1 0 1]\n",
      "instance 8, ep 14, state [0 1 0 1 0 1 1 1]\n",
      "instance 8, ep 15, state [1 1 0 0 1 0 1 1]\n",
      "---------------------------------------------------\n",
      "8 300  | a  [0 1 0 1 0 1 0 0]  | s'  [0 1 0 1 0 0 0 0]  | r  5    | WI  [  0.12    0.448 -10.      0.962   0.324   0.361 -10.    -10.   ]\n",
      "instance 8, ep 16, state [0 1 0 1 0 0 1 1]\n",
      "instance 8, ep 17, state [1 1 0 1 0 1 1 1]\n",
      "instance 8, ep 18, state [1 0 1 0 1 0 1 1]\n",
      "instance 8, ep 19, state [0 0 1 0 0 0 0 1]\n",
      "instance 8, ep 20, state [1 0 0 0 0 0 0 0]\n",
      "---------------------------------------------------\n",
      "8 400  | a  [0 0 0 1 1 0 0 1]  | s'  [0 0 0 0 0 0 0 1]  | r  1    | WI  [  0.118   0.433   0.217   0.946   0.733 -10.      0.546   0.922]\n",
      "instance 8, ep 21, state [1 0 1 1 1 1 1 1]\n",
      "instance 8, ep 22, state [1 1 1 1 0 0 0 1]\n",
      "instance 8, ep 23, state [1 1 1 0 0 1 1 1]\n",
      "instance 8, ep 24, state [0 1 1 1 1 1 0 1]\n",
      "instance 8, ep 25, state [1 1 1 0 0 1 1 1]\n",
      "---------------------------------------------------\n",
      "8 500  | a  [0 1 0 1 1 0 0 0]  | s'  [0 1 1 1 0 1 0 1]  | r  6    | WI  [  0.12    0.432   0.267   0.946   0.722 -10.    -10.    -10.   ]\n",
      "instance 8, ep 26, state [0 1 1 1 0 1 1 0]\n",
      "instance 8, ep 27, state [1 1 1 0 0 0 0 0]\n",
      "instance 8, ep 28, state [1 0 1 1 1 1 1 1]\n",
      "instance 8, ep 29, state [0 0 1 1 0 1 1 0]\n",
      "first state [0 1 0 0 0 0 1 0]\n",
      "---------------------------------------------------\n",
      "9 0  | a  [0 1 1 0 0 0 1 0]  | s'  [0 1 1 0 0 0 1 0]  | r  2    | WI  [-10.      0.129   0.174 -10.     -0.432  -0.428   0.17  -10.   ]\n",
      "instance 9, ep 1, state [1 1 0 1 1 1 0 0]\n",
      "instance 9, ep 2, state [1 1 1 0 1 0 0 0]\n",
      "instance 9, ep 3, state [1 0 0 1 0 0 0 1]\n",
      "instance 9, ep 4, state [1 0 1 1 0 1 1 1]\n",
      "instance 9, ep 5, state [0 1 1 0 0 0 0 1]\n",
      "---------------------------------------------------\n",
      "9 100  | a  [0 0 0 0 1 1 1 0]  | s'  [0 0 0 0 0 0 1 1]  | r  3    | WI  [  0.336   0.26    0.163   0.394   0.642   1.      0.418 -10.   ]\n",
      "instance 9, ep 6, state [0 0 1 0 1 0 0 0]\n",
      "instance 9, ep 7, state [0 0 1 1 0 1 1 1]\n",
      "instance 9, ep 8, state [0 0 0 1 1 0 0 1]\n",
      "instance 9, ep 9, state [1 1 1 0 1 1 0 1]\n",
      "instance 9, ep 10, state [1 0 1 1 1 0 0 1]\n",
      "---------------------------------------------------\n",
      "9 200  | a  [0 1 0 0 0 1 1 0]  | s'  [1 0 0 0 1 1 0 1]  | r  5    | WI  [0.307 0.819 0.201 0.158 0.254 0.77  0.457 0.276]\n",
      "instance 9, ep 11, state [0 1 1 0 1 1 0 1]\n",
      "instance 9, ep 12, state [1 1 1 0 1 1 1 1]\n",
      "instance 9, ep 13, state [0 1 0 0 0 1 1 1]\n",
      "instance 9, ep 14, state [1 1 1 0 0 0 1 1]\n",
      "instance 9, ep 15, state [0 0 1 0 1 1 0 0]\n",
      "---------------------------------------------------\n",
      "9 300  | a  [0 1 0 0 1 0 0 1]  | s'  [0 1 1 0 1 1 0 1]  | r  3    | WI  [  0.647   0.935   0.202   0.243   0.691 -10.    -10.      0.668]\n",
      "instance 9, ep 16, state [1 1 1 1 0 1 1 1]\n",
      "instance 9, ep 17, state [0 1 1 0 0 1 0 0]\n",
      "instance 9, ep 18, state [0 1 1 1 0 1 1 1]\n",
      "instance 9, ep 19, state [1 0 1 0 1 0 0 0]\n",
      "instance 9, ep 20, state [1 0 1 0 0 1 0 0]\n",
      "---------------------------------------------------\n",
      "9 400  | a  [0 1 0 0 1 0 0 1]  | s'  [0 1 1 0 0 0 0 0]  | r  3    | WI  [  0.27    0.947   0.197   0.384   0.563 -10.      0.523   0.668]\n",
      "instance 9, ep 21, state [1 0 0 0 1 1 1 1]\n",
      "instance 9, ep 22, state [0 0 1 0 0 0 0 1]\n",
      "instance 9, ep 23, state [0 1 0 1 0 0 1 1]\n",
      "instance 9, ep 24, state [0 0 0 0 0 0 0 0]\n",
      "instance 9, ep 25, state [1 1 1 0 0 1 0 0]\n",
      "---------------------------------------------------\n",
      "9 500  | a  [0 0 0 0 1 0 1 1]  | s'  [0 0 1 0 0 1 0 1]  | r  4    | WI  [0.262 0.263 0.199 0.353 0.54  0.299 0.522 0.668]\n",
      "instance 9, ep 26, state [1 1 1 0 0 1 0 1]\n",
      "instance 9, ep 27, state [1 1 0 0 1 1 1 0]\n",
      "instance 9, ep 28, state [0 1 1 1 0 1 1 1]\n",
      "instance 9, ep 29, state [0 0 1 0 0 1 0 1]\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "3.5568333333333335"
      ]
     },
     "execution_count": 15,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Reset both global RNGs (stdlib and NumPy) to the shared seed before this run.\n",
    "random.seed(seed)\n",
    "np.random.seed(seed)\n",
    "\n",
    "# Oracle variant of UCWhittle, called with the same arguments as the non-oracle run.\n",
    "# NOTE(review): presumably the oracle uses the true transitions, in which case\n",
    "# norm_confidence=True may have no effect here -- confirm in rmab.uc_whittle.\n",
    "perfect_rewards = UCWhittleOracle(\n",
    "    simulator,\n",
    "    n_episodes,\n",
    "    n_epochs,\n",
    "    discount,\n",
    "    alpha=alpha,\n",
    "    method='UCB',\n",
    "    norm_confidence=True,\n",
    ")\n",
    "\n",
    "# Last expression: the mean of the returned rewards is shown as the cell output.\n",
    "np.mean(perfect_rewards)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "first state [0 1 1 1 1 1 1 1]\n",
      "   state [0 1 1 1 1 1 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52 -10.   -10.  ] sorted [3 5 2]\n",
      "   state [0 1 1 1 1 1 0 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 6 2]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [0.39 0.47 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 5 6]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [  0.26   0.54   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 1 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.47   0.58   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.26   0.54   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 1 6]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [5 2 1]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 6 2]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.26   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [1 0 1 1 0 1 0 1] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 1 2]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [  0.26   0.47   0.58   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [0.26 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "   state [0 1 1 1 1 1 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [1 1 1 0 1 1 0 1] state_WI [  0.26   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "   state [1 0 1 1 0 1 0 1] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [  0.26   0.47   0.47   0.71   0.45   0.52 -10.   -10.  ] sorted [3 5 2]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.26   0.54   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 1]\n",
      "instance 0, ep 1, state [0 0 0 1 1 1 0 1]\n",
      "   state [0 0 0 1 1 1 0 1] state_WI [  0.39   0.54   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 1 6]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 6]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [0.39 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.     0.49 -10.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 5 6]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [0.39 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.39   0.54   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 1 5]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [0.39 0.47 0.58 0.71 0.45 0.52 0.49 0.82] sorted [7 3 2]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.     0.49 -10.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 6]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 1 2]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 5 1]\n",
      "   state [1 1 0 1 1 1 0 0] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 6]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.26   0.54   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [0.39 0.47 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 5]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 6 1]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 6 1]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.26   0.54   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 1 6]\n",
      "instance 0, ep 2, state [0 1 1 1 0 0 0 1]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52 -10.     0.82] sorted [7 3 5]\n",
      "   state [0 1 0 1 1 1 0 1] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 6 1]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 5 1]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52 -10.     0.82] sorted [7 2 5]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 5 1]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [1 2 4]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [1 2 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [0.39 0.54 0.58 0.71 0.45 0.52 0.49 0.82] sorted [7 3 2]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.39   0.47   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 5]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 5 6]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 6]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.39   0.47   0.58   0.71   0.45 -10.     0.49   0.82] sorted [7 3 2]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.     0.49   0.82] sorted [7 3 2]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [0.39 0.54 0.58 0.71 0.45 0.52 0.49 0.82] sorted [7 3 2]\n",
      "instance 0, ep 3, state [0 0 0 1 0 1 1 0]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [  0.39   0.54   0.58   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.39   0.47   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 5]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [0.39 0.47 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 5]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 1 6]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.26   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [1 0 1 1 1 1 0 0] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 1 6]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 5 1]\n",
      "   state [0 0 0 1 0 1 1 1] state_WI [  0.39   0.54   0.58   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.39   0.47   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 5]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [0.39 0.47 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 5]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [0.39 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 1 6]\n",
      "   state [0 1 1 0 0 1 1 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.   -10.   -10.  ] sorted [3 2 1]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52 -10.     0.82] sorted [7 3 5]\n",
      "   state [0 0 1 1 1 1 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [1 2 4]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [5 2 1]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52 -10.   -10.  ] sorted [3 5 2]\n",
      "   state [1 0 1 1 0 1 0 1] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.39   0.54   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 1]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 6]\n",
      "instance 0, ep 4, state [1 1 0 1 1 1 1 1]\n",
      "   state [1 1 0 1 1 1 1 1] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [  0.26   0.47   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [0.39 0.47 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 5]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [0 0 1 1 1 0 1 0] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 1 5]\n",
      "   state [1 0 1 1 0 1 0 0] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 1 6]\n",
      "   state [0 0 1 0 0 1 1 1] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.   -10.   -10.  ] sorted [3 1 2]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [  0.26   0.54   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 1 5]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 6 2]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.26   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 1 5]\n",
      "   state [1 1 1 1 0 0 1 1] state_WI [  0.26   0.47   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [5 2 1]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [0 1 1 1 0 1 1 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [1 0 1 1 0 1 1 1] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [1 2 4]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [1 5 2]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [1 5 2]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.   -10.   -10.  ] sorted [3 2 1]\n",
      "instance 0, ep 5, state [0 0 0 0 0 1 0 0]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.     0.49   0.82] sorted [7 3 2]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [0.39 0.47 0.58 0.71 0.45 0.52 0.49 0.82] sorted [7 3 2]\n",
      "   state [0 0 1 1 1 0 1 0] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 1 5]\n",
      "   state [1 1 1 1 1 1 0 0] state_WI [  0.26   0.47   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 6 2]\n",
      "   state [1 1 1 1 0 0 1 1] state_WI [  0.26   0.47   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [5 2 1]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 6]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.39   0.54   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 1 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 1]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 5 6]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 6 2]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.39   0.47   0.58   0.71   0.45   0.52 -10.   -10.  ] sorted [3 2 5]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.39   0.54   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 1 5]\n",
      "   state [0 1 1 1 1 0 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [1 0 1 1 1 0 1 1] state_WI [  0.26   0.54   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [1 5 2]\n",
      "instance 0, ep 6, state [0 1 0 1 0 0 0 0]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [0.39 0.47 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 5]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.39   0.54   0.58   0.26   0.45   0.52 -10.     0.82] sorted [7 2 1]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [0.39 0.54 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 1]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 5 6]\n",
      "   state [0 0 0 1 0 1 1 1] state_WI [  0.39   0.54   0.58   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.39   0.47   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 5]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 1 6]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 6 1]\n",
      "   state [0 1 0 0 0 1 0 1] state_WI [  0.39   0.47   0.58   0.71   0.45 -10.     0.49 -10.  ] sorted [3 2 6]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [  0.26   0.54   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [1 5 2]\n",
      "   state [1 1 1 1 0 1 0 1] state_WI [  0.26   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [1 1 1 1 0 1 0 1] state_WI [  0.26   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [  0.26   0.54   0.47   0.71   0.45 -10.   -10.   -10.  ] sorted [3 1 2]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 1 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.26   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 5 6]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.39   0.54   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 1]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [  0.26   0.54   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 1 6]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [0.39 0.47 0.58 0.71 0.45 0.52 0.49 0.82] sorted [7 3 2]\n",
      "instance 0, ep 7, state [1 0 1 0 0 0 0 1]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.26   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [0.39 0.47 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 5]\n",
      "   state [1 0 1 1 0 1 1 1] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [1 2 4]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [  0.26   0.47   0.47   0.71   0.45   0.52 -10.   -10.  ] sorted [3 5 2]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.39   0.54   0.47   0.71   0.45   0.52 -10.     0.82] sorted [7 3 1]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [0.39 0.47 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 5]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [  0.26   0.54   0.47   0.71   0.45 -10.   -10.   -10.  ] sorted [3 1 2]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.     0.49 -10.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [1 1 1 1 0 0 1 1] state_WI [  0.26   0.47   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [5 2 1]\n",
      "   state [0 1 1 1 0 1 1 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52 -10.   -10.  ] sorted [3 5 2]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.39   0.47   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 5]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [  0.39   0.54   0.58   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 6 1]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [  0.26   0.47   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 5 6]\n",
      "   state [0 1 1 1 0 1 1 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "instance 0, ep 8, state [0 0 0 0 1 1 0 1]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.     0.49 -10.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [0.39 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 1]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 1]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26   0.47   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 5 6]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [0.39 0.54 0.58 0.71 0.45 0.52 0.49 0.82] sorted [7 3 2]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52 -10.     0.82] sorted [7 2 5]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 1 2]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [0.39 0.47 0.58 0.71 0.45 0.52 0.49 0.82] sorted [7 3 2]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [0.26 0.47 0.58 0.71 0.45 0.52 0.49 0.82] sorted [7 3 2]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52 -10.   -10.  ] sorted [3 5 2]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.39   0.54   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 1 5]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 5 2]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [0.39 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "instance 0, ep 9, state [0 1 0 0 0 1 1 1]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.39   0.47   0.58   0.71   0.45 -10.   -10.   -10.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [  0.26   0.47   0.58   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.26   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [1 1 1 1 0 1 0 0] state_WI [  0.26   0.47   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 6 2]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [  0.26   0.47   0.58   0.71   0.45   0.52 -10.   -10.  ] sorted [3 2 5]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [  0.26   0.54   0.58   0.26   0.45   0.52 -10.     0.82] sorted [7 2 1]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.26   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.26   0.54   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 1]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [  0.26   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [1 0 1 1 0 1 0 1] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52 -10.   -10.  ] sorted [3 5 2]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [0.39 0.54 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 1]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 1]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.39   0.54   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 1 5]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 1 6]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 1 2]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [0.39 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "   state [0 0 1 0 0 1 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 1 6]\n",
      "instance 0, ep 10, state [0 1 1 0 0 0 1 0]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52 -10.     0.82] sorted [7 3 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [0.39 0.47 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 5]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [  0.26   0.54   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 1 6]\n",
      "   state [1 0 0 1 0 1 1 1] state_WI [  0.26   0.54   0.58   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 1 5]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.39   0.47   0.58   0.71   0.45   0.52 -10.   -10.  ] sorted [3 2 5]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "   state [1 0 1 1 0 1 0 1] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [1 1 1 0 1 0 0 1] state_WI [  0.26   0.47   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 5 6]\n",
      "   state [1 0 1 1 0 1 0 0] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 1 6]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 1 2]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [  0.26   0.54   0.47   0.71   0.45   0.52 -10.   -10.  ] sorted [3 1 5]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 6]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.39   0.47   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 5]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 6]\n",
      "instance 0, ep 11, state [1 0 1 1 0 1 1 1]\n",
      "   state [1 0 1 1 0 1 1 1] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [1 2 4]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [0.39 0.47 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 5 6]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.47   0.58   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [1 0 0 0 0 1 0 1] state_WI [  0.26   0.54   0.58   0.71   0.45 -10.     0.49 -10.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 6 2]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [0.26 0.54 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 1]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [0.39 0.47 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 5]\n",
      "   state [1 1 1 1 1 0 0 0] state_WI [0.26 0.47 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 5 6]\n",
      "   state [1 0 1 1 1 1 0 1] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [1 0 0 1 1 1 1 1] state_WI [  0.26   0.54   0.58   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.26   0.54   0.58   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [1 0 1 1 0 0 0 1] state_WI [  0.26   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "   state [0 1 1 1 0 1 1 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52 -10.     0.82] sorted [7 3 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 1]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.     0.49   0.82] sorted [7 3 2]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.26   0.54   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 1 5]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [0.39 0.47 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 5]\n",
      "   state [1 1 1 0 0 1 0 0] state_WI [  0.26   0.47   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 6]\n",
      "instance 0, ep 12, state [0 0 1 1 0 0 1 0]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 1 5]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 1]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [  0.26   0.47   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 5 6]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [  0.26   0.47   0.47   0.71   0.45   0.52 -10.     0.82] sorted [7 3 5]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.39   0.54   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 1 5]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [0.39 0.47 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 5 6]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 6]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.39   0.54   0.47   0.71   0.45   0.52 -10.   -10.  ] sorted [3 1 5]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.     0.49   0.82] sorted [7 3 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.26   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [0.39 0.54 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 1]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 6 1]\n",
      "   state [1 1 1 0 0 0 1 0] state_WI [  0.26   0.47   0.47   0.71   0.45   0.52 -10.     0.82] sorted [7 3 5]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [0.26 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [0.39 0.54 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 1]\n",
      "   state [0 1 1 0 1 1 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [1 1 1 1 0 1 0 1] state_WI [  0.26   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "instance 0, ep 13, state [1 1 1 1 0 1 1 0]\n",
      "   state [1 1 1 1 0 1 1 0] state_WI [  0.26   0.47   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [1 1 1 0 0 1 0 1] state_WI [  0.26   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [5 2 1]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [1 2 4]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [0.39 0.47 0.58 0.71 0.45 0.52 0.49 0.82] sorted [7 3 2]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26   0.47   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 5 6]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [0.26 0.47 0.58 0.71 0.45 0.52 0.49 0.82] sorted [7 3 2]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26   0.47   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 5 6]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 6]\n",
      "   state [1 1 0 1 0 1 1 1] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [0.26 0.47 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.26   0.54   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 1]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.26   0.54   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 1]\n",
      "   state [0 0 1 0 0 1 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 1 6]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 5 1]\n",
      "   state [0 0 1 1 1 1 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [1 2 4]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 1 5]\n",
      "instance 0, ep 14, state [0 1 1 0 1 1 1 1]\n",
      "   state [0 1 1 0 1 1 1 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.   -10.   -10.  ] sorted [3 2 1]\n",
      "   state [1 1 1 1 0 1 0 1] state_WI [  0.26   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [  0.26   0.47   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 5 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.26   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [0.39 0.47 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 5]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [1 2 4]\n",
      "   state [0 0 1 1 1 1 0 0] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 1 6]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.39   0.47   0.58   0.71   0.45   0.52 -10.   -10.  ] sorted [3 2 5]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [0.26 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [0.26 0.47 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 5]\n",
      "   state [1 1 1 0 0 1 0 1] state_WI [  0.26   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.   -10.     0.82] sorted [7 3 1]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 1 6]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.39   0.47   0.58   0.71   0.45   0.52 -10.   -10.  ] sorted [3 2 5]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.   -10.   -10.  ] sorted [3 2 1]\n",
      "   state [1 0 1 0 1 1 1 1] state_WI [  0.26   0.54   0.47   0.71   0.45 -10.   -10.   -10.  ] sorted [3 1 2]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 1 2]\n",
      "   state [1 1 1 1 0 1 1 0] state_WI [  0.26   0.47   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "instance 0, ep 15, state [0 0 1 1 1 0 1 1]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [1 5 2]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.39   0.54   0.58   0.71   0.45   0.52 -10.     0.82] sorted [7 3 2]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [0.39 0.54 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 1]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [0.39 0.47 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 5 6]\n",
      "   state [0 0 1 0 0 1 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 1 6]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.39   0.54   0.58   0.71   0.45   0.52 -10.   -10.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [5 2 1]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [  0.26   0.47   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 5 2]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "   state [1 1 1 1 0 1 0 1] state_WI [  0.26   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [1 1 1 0 0 1 0 0] state_WI [  0.26   0.47   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 6]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [0.26 0.54 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 1]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [0.26 0.47 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 5]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 1 5]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [1 2 4]\n",
      "   state [0 1 1 1 1 1 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [0 1 1 1 1 1 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "instance 0, ep 16, state [1 1 1 1 0 1 1 0]\n",
      "   state [1 1 1 1 0 1 1 0] state_WI [  0.26   0.47   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [  0.26   0.54   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [1 5 2]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 6 1]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26   0.47   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 5 6]\n",
      "   state [1 1 0 1 0 1 1 0] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.26   0.54   0.47   0.71   0.45   0.52 -10.     0.82] sorted [7 3 1]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [  0.26   0.54   0.58   0.26   0.45   0.52 -10.     0.82] sorted [7 2 1]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.     0.49 -10.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 6]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.39   0.54   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 1 5]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.39   0.54   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 1 5]\n",
      "   state [0 0 0 1 0 1 1 1] state_WI [  0.39   0.54   0.58   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 6]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.26   0.54   0.58   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.   -10.     0.82] sorted [7 3 1]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [0.39 0.54 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 1]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [0.39 0.54 0.58 0.71 0.45 0.52 0.49 0.82] sorted [7 3 2]\n",
      "instance 0, ep 17, state [0 0 0 1 0 0 0 0]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [0.39 0.54 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 1]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 1 5]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.39   0.54   0.58   0.26   0.45   0.52 -10.     0.82] sorted [7 2 1]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.39   0.54   0.58   0.26   0.45   0.52 -10.     0.82] sorted [7 2 1]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [0.39 0.54 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 1]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [0.39 0.47 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 5 6]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.     0.49 -10.  ] sorted [3 2 1]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.26   0.54   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 1]\n",
      "   state [1 1 0 1 1 1 0 1] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 6 1]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 6]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [0.39 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.39   0.47   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 5]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.     0.49 -10.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [0.39 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [0.26 0.47 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 5]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.26   0.54   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 1]\n",
      "   state [1 0 1 1 0 1 0 0] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 1 6]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.26   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "instance 0, ep 18, state [0 1 1 0 1 1 1 0]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 1 6]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.39   0.54   0.58   0.71   0.45   0.52 -10.   -10.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.39   0.54   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 1 5]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [1 2 4]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [5 2 1]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [  0.26   0.47   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 5 6]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [  0.26   0.54   0.58   0.71   0.45   0.52 -10.   -10.  ] sorted [3 2 1]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [0.26 0.54 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 1]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 5 6]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [0.39 0.54 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 1]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 1 0 1 0 1] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [0 0 1 0 0 1 1 1] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.   -10.   -10.  ] sorted [3 1 2]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.39   0.54   0.47   0.71   0.45   0.52 -10.   -10.  ] sorted [3 1 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.47   0.58   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [1 1 1 1 0 1 1 1] state_WI [  0.26   0.47   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [1 1 1 0 0 1 1 1] state_WI [  0.26   0.47   0.47   0.71   0.45 -10.   -10.   -10.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1 1 1 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "instance 0, ep 19, state [1 1 0 1 0 0 1 1]\n",
      "   state [1 1 0 1 0 0 1 1] state_WI [  0.26   0.47   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 5 1]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [5 2 1]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [0 1 1 1 1 1 0 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 6 2]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 1 6]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.39   0.54   0.58   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [1 1 0 1 0 1 1 0] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [0.26 0.47 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 5]\n",
      "   state [1 1 1 1 0 0 0 0] state_WI [0.26 0.47 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 5 6]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.39   0.54   0.58   0.71   0.45   0.52 -10.   -10.  ] sorted [3 2 1]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [0.26 0.47 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 1]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [0.26 0.54 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 1]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26   0.47   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 5 6]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.39   0.47   0.58   0.71   0.45 -10.   -10.   -10.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 5 2]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52 -10.     0.82] sorted [7 3 5]\n",
      "instance 0, ep 20, state [1 0 0 1 1 0 1 0]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [  0.26   0.54   0.58   0.26   0.45   0.52 -10.     0.82] sorted [7 2 1]\n",
      "   state [1 1 1 0 1 0 0 1] state_WI [  0.26   0.47   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 5 6]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.39   0.54   0.58   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [0.39 0.54 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 1]\n",
      "   state [0 1 1 0 1 0 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 5 6]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [0.39 0.47 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 5 6]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 1 6]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [0.39 0.47 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 5]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.   -10.     0.82] sorted [7 3 1]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [0.39 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "   state [1 1 1 0 0 1 0 1] state_WI [  0.26   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "   state [1 1 1 0 0 1 0 1] state_WI [  0.26   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [0.26 0.47 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 5]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 6]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 5 6]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [0 1 1 0 0 1 1 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.   -10.   -10.  ] sorted [3 2 1]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 5 6]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52 -10.     0.82] sorted [7 3 5]\n",
      "instance 0, ep 21, state [0 1 1 1 0 1 1 1]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.26   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.26   0.54   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 1]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26   0.47   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 5 6]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 6 2]\n",
      "   state [0 0 1 0 0 1 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 1 6]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 5 2]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [  0.26   0.54   0.58   0.71   0.45   0.52 -10.   -10.  ] sorted [3 2 1]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [  0.26   0.54   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [1 5 2]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.26   0.54   0.47   0.71   0.45 -10.   -10.     0.82] sorted [7 3 1]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 6]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [0.39 0.54 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 1]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.39   0.47   0.58   0.71   0.45 -10.     0.49   0.82] sorted [7 3 2]\n",
      "   state [0 1 1 0 1 1 1 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.   -10.   -10.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [5 2 1]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 5 2]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [0.26 0.54 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 1]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [  0.26   0.54   0.47   0.71   0.45   0.52 -10.   -10.  ] sorted [3 1 5]\n",
      "instance 0, ep 22, state [0 0 0 0 0 0 0 1]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 1]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.39   0.54   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 1]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [0.26 0.54 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 1]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [0.26 0.54 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 1]\n",
      "   state [1 0 1 1 0 0 0 1] state_WI [  0.26   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.39   0.47   0.58   0.71   0.45 -10.     0.49   0.82] sorted [7 3 2]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 6]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.26   0.54   0.47   0.71   0.45   0.52 -10.     0.82] sorted [7 3 1]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [  0.26   0.47   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 5 6]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [  0.26   0.54   0.58   0.26   0.45   0.52 -10.     0.82] sorted [7 2 1]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [  0.26   0.47   0.58   0.71   0.45   0.52 -10.   -10.  ] sorted [3 2 5]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [  0.26   0.47   0.58   0.71   0.45   0.52 -10.     0.82] sorted [7 3 2]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 5 1]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.26   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.   -10.     0.82] sorted [7 1 2]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [  0.26   0.54   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 1 5]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.26   0.54   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 1 6]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [  0.26   0.47   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 5 2]\n",
      "   state [1 0 1 1 0 0 0 1] state_WI [  0.26   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "instance 0, ep 23, state [1 0 0 1 0 0 0 0]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [0.26 0.54 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 1]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [0.39 0.54 0.58 0.71 0.45 0.52 0.49 0.82] sorted [7 3 2]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 1 1 1 1 1 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.   -10.     0.82] sorted [7 3 1]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.26   0.47   0.58   0.71   0.45 -10.     0.49   0.82] sorted [7 3 2]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.26   0.54   0.58   0.71   0.45 -10.   -10.   -10.  ] sorted [3 2 1]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [0.26 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.39   0.54   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 1 6]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.47   0.58   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 5 6]\n",
      "   state [1 0 0 1 0 1 1 1] state_WI [  0.26   0.54   0.58   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.39   0.54   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 1 5]\n",
      "   state [0 1 1 0 0 1 1 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.   -10.   -10.  ] sorted [3 2 1]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [5 2 1]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.47   0.58   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 1 6]\n",
      "instance 0, ep 24, state [1 0 1 1 0 0 0 1]\n",
      "   state [1 0 1 1 0 0 0 1] state_WI [  0.26   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.26   0.47   0.58   0.71   0.45 -10.     0.49   0.82] sorted [7 3 2]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [  0.26   0.54   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 1 6]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [0.39 0.47 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 5 6]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.39   0.47   0.58   0.71   0.45 -10.   -10.   -10.  ] sorted [3 2 1]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 6]\n",
      "   state [0 0 0 1 0 1 1 1] state_WI [  0.39   0.54   0.58   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [1 0 1 1 1 1 0 1] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [0 1 1 0 1 0 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 5 6]\n",
      "   state [0 1 1 1 1 1 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 6]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.39   0.47   0.58   0.71   0.45   0.52 -10.   -10.  ] sorted [3 2 5]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [1 2 4]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 6 2]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [0.39 0.47 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 5]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.26   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [0.26 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.39   0.47   0.58   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "instance 0, ep 25, state [0 0 1 0 0 0 0 1]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.     0.49 -10.  ] sorted [3 2 1]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.     0.49 -10.  ] sorted [3 2 1]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.47   0.58   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 6 1]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.39   0.54   0.58   0.26   0.45   0.52 -10.     0.82] sorted [7 2 1]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.   -10.   -10.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [1 5 2]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 6 2]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [1 2 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [0.39 0.54 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 1]\n",
      "   state [0 0 1 0 0 1 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 1 6]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 6 2]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [  0.26   0.54   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [1 5 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.26   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.39   0.47   0.58   0.71   0.45 -10.     0.49   0.82] sorted [7 3 2]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.   -10.     0.82] sorted [7 2 1]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 6]\n",
      "instance 0, ep 26, state [0 1 0 1 0 0 1 1]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 5 1]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [5 2 1]\n",
      "   state [0 1 1 0 1 1 0 0] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 6]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [0.39 0.54 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 1]\n",
      "   state [0 1 1 0 1 1 0 0] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 6]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [0.26 0.54 0.58 0.71 0.45 0.52 0.49 0.82] sorted [7 3 2]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.26   0.54   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 1 5]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 6]\n",
      "   state [1 1 0 1 0 1 1 1] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [1 1 1 0 1 1 1 0] state_WI [  0.26   0.47   0.47   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.26   0.54   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 1]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 6 1]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 6 1]\n",
      "   state [1 0 0 1 0 1 1 1] state_WI [  0.26   0.54   0.58   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [0.39 0.54 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 1]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.39   0.47   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 5]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.39   0.54   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 1 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 1]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [1 5 2]\n",
      "instance 0, ep 27, state [1 0 0 0 1 0 1 0]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.26   0.54   0.58   0.71   0.45   0.52 -10.     0.82] sorted [7 3 2]\n",
      "   state [1 0 0 1 1 0 0 1] state_WI [  0.26   0.54   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 1 5]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.     0.49   0.82] sorted [7 3 2]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.   -10.     0.82] sorted [7 3 2]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.39   0.54   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 1 6]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.39   0.54   0.58   0.71   0.45   0.52 -10.     0.82] sorted [7 3 2]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [1 5 6]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.     0.49 -10.  ] sorted [3 2 1]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.39   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 6 1]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [0.26 0.47 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 5]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [  0.26   0.54   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 1 6]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [0.26 0.54 0.47 0.71 0.45 0.52 0.49 0.82] sorted [7 3 1]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [  0.26   0.47   0.58   0.71   0.45   0.52 -10.     0.82] sorted [7 3 2]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [  0.26   0.54   0.47   0.26   0.45   0.52 -10.     0.82] sorted [7 1 5]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 6 2]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 6]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.39   0.54   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 1 6]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.39   0.47   0.47   0.71   0.45 -10.     0.49 -10.  ] sorted [3 6 2]\n",
      "instance 0, ep 28, state [1 0 1 0 0 1 0 0]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.26   0.54   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 1]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [0.39 0.54 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 1]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.26   0.54   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 1 5]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [0.26 0.54 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 1]\n",
      "   state [1 1 1 1 0 0 0 0] state_WI [0.26 0.47 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 5 6]\n",
      "   state [1 1 0 0 1 0 0 1] state_WI [  0.26   0.47   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 5]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [0.26 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "   state [1 1 1 1 0 1 0 0] state_WI [  0.26   0.47   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 6 2]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [6 2 1]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [5 2 1]\n",
      "   state [1 1 1 1 0 1 0 0] state_WI [  0.26   0.47   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 6 2]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.39   0.54   0.58   0.71   0.45   0.52 -10.   -10.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [1 5 2]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52 -10.   -10.  ] sorted [2 5 1]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.39   0.47   0.47   0.71   0.45   0.52 -10.   -10.  ] sorted [3 5 2]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.39   0.54   0.47   0.26   0.45 -10.     0.49   0.82] sorted [7 1 6]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [1 5 2]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [  0.26   0.47   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 5 6]\n",
      "   state [1 1 0 1 0 1 1 1] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.   -10.   -10.  ] sorted [2 1 4]\n",
      "   state [1 1 0 1 1 1 0 1] state_WI [  0.26   0.47   0.58   0.26   0.45 -10.     0.49 -10.  ] sorted [2 6 1]\n",
      "instance 0, ep 29, state [1 1 0 0 0 1 0 0]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.26   0.47   0.58   0.71   0.45 -10.     0.49   0.82] sorted [7 3 2]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 1]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 1]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [0.39 0.54 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 1 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.39   0.54   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 1]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.39   0.54   0.58   0.71   0.45   0.52   0.49 -10.  ] sorted [3 2 1]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [0.26 0.54 0.58 0.71 0.45 0.52 0.49 0.82] sorted [7 3 2]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.39   0.54   0.58   0.71   0.45 -10.   -10.   -10.  ] sorted [3 2 1]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52 -10.     0.82] sorted [7 2 5]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.47   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 6]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [5 2 1]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.39   0.54   0.47   0.26   0.45   0.52 -10.   -10.  ] sorted [1 5 2]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [0.39 0.47 0.47 0.26 0.45 0.52 0.49 0.82] sorted [7 5 6]\n",
      "   state [1 1 1 0 0 1 0 0] state_WI [  0.26   0.47   0.47   0.71   0.45 -10.     0.49   0.82] sorted [7 3 6]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.26   0.54   0.58   0.26   0.45 -10.     0.49   0.82] sorted [7 2 1]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.39   0.47   0.58   0.26   0.45   0.52   0.49 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 1 0 1 0 1] state_WI [  0.26   0.54   0.47   0.26   0.45 -10.     0.49 -10.  ] sorted [1 6 2]\n",
      "   state [1 1 1 0 1 0 0 1] state_WI [  0.26   0.47   0.47   0.71   0.45   0.52   0.49 -10.  ] sorted [3 5 6]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [0.26 0.47 0.58 0.26 0.45 0.52 0.49 0.82] sorted [7 2 5]\n",
      "   state [0 1 1 1 1 0 0 1] state_WI [  0.39   0.47   0.47   0.26   0.45   0.52   0.49 -10.  ] sorted [5 6 2]\n",
      "first state [1 1 1 0 0 1 1 1]\n",
      "   state [1 1 1 0 0 1 1 1] state_WI [  0.26 -10.     0.12   0.67   0.27   0.49 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.26   0.82   0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.71   0.82   0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 1 1 1 1 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "instance 1, ep 1, state [0 1 1 0 0 1 0 0]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.71 -10.     0.12   0.67   0.27   0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.71   0.82   0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [0 0 0 1 1 1 1 1] state_WI [  0.71   0.82   0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.71   0.82   0.15   0.67 -10.     0.47 -10.     0.55] sorted [1 0 3]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.71   0.82   0.15   0.67   0.27   0.49 -10.     0.55] sorted [1 0 3]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [1 1 0 1 0 1 1 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 0 0 1 1 1 1 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 1 0 0 0 1 1 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 0 0 0 1 0 1] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [1 0 0 1 1 1 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.71 -10.     0.12   0.67   0.27   0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "instance 1, ep 2, state [0 0 0 1 1 0 1 1]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.71 -10.     0.12   0.28 -10.     0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.26   0.82   0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 0 0 0 1 1 1 1] state_WI [  0.26   0.82   0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 1 0 0 1 1 0 1] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [3 5 0]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.26   0.82   0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "instance 1, ep 3, state [0 0 0 0 1 1 0 1]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.71   0.82   0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.26   0.82   0.12   0.67   0.27   0.47 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [  0.26 -10.     0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [3 5 0]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 0 0 1 0 1 1 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 1 1 1 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [1 0 0 1 1 1 1 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.71   0.82   0.15   0.28   0.27   0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [  0.71   0.82   0.12   0.67   0.27   0.47 -10.     0.55] sorted [1 0 3]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.71   0.82   0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 1 1 0 1 1 0 1] state_WI [  0.71 -10.     0.12   0.67 -10.     0.49 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [5 3 4]\n",
      "instance 1, ep 4, state [1 0 1 1 1 0 1 1]\n",
      "   state [1 0 1 1 1 0 1 1] state_WI [  0.26   0.82   0.12   0.28 -10.     0.47 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.71   0.82   0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [1 0 0 1 1 0 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.71   0.82   0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "instance 1, ep 5, state [1 1 1 1 1 1 0 0]\n",
      "   state [1 1 1 1 1 1 0 0] state_WI [  0.26 -10.     0.12   0.28 -10.     0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [  0.26   0.82   0.12   0.28   0.27   0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [1 1 0 0 1 0 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.71   0.82   0.12   0.67 -10.     0.47 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 1 0 1 0 1 1 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [1 0 1 1 0 1 0 0] state_WI [  0.26   0.82   0.12   0.28   0.27   0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 1 0 0 1 1 1 1] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [3 5 0]\n",
      "   state [1 1 0 0 1 1 1 1] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [3 5 0]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 0 0 1 1 1 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 0 0 1 0 1] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.47 -10.     0.55] sorted [1 7 5]\n",
      "instance 1, ep 6, state [0 1 0 1 0 1 1 1]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [  0.71 -10.     0.12   0.67 -10.     0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 1 0 1 1 1 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.71 -10.     0.12   0.67   0.27   0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.26   0.82   0.12   0.67   0.27   0.47 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.71   0.82   0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [1 1 0 1 1 1 0 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [  0.26 -10.     0.12   0.67   0.27   0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 1 1 0 1 0 0 1] state_WI [  0.71 -10.     0.12   0.67 -10.     0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [  0.71   0.82   0.15   0.28   0.27   0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 1 0 0 1 0 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.71   0.82   0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "instance 1, ep 7, state [0 1 1 0 1 0 0 1]\n",
      "   state [0 1 1 0 1 0 0 1] state_WI [  0.71 -10.     0.12   0.67 -10.     0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.71   0.82   0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 1 0 0 1 1 0 1] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [3 5 0]\n",
      "   state [1 0 0 1 1 1 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.71   0.82   0.15   0.28   0.27   0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 1 1 1 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.71   0.82   0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 1 1 1 1 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 1 1 0 0 0 0] state_WI [  0.26 -10.     0.12   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "instance 1, ep 8, state [0 0 0 0 0 1 1 1]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.71   0.82   0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.71 -10.     0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 1 1 1 0 1 0 0] state_WI [  0.26 -10.     0.12   0.28   0.27   0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.26   0.82   0.12   0.67   0.27   0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [  0.26   0.82   0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [  0.26 -10.     0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [3 5 0]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [  0.71 -10.     0.12   0.67 -10.     0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.71   0.82   0.15   0.67 -10.     0.47 -10.     0.55] sorted [1 0 3]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.71   0.82   0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "instance 1, ep 9, state [1 1 1 0 0 0 0 1]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [  0.26 -10.     0.12   0.67   0.27   0.47 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [0 0 1 1 1 1 0 0] state_WI [  0.71   0.82   0.12   0.28 -10.     0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [  0.71 -10.     0.12   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.71   0.82   0.12   0.67   0.27   0.47 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [1 1 0 1 0 0 1 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.71   0.82   0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.71   0.82   0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [1 1 1 1 1 0 0 1] state_WI [  0.26 -10.     0.12   0.28 -10.     0.47 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [1 0 0 1 1 1 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [1 1 0 0 1 1 1 1] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [3 5 0]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "instance 1, ep 10, state [0 1 1 1 0 0 1 1]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.71 -10.     0.12   0.28   0.27   0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 0 0 1 1 0 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [  0.71   0.82   0.12   0.28   0.27   0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [1 0 0 1 1 0 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 0 0 1 1 0 1] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 0 0 1 1 1 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.26   0.82   0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.71   0.82   0.15   0.28   0.27   0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 0 0 1 1 1 1 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.26 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 1 0 0 1 1 0 1] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [3 5 0]\n",
      "instance 1, ep 11, state [0 1 0 0 0 0 1 1]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.71 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.71   0.82   0.15   0.67 -10.     0.47 -10.     0.55] sorted [1 0 3]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.71   0.82   0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 1 1 0 1 0 1] state_WI [  0.26   0.82   0.12   0.28   0.27   0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.71   0.82   0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.26 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [1 1 0 1 1 1 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.26   0.82   0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 1 1 1 0 0 1] state_WI [  0.26   0.82   0.12   0.28 -10.     0.47 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [0 3 7]\n",
      "instance 1, ep 12, state [0 1 1 1 0 0 0 0]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [  0.71 -10.     0.12   0.28   0.27   0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 1 0 0 0 0 0 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.71   0.82   0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.26   0.82   0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.26   0.82   0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 1 0 0 0 1 0 1] state_WI [  0.71 -10.     0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.71   0.82   0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [  0.71   0.82   0.15   0.28   0.27   0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [  0.26 -10.     0.12   0.67 -10.     0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 1 0 1 1 1 0 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "instance 1, ep 13, state [0 1 0 0 0 0 0 0]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.26   0.82   0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [1 0 0 1 1 1 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.71   0.82   0.12   0.28 -10.     0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 1 0 1 0 1 1 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 1 0 1 1 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 1 0 0 0 1 0 1] state_WI [  0.71 -10.     0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.71 -10.     0.12   0.28   0.27   0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 1 0 0 0 0 0 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [1 1 0 0 0 0 0 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [0 1 0 1 1 1 0 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "instance 1, ep 14, state [0 0 0 1 0 0 0 1]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.71   0.82   0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.26   0.82   0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.71   0.82   0.15   0.67 -10.     0.49 -10.     0.55] sorted [1 0 3]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [  0.71   0.82   0.15   0.28   0.27   0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [  0.71   0.82   0.15   0.28   0.27   0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.71   0.82   0.15   0.28   0.27   0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.71   0.82   0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [1 1 0 0 0 0 0 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [3 5 4]\n",
      "instance 1, ep 15, state [0 1 1 0 1 1 0 0]\n",
      "   state [0 1 1 0 1 1 0 0] state_WI [  0.71 -10.     0.12   0.67 -10.     0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 0 1 1 0 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.26   0.82   0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 0 0 1 1 0 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.71 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.26   0.82   0.12   0.67 -10.     0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 1 0 0 1 0 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [0 1 0 0 1 1 1 1] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.71   0.82   0.15   0.67 -10.     0.49 -10.     0.55] sorted [1 0 3]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.71   0.82   0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [1 1 0 0 1 0 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 0 0 1 1 1 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "instance 1, ep 16, state [1 0 1 0 1 0 1 1]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [  0.26   0.82   0.12   0.67 -10.     0.47 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [  0.26 -10.     0.12   0.67   0.27   0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.26   0.82   0.12   0.67 -10.     0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 1 1 0 1 1 0] state_WI [  0.26 -10.     0.12   0.28   0.27   0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.26   0.82   0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.26 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.71   0.82   0.15   0.28   0.27   0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.71   0.82   0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.47 -10.     0.55] sorted [1 3 7]\n",
      "instance 1, ep 17, state [0 0 0 0 0 1 1 1]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.71   0.82   0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 1 0 0 1 1 0 1] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [3 5 0]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.71   0.82   0.15   0.67 -10.     0.47 -10.     0.55] sorted [1 0 3]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [0 0 0 1 1 1 0 1] state_WI [  0.71   0.82   0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 0 0 1 1 0 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [1 1 0 1 1 1 0 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [0 3 7]\n",
      "instance 1, ep 18, state [1 1 1 1 0 0 0 0]\n",
      "   state [1 1 1 1 0 0 0 0] state_WI [  0.26 -10.     0.12   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 0 0 0 1 1 1 1] state_WI [  0.26   0.82   0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 0 0 1 1 1 0 1] state_WI [  0.71   0.82   0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.26   0.82   0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [  0.71   0.82   0.15   0.28   0.27   0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.26   0.82   0.12   0.67 -10.     0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [1 0 0 1 1 0 1 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.26   0.82   0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 1 0 1 1 1 0 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [7 5 3]\n",
      "instance 1, ep 19, state [0 0 1 1 0 0 0 0]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [  0.71   0.82   0.12   0.28   0.27   0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 0 0 0 0 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [1 1 0 1 1 1 0 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.71   0.82   0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.71   0.82   0.15   0.67 -10.     0.47 -10.     0.55] sorted [1 0 3]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 1 0 0 0 1 1 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [1 0 0 1 1 1 1 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 1 0 0 1 1 0 1] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.26   0.82   0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 1 0 0 1 0 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [  0.71 -10.     0.12   0.67 -10.     0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.71 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "instance 1, ep 20, state [0 1 0 1 1 0 1 1]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 0 0 0 0 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 0 1 0 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.71   0.82   0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.71   0.82   0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.26   0.82   0.12   0.67 -10.     0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 1 0 0 1 0 0 1] state_WI [  0.26 -10.     0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [3 5 0]\n",
      "instance 1, ep 21, state [0 0 1 1 1 1 1 1]\n",
      "   state [0 0 1 1 1 1 1 1] state_WI [  0.71   0.82   0.12   0.28 -10.     0.49 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.71 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.71   0.82   0.15   0.67 -10.     0.47 -10.     0.55] sorted [1 0 3]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 0 0 0 0 1 0 1] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [0 1 0 1 1 1 0 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 1 0 1 1 1 0 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.26   0.82   0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [0 7 5]\n",
      "instance 1, ep 22, state [1 1 1 0 1 1 0 1]\n",
      "   state [1 1 1 0 1 1 0 1] state_WI [  0.26 -10.     0.12   0.67 -10.     0.49 -10.   -10.  ] sorted [3 5 0]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.71   0.82   0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.26   0.82   0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 0 1 1 0 1 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 0 1 0 0 1] state_WI [  0.26 -10.     0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [3 5 0]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.71   0.82   0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.71   0.82   0.15   0.28   0.27   0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [  0.71 -10.     0.12   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 1 1 1 1 0 0 1] state_WI [  0.26 -10.     0.12   0.28 -10.     0.47 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [1 1 0 1 1 1 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [1 0 0 1 1 1 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 0 1 1 1 1 0 0] state_WI [  0.71   0.82   0.12   0.28 -10.     0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 1 1 1 0 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [7 5 3]\n",
      "instance 1, ep 23, state [0 1 1 1 0 1 1 0]\n",
      "   state [0 1 1 1 0 1 1 0] state_WI [  0.71 -10.     0.12   0.28   0.27   0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.71   0.82   0.15   0.67   0.27   0.49 -10.     0.55] sorted [1 0 3]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 0 0 1 1 1 1 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 1 0 0 1 1 0 1] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.71   0.82   0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [  0.71   0.82   0.15   0.67   0.27   0.47 -10.     0.55] sorted [1 0 3]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [  0.26 -10.     0.12   0.28 -10.     0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.71   0.82   0.12   0.28 -10.     0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.47 -10.     0.55] sorted [1 7 5]\n",
      "instance 1, ep 24, state [0 1 0 0 1 0 1 0]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.71   0.82   0.15   0.67 -10.     0.49 -10.     0.55] sorted [1 0 3]\n",
      "   state [1 1 1 1 0 1 0 0] state_WI [  0.26 -10.     0.12   0.28   0.27   0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.71   0.82   0.15   0.67 -10.     0.49 -10.     0.55] sorted [1 0 3]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [  0.26   0.82   0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [1 1 0 0 1 1 0 1] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [3 5 0]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 0 1 1 0 0 0 1] state_WI [  0.26   0.82   0.12   0.28   0.27   0.47 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.71   0.82   0.12   0.28   0.27   0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 0 1 1 1 1 1 1] state_WI [  0.26   0.82   0.12   0.28 -10.     0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [3 5 4]\n",
      "instance 1, ep 25, state [1 0 1 0 1 0 1 1]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [  0.26   0.82   0.12   0.67 -10.     0.47 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.71   0.82   0.15   0.28   0.27   0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.71   0.82   0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [  0.71   0.82   0.15   0.28   0.27   0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.71   0.82   0.15   0.67 -10.     0.49 -10.     0.55] sorted [1 0 3]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.47 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 0 1 1 1 1 0 0] state_WI [  0.26   0.82   0.12   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.71   0.82   0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.     0.55] sorted [1 3 7]\n",
      "instance 1, ep 26, state [1 1 0 1 0 0 0 1]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [5 3 4]\n",
      "   state [1 0 0 1 1 0 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [1 1 0 1 0 1 1 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.71 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.71   0.82   0.15   0.28   0.27   0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.71 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 1 0 1 1 1 0 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.26   0.82   0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.   -10.  ] sorted [5 3 0]\n",
      "instance 1, ep 27, state [1 0 1 0 0 0 0 0]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.26   0.82   0.12   0.67   0.27   0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [  0.71 -10.     0.12   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 1 0 0 1 1 0 1] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [3 5 0]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 0 0 1 1 1 0 1] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [1 5 3]\n",
      "   state [0 1 0 1 1 1 0 1] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.   -10.  ] sorted [0 5 3]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.71 -10.     0.15   0.28   0.27   0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 0 7]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.71   0.82   0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.71   0.82   0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.71   0.82   0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [  0.26   0.82   0.15   0.28   0.27   0.47 -10.     0.55] sorted [1 7 5]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26 -10.     0.15   0.28   0.27   0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 1 0 1 1 1 0 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [5 3 0]\n",
      "instance 1, ep 28, state [1 1 0 0 0 1 0 1]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [1 0 0 0 1 1 1 1] state_WI [  0.26   0.82   0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.49 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 1 0 0 1 1 0 1] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.   -10.  ] sorted [0 3 5]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.26 -10.     0.15   0.67   0.27   0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 1 0 1 1 1 1 1] state_WI [  0.26 -10.     0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [5 3 0]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.71   0.82   0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [  0.26   0.82   0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.26   0.82   0.15   0.28 -10.     0.49 -10.     0.55] sorted [1 7 5]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.71   0.82   0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [1 1 1 1 1 0 1 0] state_WI [  0.26 -10.     0.12   0.28 -10.     0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 0 0 1 1 1 1 1] state_WI [  0.71   0.82   0.15   0.28 -10.     0.49 -10.   -10.  ] sorted [1 0 5]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 1 1 0 1 1 0 1] state_WI [  0.26 -10.     0.12   0.67 -10.     0.49 -10.   -10.  ] sorted [3 5 0]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.49 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.71 -10.     0.15   0.28   0.27   0.47 -10.   -10.  ] sorted [0 5 3]\n",
      "instance 1, ep 29, state [1 1 1 0 1 1 1 0]\n",
      "   state [1 1 1 0 1 1 1 0] state_WI [  0.26 -10.     0.12   0.67 -10.     0.49 -10.     0.55] sorted [3 7 5]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.26   0.82   0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.71 -10.     0.15   0.67 -10.     0.49 -10.     0.55] sorted [0 3 7]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.26   0.82   0.15   0.67   0.27   0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [  0.26   0.82   0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [1 3 5]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [  0.26 -10.     0.15   0.67 -10.     0.47 -10.   -10.  ] sorted [3 5 0]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.71   0.82   0.15   0.67   0.27   0.49 -10.   -10.  ] sorted [1 0 3]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.     0.55] sorted [3 7 5]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.71   0.82   0.15   0.67   0.27   0.49 -10.     0.55] sorted [1 0 3]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [1 1 1 0 0 1 1 1] state_WI [  0.26 -10.     0.12   0.67   0.27   0.49 -10.   -10.  ] sorted [3 5 4]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.71   0.82   0.15   0.67 -10.     0.49 -10.     0.55] sorted [1 0 3]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [  0.26   0.82   0.15   0.67 -10.     0.47 -10.     0.55] sorted [1 3 7]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.71 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [0 7 5]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.71   0.82   0.12   0.67 -10.     0.47 -10.     0.55] sorted [1 0 3]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26 -10.     0.15   0.28 -10.     0.47 -10.     0.55] sorted [7 5 3]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.71   0.82   0.15   0.28 -10.     0.47 -10.     0.55] sorted [1 0 7]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [  0.26 -10.     0.15   0.67   0.27   0.47 -10.   -10.  ] sorted [3 5 4]\n",
      "first state [1 1 0 1 0 0 1 1]\n",
      "   state [1 1 0 1 0 0 1 1] state_WI [  0.28   0.19   0.2    0.18   0.89   0.42   0.42 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.34 0.42 0.39] sorted [1 6 7]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [  0.28   0.19   0.09   0.91   0.31   0.42   0.42 -10.  ] sorted [3 6 5]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 6]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [0.83 0.73 0.09 0.91 0.31 0.34 0.42 0.39] sorted [3 0 1]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.67 0.39] sorted [4 6 5]\n",
      "   state [0 0 1 1 1 1 0 0] state_WI [0.83 0.73 0.09 0.18 0.31 0.34 0.67 0.39] sorted [0 1 6]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 1 6]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [0.83 0.73 0.2  0.91 0.31 0.34 0.42 0.39] sorted [3 0 1]\n",
      "   state [1 1 1 1 1 0 0 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.42 0.67 0.39] sorted [6 5 7]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [  0.28   0.19   0.09   0.91   0.31   0.42   0.42 -10.  ] sorted [3 6 5]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [0.83 0.19 0.09 0.91 0.31 0.34 0.42 0.39] sorted [3 0 6]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [0.83 0.73 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 0 1]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [0.83 0.19 0.09 0.91 0.31 0.42 0.67 0.39] sorted [3 0 6]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [0.83 0.19 0.2  0.91 0.89 0.42 0.42 0.39] sorted [3 4 0]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [0.83 0.73 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 0 1]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [0.28 0.73 0.2  0.91 0.89 0.42 0.42 0.39] sorted [3 4 1]\n",
      "instance 2, ep 1, state [0 1 0 0 0 0 0 1]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.83   0.19   0.2    0.91   0.89   0.42   0.67 -10.  ] sorted [3 4 0]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.67 0.39] sorted [0 6 5]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.83   0.73   0.09   0.91   0.89   0.42   0.42 -10.  ] sorted [3 4 0]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.83   0.73   0.2    0.18   0.89   0.34   0.67 -10.  ] sorted [4 0 1]\n",
      "   state [0 1 0 0 1 1 0 1] state_WI [  0.83   0.19   0.2    0.91   0.31   0.34   0.67 -10.  ] sorted [3 0 6]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [0 1 1 0 0 1 1 1] state_WI [  0.83   0.19   0.09   0.91   0.89   0.34   0.42 -10.  ] sorted [3 4 0]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.34 0.42 0.39] sorted [1 6 7]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [  0.28   0.73   0.2    0.91   0.89   0.42   0.42 -10.  ] sorted [3 4 1]\n",
      "   state [1 1 1 1 1 0 1 1] state_WI [  0.28   0.19   0.09   0.18   0.31   0.42   0.42 -10.  ] sorted [6 5 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.83   0.19   0.2    0.91   0.31   0.42   0.67 -10.  ] sorted [3 0 6]\n",
      "   state [1 1 1 1 1 0 1 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [1 1 1 1 0 1 1 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 6 7]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [0.28 0.73 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 1 6]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.83   0.73   0.2    0.91   0.89   0.42   0.42 -10.  ] sorted [3 4 0]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "instance 2, ep 2, state [1 0 1 1 0 1 1 0]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 1 6]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 0 6]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 6]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.67 0.39] sorted [6 5 7]\n",
      "   state [0 0 1 1 1 1 0 1] state_WI [  0.83   0.73   0.09   0.18   0.31   0.34   0.67 -10.  ] sorted [0 1 6]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [0.28 0.73 0.09 0.91 0.31 0.42 0.67 0.39] sorted [3 1 6]\n",
      "   state [1 0 0 1 1 1 1 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.34 0.42 0.39] sorted [1 6 7]\n",
      "   state [1 1 1 0 0 1 0 1] state_WI [  0.28   0.19   0.09   0.91   0.89   0.34   0.67 -10.  ] sorted [3 4 6]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.42 0.67 0.39] sorted [1 6 5]\n",
      "   state [1 0 0 1 1 1 1 1] state_WI [  0.28   0.73   0.2    0.18   0.31   0.34   0.42 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.83   0.19   0.2    0.18   0.31   0.34   0.42 -10.  ] sorted [0 6 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [0.28 0.19 0.2  0.91 0.31 0.34 0.42 0.39] sorted [3 6 7]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.83   0.73   0.2    0.91   0.31   0.34   0.42 -10.  ] sorted [3 0 1]\n",
      "   state [1 1 1 1 1 0 1 1] state_WI [  0.28   0.19   0.09   0.18   0.31   0.42   0.42 -10.  ] sorted [6 5 4]\n",
      "   state [1 1 1 1 0 1 1 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 6 7]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [0.28 0.73 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [1 0 0 1 0 1 1 0] state_WI [0.28 0.73 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 1 6]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.42 0.67 0.39] sorted [1 6 5]\n",
      "instance 2, ep 3, state [0 1 1 0 1 1 1 1]\n",
      "   state [0 1 1 0 1 1 1 1] state_WI [  0.83   0.19   0.09   0.91   0.31   0.34   0.42 -10.  ] sorted [3 0 6]\n",
      "   state [1 1 0 1 0 0 1 1] state_WI [  0.28   0.19   0.2    0.18   0.89   0.42   0.42 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.83   0.73   0.2    0.18   0.89   0.42   0.42 -10.  ] sorted [4 0 1]\n",
      "   state [1 0 0 1 1 0 1 1] state_WI [  0.28   0.73   0.2    0.18   0.31   0.42   0.42 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [0.83 0.73 0.2  0.91 0.89 0.42 0.42 0.39] sorted [3 4 0]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 1 6]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [0.83 0.73 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 0 1]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 1 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 6]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [0.28 0.73 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 1 6]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 0 6]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.83   0.73   0.2    0.18   0.31   0.42   0.67 -10.  ] sorted [0 1 6]\n",
      "   state [1 1 1 1 1 0 0 1] state_WI [  0.28   0.19   0.09   0.18   0.31   0.42   0.67 -10.  ] sorted [6 5 4]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "instance 2, ep 4, state [1 0 0 1 1 0 1 1]\n",
      "   state [1 0 0 1 1 0 1 1] state_WI [  0.28   0.73   0.2    0.18   0.31   0.42   0.42 -10.  ] sorted [1 6 5]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [  0.83   0.73   0.09   0.18   0.31   0.42   0.42 -10.  ] sorted [0 1 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [0.83 0.19 0.09 0.18 0.89 0.42 0.67 0.39] sorted [4 0 6]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [1 1 1 1 0 1 0 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.34 0.67 0.39] sorted [4 6 7]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.83   0.19   0.09   0.18   0.31   0.42   0.42 -10.  ] sorted [0 6 5]\n",
      "   state [1 1 0 1 0 0 1 1] state_WI [  0.28   0.19   0.2    0.18   0.89   0.42   0.42 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [0.28 0.73 0.2  0.18 0.89 0.34 0.67 0.39] sorted [4 1 6]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.34 0.67 0.39] sorted [3 1 6]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [0.28 0.73 0.09 0.91 0.89 0.34 0.67 0.39] sorted [3 4 1]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [0.83 0.73 0.09 0.18 0.31 0.42 0.67 0.39] sorted [0 1 6]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.67 0.39] sorted [0 6 5]\n",
      "   state [0 0 1 1 1 0 1 0] state_WI [0.83 0.73 0.09 0.18 0.31 0.42 0.42 0.39] sorted [0 1 6]\n",
      "   state [1 1 0 1 0 1 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 6 7]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [  0.28   0.19   0.09   0.91   0.89   0.42   0.42 -10.  ] sorted [3 4 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "instance 2, ep 5, state [0 1 1 1 1 0 1 0]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 0 6]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [0.83 0.73 0.2  0.18 0.89 0.42 0.67 0.39] sorted [4 0 1]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.42 0.67 0.39] sorted [1 6 5]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.34 0.42 0.39] sorted [3 0 6]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.83   0.73   0.2    0.18   0.31   0.42   0.42 -10.  ] sorted [0 1 6]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 0 6]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [0.83 0.73 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 0 1]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [0.83 0.73 0.09 0.18 0.31 0.34 0.42 0.39] sorted [0 1 6]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [0.83 0.19 0.2  0.18 0.89 0.34 0.67 0.39] sorted [4 0 6]\n",
      "   state [1 1 1 1 1 0 1 1] state_WI [  0.28   0.19   0.09   0.18   0.31   0.42   0.42 -10.  ] sorted [6 5 4]\n",
      "   state [1 1 1 0 1 1 1 0] state_WI [0.28 0.19 0.09 0.91 0.31 0.34 0.42 0.39] sorted [3 6 7]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.83   0.73   0.2    0.18   0.89   0.42   0.42 -10.  ] sorted [4 0 1]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 1 6]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.83   0.19   0.2    0.18   0.89   0.42   0.42 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.42 0.67 0.39] sorted [0 1 6]\n",
      "instance 2, ep 6, state [0 1 0 0 1 0 0 1]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.83   0.19   0.2    0.91   0.31   0.42   0.67 -10.  ] sorted [3 0 6]\n",
      "   state [1 0 1 1 0 0 0 1] state_WI [  0.28   0.73   0.09   0.18   0.89   0.42   0.67 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 1 6]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 0 6]\n",
      "   state [1 1 1 1 1 0 1 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [0.83 0.19 0.09 0.91 0.89 0.42 0.42 0.39] sorted [3 4 0]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [0.28 0.19 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 6 5]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [0.28 0.73 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 1 6]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [0.83 0.73 0.2  0.91 0.89 0.42 0.42 0.39] sorted [3 4 0]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.42 0.67 0.39] sorted [1 6 5]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [0.28 0.73 0.09 0.91 0.31 0.34 0.42 0.39] sorted [3 1 6]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [0.83 0.19 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 0 6]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.34 0.42 0.39] sorted [3 1 6]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [0.83 0.19 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 0 6]\n",
      "   state [1 1 1 0 0 1 1 0] state_WI [0.28 0.19 0.09 0.91 0.89 0.34 0.42 0.39] sorted [3 4 6]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 1 6]\n",
      "   state [1 1 0 1 0 1 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 6 7]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [0.28 0.73 0.09 0.91 0.31 0.34 0.42 0.39] sorted [3 1 6]\n",
      "instance 2, ep 7, state [1 0 1 0 1 1 1 1]\n",
      "   state [1 0 1 0 1 1 1 1] state_WI [  0.28   0.73   0.09   0.91   0.31   0.34   0.42 -10.  ] sorted [3 1 6]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [0.28 0.19 0.2  0.91 0.89 0.42 0.42 0.39] sorted [3 4 6]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [0.83 0.73 0.09 0.18 0.31 0.42 0.67 0.39] sorted [0 1 6]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.83   0.73   0.2    0.18   0.31   0.42   0.67 -10.  ] sorted [0 1 6]\n",
      "   state [1 1 1 1 1 0 1 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [1 1 0 1 1 1 1 1] state_WI [  0.28   0.19   0.2    0.18   0.31   0.34   0.42 -10.  ] sorted [6 5 4]\n",
      "   state [0 1 1 0 0 1 1 1] state_WI [  0.83   0.19   0.09   0.91   0.89   0.34   0.42 -10.  ] sorted [3 4 0]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [0.83 0.73 0.2  0.91 0.31 0.34 0.67 0.39] sorted [3 0 1]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.42 0.67 0.39] sorted [4 1 6]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 0 0 1 1 1 1 1] state_WI [  0.28   0.73   0.2    0.18   0.31   0.34   0.42 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [0.28 0.73 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [  0.28   0.73   0.2    0.18   0.89   0.42   0.42 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [0.83 0.73 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 0 1]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [  0.28   0.73   0.09   0.91   0.89   0.42   0.42 -10.  ] sorted [3 4 1]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.83   0.19   0.2    0.18   0.31   0.42   0.42 -10.  ] sorted [0 6 5]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 0 6]\n",
      "instance 2, ep 8, state [1 1 0 0 1 0 1 0]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [0.28 0.19 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 6 5]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.34 0.42 0.39] sorted [1 6 7]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [0.28 0.73 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 1 6]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [0.83 0.19 0.09 0.91 0.89 0.42 0.42 0.39] sorted [3 4 0]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [0.83 0.73 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 0 1]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [0.83 0.19 0.09 0.18 0.89 0.42 0.67 0.39] sorted [4 0 6]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.67 0.39] sorted [4 6 5]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.34 0.67 0.39] sorted [1 6 7]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.83   0.19   0.2    0.18   0.31   0.42   0.42 -10.  ] sorted [0 6 5]\n",
      "   state [1 1 0 1 1 1 1 1] state_WI [  0.28   0.19   0.2    0.18   0.31   0.34   0.42 -10.  ] sorted [6 5 4]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.83   0.73   0.09   0.18   0.89   0.34   0.42 -10.  ] sorted [4 0 1]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [0.28 0.73 0.2  0.18 0.89 0.42 0.67 0.39] sorted [4 1 6]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.67 0.39] sorted [0 6 5]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.42 0.67 0.39] sorted [1 6 5]\n",
      "   state [1 1 1 0 0 1 0 1] state_WI [  0.28   0.19   0.09   0.91   0.89   0.34   0.67 -10.  ] sorted [3 4 6]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.28   0.19   0.2    0.18   0.31   0.42   0.67 -10.  ] sorted [6 5 4]\n",
      "instance 2, ep 9, state [1 0 0 1 1 1 0 0]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.34 0.67 0.39] sorted [1 6 7]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [0.83 0.19 0.2  0.18 0.89 0.42 0.67 0.39] sorted [4 0 6]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [  0.28   0.19   0.2    0.91   0.31   0.42   0.42 -10.  ] sorted [3 6 5]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [0.28 0.73 0.2  0.18 0.89 0.42 0.67 0.39] sorted [4 1 6]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [0.28 0.19 0.2  0.91 0.31 0.34 0.42 0.39] sorted [3 6 7]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.34 0.67 0.39] sorted [3 0 6]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 1 6]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 1 6]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 1 6]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 0 6]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [0.83 0.19 0.09 0.91 0.31 0.34 0.42 0.39] sorted [3 0 6]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.83   0.19   0.2    0.18   0.89   0.34   0.42 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 1 0 1 1 1 1] state_WI [  0.28   0.73   0.09   0.91   0.31   0.34   0.42 -10.  ] sorted [3 1 6]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 1 6]\n",
      "instance 2, ep 10, state [1 0 1 1 1 1 1 1]\n",
      "   state [1 0 1 1 1 1 1 1] state_WI [  0.28   0.73   0.09   0.18   0.31   0.34   0.42 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [  0.28   0.19   0.2    0.91   0.31   0.42   0.42 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 1 1 1 0 1 0] state_WI [0.83 0.73 0.09 0.18 0.31 0.42 0.42 0.39] sorted [0 1 6]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [0.28 0.73 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.34 0.42 0.39] sorted [3 1 6]\n",
      "   state [1 1 1 1 1 0 1 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "   state [0 0 1 1 1 1 1 1] state_WI [  0.83   0.73   0.09   0.18   0.31   0.34   0.42 -10.  ] sorted [0 1 6]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 1 6]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 6]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 1 6]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [0.83 0.73 0.09 0.18 0.31 0.42 0.67 0.39] sorted [0 1 6]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [0.28 0.19 0.09 0.91 0.31 0.42 0.67 0.39] sorted [3 6 5]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [0.83 0.73 0.2  0.18 0.89 0.42 0.67 0.39] sorted [4 0 1]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [0.28 0.19 0.2  0.91 0.89 0.42 0.67 0.39] sorted [3 4 6]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.67 0.39] sorted [6 5 7]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [0.83 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 1]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.42 0.67 0.39] sorted [1 6 5]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "instance 2, ep 11, state [0 0 0 0 1 1 0 0]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [0.83 0.73 0.2  0.91 0.31 0.34 0.67 0.39] sorted [3 0 1]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.83   0.19   0.2    0.18   0.31   0.42   0.67 -10.  ] sorted [0 6 5]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.67 0.39] sorted [6 5 7]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [0.83 0.73 0.09 0.91 0.89 0.34 0.67 0.39] sorted [3 4 0]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [0.83 0.73 0.09 0.18 0.89 0.42 0.67 0.39] sorted [4 0 1]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.42 0.67 0.39] sorted [3 1 6]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [1 1 1 0 1 1 1 0] state_WI [0.28 0.19 0.09 0.91 0.31 0.34 0.42 0.39] sorted [3 6 7]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.34 0.67 0.39] sorted [3 1 6]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [0.28 0.73 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [0.28 0.19 0.2  0.91 0.89 0.42 0.42 0.39] sorted [3 4 6]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [0.28 0.19 0.2  0.91 0.89 0.34 0.42 0.39] sorted [3 4 6]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.34 0.42 0.39] sorted [3 1 6]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [0.83 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 1]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [0.83 0.73 0.09 0.91 0.31 0.42 0.67 0.39] sorted [3 0 1]\n",
      "instance 2, ep 12, state [0 1 1 0 1 1 0 1]\n",
      "   state [0 1 1 0 1 1 0 1] state_WI [  0.83   0.19   0.09   0.91   0.31   0.34   0.67 -10.  ] sorted [3 0 6]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.83   0.73   0.2    0.91   0.89   0.34   0.67 -10.  ] sorted [3 4 0]\n",
      "   state [1 0 1 1 1 0 0 1] state_WI [  0.28   0.73   0.09   0.18   0.31   0.42   0.67 -10.  ] sorted [1 6 5]\n",
      "   state [1 0 1 1 1 1 1 1] state_WI [  0.28   0.73   0.09   0.18   0.31   0.34   0.42 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [1 1 0 1 0 1 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 6 7]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.83   0.73   0.09   0.18   0.89   0.42   0.67 -10.  ] sorted [4 0 1]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.28   0.73   0.2    0.91   0.31   0.34   0.67 -10.  ] sorted [3 1 6]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 1 6]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [0.28 0.73 0.09 0.91 0.89 0.34 0.42 0.39] sorted [3 4 1]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [0.83 0.73 0.2  0.91 0.31 0.34 0.67 0.39] sorted [3 0 1]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [0.83 0.73 0.2  0.18 0.89 0.34 0.67 0.39] sorted [4 0 1]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [0.28 0.19 0.2  0.91 0.31 0.34 0.67 0.39] sorted [3 6 7]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.83   0.73   0.2    0.18   0.31   0.42   0.42 -10.  ] sorted [0 1 6]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [0.83 0.73 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 0 1]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [0.83 0.73 0.09 0.18 0.31 0.34 0.42 0.39] sorted [0 1 6]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [0.28 0.19 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 6 5]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [0.83 0.73 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 0 1]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [0.83 0.73 0.09 0.18 0.31 0.42 0.67 0.39] sorted [0 1 6]\n",
      "instance 2, ep 13, state [1 0 0 0 0 1 1 0]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [0.28 0.73 0.2  0.91 0.89 0.34 0.42 0.39] sorted [3 4 1]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 1 6]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [0.83 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 1]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [  0.83   0.73   0.09   0.18   0.31   0.42   0.42 -10.  ] sorted [0 1 6]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [0.28 0.19 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 6 5]\n",
      "   state [1 0 1 1 1 1 0 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.34 0.67 0.39] sorted [1 6 7]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.83   0.73   0.09   0.18   0.31   0.42   0.67 -10.  ] sorted [0 1 6]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [  0.28   0.19   0.09   0.91   0.31   0.42   0.42 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [0.83 0.73 0.09 0.91 0.89 0.34 0.42 0.39] sorted [3 4 0]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.34 0.42 0.39] sorted [1 6 7]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [  0.28   0.19   0.2    0.91   0.89   0.42   0.42 -10.  ] sorted [3 4 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 1 1 0 0 1 1 0] state_WI [0.28 0.19 0.09 0.91 0.89 0.34 0.42 0.39] sorted [3 4 6]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.42 0.67 0.39] sorted [3 0 6]\n",
      "   state [1 1 1 0 1 1 1 0] state_WI [0.28 0.19 0.09 0.91 0.31 0.34 0.42 0.39] sorted [3 6 7]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [0.28 0.19 0.2  0.91 0.89 0.34 0.42 0.39] sorted [3 4 6]\n",
      "instance 2, ep 14, state [0 0 0 1 0 0 0 1]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.83   0.73   0.2    0.18   0.89   0.42   0.67 -10.  ] sorted [4 0 1]\n",
      "   state [1 1 0 0 1 1 0 1] state_WI [  0.28   0.19   0.2    0.91   0.31   0.34   0.67 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 1 0 1 1 0 1] state_WI [  0.83   0.73   0.09   0.91   0.31   0.34   0.67 -10.  ] sorted [3 0 1]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [0.28 0.19 0.2  0.91 0.31 0.34 0.67 0.39] sorted [3 6 7]\n",
      "   state [1 1 1 1 0 1 1 1] state_WI [  0.28   0.19   0.09   0.18   0.89   0.34   0.42 -10.  ] sorted [4 6 5]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [0.28 0.19 0.2  0.91 0.89 0.42 0.42 0.39] sorted [3 4 6]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [0.83 0.73 0.2  0.91 0.89 0.42 0.42 0.39] sorted [3 4 0]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.34 0.67 0.39] sorted [1 6 7]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 0 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [0.28 0.19 0.2  0.91 0.31 0.34 0.42 0.39] sorted [3 6 7]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 6]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [0.28 0.19 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 6 5]\n",
      "   state [0 1 1 1 0 1 1 0] state_WI [0.83 0.19 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 0 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [0.28 0.73 0.09 0.91 0.89 0.34 0.67 0.39] sorted [3 4 1]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [0.83 0.19 0.09 0.91 0.31 0.42 0.67 0.39] sorted [3 0 6]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [0.28 0.19 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 6 5]\n",
      "instance 2, ep 15, state [0 1 0 1 1 0 0 1]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.83   0.19   0.2    0.18   0.31   0.42   0.67 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [0.83 0.73 0.2  0.91 0.89 0.42 0.67 0.39] sorted [3 4 0]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.42 0.67 0.39] sorted [1 6 5]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.42 0.67 0.39] sorted [0 1 6]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [0.83 0.19 0.09 0.18 0.89 0.42 0.67 0.39] sorted [4 0 6]\n",
      "   state [0 0 0 1 0 1 1 1] state_WI [  0.83   0.73   0.2    0.18   0.89   0.34   0.42 -10.  ] sorted [4 0 1]\n",
      "   state [1 0 0 1 1 1 1 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.34 0.42 0.39] sorted [1 6 7]\n",
      "   state [0 0 0 1 1 1 1 1] state_WI [  0.83   0.73   0.2    0.18   0.31   0.34   0.42 -10.  ] sorted [0 1 6]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [  0.28   0.19   0.2    0.18   0.31   0.42   0.42 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.83   0.73   0.2    0.18   0.31   0.42   0.42 -10.  ] sorted [0 1 6]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [0.28 0.19 0.2  0.91 0.89 0.42 0.67 0.39] sorted [3 4 6]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [0.83 0.73 0.09 0.91 0.31 0.34 0.67 0.39] sorted [3 0 1]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [0.28 0.19 0.2  0.91 0.89 0.34 0.67 0.39] sorted [3 4 6]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [0.83 0.73 0.09 0.18 0.31 0.42 0.67 0.39] sorted [0 1 6]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [0.83 0.73 0.2  0.91 0.89 0.42 0.42 0.39] sorted [3 4 0]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 1 6]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [  0.28   0.19   0.09   0.91   0.31   0.42   0.42 -10.  ] sorted [3 6 5]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 1 6]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [0.83 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 1]\n",
      "instance 2, ep 16, state [1 0 0 1 1 0 1 0]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [0.28 0.19 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 6 5]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [0.28 0.73 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [0.83 0.19 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 0 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 0 1 1 0 1 0 1] state_WI [  0.28   0.73   0.09   0.18   0.89   0.34   0.67 -10.  ] sorted [4 1 6]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.42 0.67 0.39] sorted [1 6 5]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.67 0.39] sorted [0 6 5]\n",
      "   state [1 1 1 1 1 1 0 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.34 0.67 0.39] sorted [6 7 5]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 1 6]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [0.83 0.73 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 0 1]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [0.83 0.73 0.09 0.18 0.31 0.42 0.67 0.39] sorted [0 1 6]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.67 0.39] sorted [4 6 5]\n",
      "   state [1 0 0 1 1 1 1 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.34 0.42 0.39] sorted [1 6 7]\n",
      "   state [1 1 1 1 0 1 1 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 6 7]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.83   0.19   0.2    0.18   0.31   0.34   0.42 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 0 1 1 1 1 1] state_WI [  0.28   0.73   0.2    0.18   0.31   0.34   0.42 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [0.83 0.19 0.09 0.91 0.31 0.34 0.42 0.39] sorted [3 0 6]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [0.28 0.19 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 6 5]\n",
      "instance 2, ep 17, state [1 0 0 0 1 0 0 0]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.42 0.67 0.39] sorted [3 1 6]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.67 0.39] sorted [0 6 5]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [  0.28   0.19   0.09   0.91   0.31   0.42   0.42 -10.  ] sorted [3 6 5]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [  0.28   0.73   0.09   0.91   0.89   0.34   0.42 -10.  ] sorted [3 4 1]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.34 0.67 0.39] sorted [0 1 6]\n",
      "   state [1 1 1 1 0 1 1 1] state_WI [  0.28   0.19   0.09   0.18   0.89   0.34   0.42 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.83   0.73   0.2    0.91   0.89   0.34   0.42 -10.  ] sorted [3 4 0]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [0.28 0.73 0.09 0.91 0.31 0.42 0.67 0.39] sorted [3 1 6]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 1 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [0.83 0.19 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 0 6]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 1 6]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 6]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.42 0.67 0.39] sorted [3 0 6]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [0.83 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 1]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.42 0.67 0.39] sorted [3 0 6]\n",
      "   state [1 1 0 1 1 1 0 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.34 0.67 0.39] sorted [6 7 5]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "instance 2, ep 18, state [1 1 0 1 1 1 0 0]\n",
      "   state [1 1 0 1 1 1 0 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.34 0.67 0.39] sorted [6 7 5]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 1 6]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.34 0.67 0.39] sorted [4 6 7]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.83   0.73   0.2    0.91   0.31   0.34   0.42 -10.  ] sorted [3 0 1]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [  0.28   0.73   0.09   0.91   0.89   0.42   0.42 -10.  ] sorted [3 4 1]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [  0.28   0.19   0.2    0.91   0.31   0.42   0.42 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.83   0.73   0.09   0.91   0.89   0.42   0.42 -10.  ] sorted [3 4 0]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.83   0.73   0.2    0.18   0.89   0.42   0.42 -10.  ] sorted [4 0 1]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [  0.28   0.19   0.2    0.91   0.31   0.42   0.42 -10.  ] sorted [3 6 5]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 1 6]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [0.28 0.19 0.2  0.91 0.31 0.34 0.42 0.39] sorted [3 6 7]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.83   0.73   0.2    0.91   0.89   0.34   0.42 -10.  ] sorted [3 4 0]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [0.83 0.73 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 0 1]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [0.83 0.19 0.09 0.91 0.31 0.34 0.42 0.39] sorted [3 0 6]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "instance 2, ep 19, state [0 0 0 1 0 0 1 0]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [0.83 0.73 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 0 1]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [0.83 0.73 0.09 0.18 0.31 0.34 0.42 0.39] sorted [0 1 6]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [0.28 0.19 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 6 5]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [0.83 0.73 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 0 1]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.42 0.67 0.39] sorted [1 6 5]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [0.28 0.19 0.09 0.91 0.31 0.42 0.67 0.39] sorted [3 6 5]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [0.83 0.73 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 0 1]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.67 0.39] sorted [4 6 5]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [0.28 0.73 0.09 0.91 0.89 0.34 0.42 0.39] sorted [3 4 1]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.67 0.39] sorted [0 6 5]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [  0.28   0.19   0.2    0.18   0.31   0.42   0.42 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 1 1 1 1 1] state_WI [  0.28   0.73   0.2    0.18   0.31   0.34   0.42 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [  0.28   0.19   0.09   0.91   0.31   0.42   0.42 -10.  ] sorted [3 6 5]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [1 0 1 1 1 1 1 1] state_WI [  0.28   0.73   0.09   0.18   0.31   0.34   0.42 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [0.28 0.19 0.2  0.91 0.89 0.42 0.42 0.39] sorted [3 4 6]\n",
      "   state [0 0 1 1 1 1 0 1] state_WI [  0.83   0.73   0.09   0.18   0.31   0.34   0.67 -10.  ] sorted [0 1 6]\n",
      "   state [1 0 1 1 0 1 0 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.34 0.67 0.39] sorted [4 1 6]\n",
      "instance 2, ep 20, state [1 1 0 1 1 1 0 0]\n",
      "   state [1 1 0 1 1 1 0 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.34 0.67 0.39] sorted [6 7 5]\n",
      "   state [1 1 1 1 1 1 0 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.34 0.67 0.39] sorted [6 7 5]\n",
      "   state [1 0 0 1 1 0 1 1] state_WI [  0.28   0.73   0.2    0.18   0.31   0.42   0.42 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 1 1 0 1 1 1] state_WI [  0.28   0.19   0.09   0.18   0.89   0.34   0.42 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.28   0.73   0.2    0.91   0.89   0.42   0.67 -10.  ] sorted [3 4 1]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [0.83 0.73 0.09 0.18 0.89 0.42 0.67 0.39] sorted [4 0 1]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 0 6]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [0.28 0.19 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 6 5]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [0.83 0.73 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 0 1]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.42 0.67 0.39] sorted [0 1 6]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [0.28 0.19 0.09 0.91 0.31 0.42 0.67 0.39] sorted [3 6 5]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.42 0.67 0.39] sorted [3 1 6]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [0.83 0.73 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 0 1]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.83   0.19   0.2    0.18   0.89   0.34   0.42 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [1 0 0 1 0 1 1 0] state_WI [0.28 0.73 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 1 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 0 0 1 1 0 1 1] state_WI [  0.28   0.73   0.2    0.18   0.31   0.42   0.42 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 1 1 1 1 1 1] state_WI [  0.28   0.19   0.09   0.18   0.31   0.34   0.42 -10.  ] sorted [6 5 4]\n",
      "instance 2, ep 21, state [1 0 0 0 1 0 1 1]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [  0.28   0.73   0.2    0.91   0.31   0.42   0.42 -10.  ] sorted [3 1 6]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [0.28 0.73 0.09 0.91 0.89 0.42 0.42 0.39] sorted [3 4 1]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.42 0.67 0.39] sorted [3 1 6]\n",
      "   state [1 1 1 1 1 0 0 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.42 0.67 0.39] sorted [6 5 7]\n",
      "   state [1 1 0 0 1 1 1 1] state_WI [  0.28   0.19   0.2    0.91   0.31   0.34   0.42 -10.  ] sorted [3 6 5]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 1 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.67 0.39] sorted [4 6 5]\n",
      "   state [1 0 1 1 1 1 0 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.34 0.67 0.39] sorted [1 6 7]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.83   0.73   0.2    0.18   0.89   0.42   0.67 -10.  ] sorted [4 0 1]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.67 0.39] sorted [6 5 7]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.83   0.19   0.09   0.91   0.89   0.34   0.67 -10.  ] sorted [3 4 0]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.28   0.73   0.2    0.91   0.89   0.42   0.67 -10.  ] sorted [3 4 1]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.67 0.39] sorted [0 6 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [0.83 0.19 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 0 6]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "instance 2, ep 22, state [1 1 1 1 0 1 0 0]\n",
      "   state [1 1 1 1 0 1 0 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.34 0.67 0.39] sorted [4 6 7]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [0.28 0.73 0.2  0.91 0.89 0.42 0.67 0.39] sorted [3 4 1]\n",
      "   state [1 1 1 1 1 0 0 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.42 0.67 0.39] sorted [6 5 7]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [0.83 0.19 0.09 0.91 0.31 0.42 0.67 0.39] sorted [3 0 6]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [0.28 0.19 0.09 0.91 0.31 0.42 0.67 0.39] sorted [3 6 5]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [0.83 0.73 0.2  0.18 0.89 0.42 0.67 0.39] sorted [4 0 1]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.67 0.39] sorted [0 6 5]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.34 0.42 0.39] sorted [3 1 6]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [0.83 0.73 0.2  0.91 0.89 0.42 0.67 0.39] sorted [3 4 0]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.67 0.39] sorted [0 6 5]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [0.83 0.19 0.09 0.91 0.89 0.42 0.67 0.39] sorted [3 4 0]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [0.83 0.73 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 0 1]\n",
      "   state [1 1 1 1 1 1 0 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.34 0.67 0.39] sorted [6 7 5]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [1 1 1 1 0 0 1 1] state_WI [  0.28   0.19   0.09   0.18   0.89   0.42   0.42 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [0.83 0.73 0.09 0.18 0.31 0.34 0.42 0.39] sorted [0 1 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 0 0 1 0 1 1 0] state_WI [0.28 0.73 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 1 6]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "   state [1 1 1 1 1 0 1 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "instance 2, ep 23, state [1 1 0 1 1 1 1 1]\n",
      "   state [1 1 0 1 1 1 1 1] state_WI [  0.28   0.19   0.2    0.18   0.31   0.34   0.42 -10.  ] sorted [6 5 4]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [1 0 0 1 0 1 1 0] state_WI [0.28 0.73 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 1 6]\n",
      "   state [1 1 1 1 1 0 1 1] state_WI [  0.28   0.19   0.09   0.18   0.31   0.42   0.42 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.83   0.73   0.2    0.91   0.31   0.34   0.42 -10.  ] sorted [3 0 1]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [0.83 0.73 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 0 1]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [  0.28   0.19   0.2    0.18   0.31   0.42   0.42 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [0.83 0.73 0.2  0.18 0.89 0.42 0.67 0.39] sorted [4 0 1]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.42 0.67 0.39] sorted [3 0 6]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [0.28 0.19 0.2  0.91 0.89 0.42 0.42 0.39] sorted [3 4 6]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [0 0 1 1 1 1 0 0] state_WI [0.83 0.73 0.09 0.18 0.31 0.34 0.67 0.39] sorted [0 1 6]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.42 0.67 0.39] sorted [3 1 6]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 1 6]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [0.83 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 1]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [0.28 0.73 0.09 0.91 0.31 0.34 0.67 0.39] sorted [3 1 6]\n",
      "   state [1 1 1 1 0 1 1 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 6 7]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [0.83 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 1]\n",
      "instance 2, ep 24, state [1 1 1 1 1 0 0 0]\n",
      "   state [1 1 1 1 1 0 0 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.42 0.67 0.39] sorted [6 5 7]\n",
      "   state [1 1 1 1 1 1 1 1] state_WI [  0.28   0.19   0.09   0.18   0.31   0.34   0.42 -10.  ] sorted [6 5 4]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.83   0.19   0.2    0.91   0.89   0.34   0.42 -10.  ] sorted [3 4 0]\n",
      "   state [1 1 1 1 1 1 1 1] state_WI [  0.28   0.19   0.09   0.18   0.31   0.34   0.42 -10.  ] sorted [6 5 4]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [0.83 0.19 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 0 6]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [1 1 1 1 0 1 1 1] state_WI [  0.28   0.19   0.09   0.18   0.89   0.34   0.42 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.83   0.19   0.09   0.18   0.89   0.34   0.42 -10.  ] sorted [4 0 6]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [0.83 0.19 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 0 6]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [0.83 0.19 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 0 6]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [0.83 0.73 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 0 1]\n",
      "   state [1 1 1 1 1 0 0 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.42 0.67 0.39] sorted [6 5 7]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.83   0.73   0.2    0.91   0.31   0.42   0.42 -10.  ] sorted [3 0 1]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.83   0.73   0.09   0.91   0.89   0.42   0.42 -10.  ] sorted [3 4 0]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.42 0.67 0.39] sorted [1 6 5]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "instance 2, ep 25, state [0 1 1 1 0 1 1 1]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.83   0.19   0.09   0.18   0.89   0.34   0.42 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 1 6]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 1 6]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.34 0.42 0.39] sorted [3 0 6]\n",
      "   state [1 1 0 0 1 1 1 1] state_WI [  0.28   0.19   0.2    0.91   0.31   0.34   0.42 -10.  ] sorted [3 6 5]\n",
      "   state [1 1 0 1 1 1 0 1] state_WI [  0.28   0.19   0.2    0.18   0.31   0.34   0.67 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 1 1 1 0 0] state_WI [0.83 0.73 0.09 0.18 0.31 0.34 0.67 0.39] sorted [0 1 6]\n",
      "   state [1 1 1 1 1 0 0 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.42 0.67 0.39] sorted [6 5 7]\n",
      "   state [0 1 1 1 0 1 1 0] state_WI [0.83 0.19 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 0 6]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [0.28 0.73 0.2  0.91 0.89 0.42 0.42 0.39] sorted [3 4 1]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [0.83 0.73 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 0 1]\n",
      "   state [1 1 1 1 1 0 0 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.42 0.67 0.39] sorted [6 5 7]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.83   0.73   0.2    0.91   0.89   0.34   0.42 -10.  ] sorted [3 4 0]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [0.83 0.19 0.09 0.91 0.31 0.42 0.67 0.39] sorted [3 0 6]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.83   0.73   0.2    0.18   0.31   0.42   0.67 -10.  ] sorted [0 1 6]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [  0.28   0.73   0.09   0.91   0.31   0.42   0.42 -10.  ] sorted [3 1 6]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.83   0.73   0.09   0.18   0.31   0.42   0.67 -10.  ] sorted [0 1 6]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [0.83 0.73 0.2  0.91 0.89 0.42 0.67 0.39] sorted [3 4 0]\n",
      "instance 2, ep 26, state [1 1 0 1 0 0 1 0]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.34 0.42 0.39] sorted [1 6 7]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [0.83 0.73 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 0 1]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [0.28 0.73 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 1 6]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.42 0.39] sorted [6 5 7]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 1 6]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [0.83 0.19 0.09 0.91 0.31 0.34 0.42 0.39] sorted [3 0 6]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.34 0.42 0.39] sorted [1 6 7]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [0.83 0.19 0.2  0.91 0.89 0.42 0.42 0.39] sorted [3 4 0]\n",
      "   state [1 1 1 1 0 0 0 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.42 0.67 0.39] sorted [4 6 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [  0.28   0.73   0.09   0.91   0.89   0.34   0.42 -10.  ] sorted [3 4 1]\n",
      "   state [0 1 0 1 1 1 0 1] state_WI [  0.83   0.19   0.2    0.18   0.31   0.34   0.67 -10.  ] sorted [0 6 5]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.34 0.67 0.39] sorted [4 6 7]\n",
      "instance 2, ep 27, state [1 0 1 0 1 1 0 1]\n",
      "   state [1 0 1 0 1 1 0 1] state_WI [  0.28   0.73   0.09   0.91   0.31   0.34   0.67 -10.  ] sorted [3 1 6]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.42 0.67 0.39] sorted [3 1 6]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [0.83 0.19 0.09 0.18 0.89 0.42 0.67 0.39] sorted [4 0 6]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [0.28 0.73 0.2  0.91 0.89 0.42 0.42 0.39] sorted [3 4 1]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [0.28 0.19 0.2  0.18 0.31 0.42 0.67 0.39] sorted [6 5 7]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 6]\n",
      "   state [1 1 1 0 0 1 1 0] state_WI [0.28 0.19 0.09 0.91 0.89 0.34 0.42 0.39] sorted [3 4 6]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.34 0.42 0.39] sorted [3 0 6]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [0.28 0.73 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 1 6]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.28   0.73   0.2    0.91   0.89   0.34   0.42 -10.  ] sorted [3 4 1]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.34 0.42 0.39] sorted [6 7 5]\n",
      "   state [1 1 1 0 1 1 1 1] state_WI [  0.28   0.19   0.09   0.91   0.31   0.34   0.42 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [0.83 0.73 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 0 1]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [0.83 0.73 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 1]\n",
      "   state [1 1 0 0 1 0 0 0] state_WI [0.28 0.19 0.2  0.91 0.31 0.42 0.67 0.39] sorted [3 6 5]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [0.28 0.73 0.2  0.18 0.89 0.34 0.67 0.39] sorted [4 1 6]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [0.28 0.73 0.2  0.91 0.89 0.42 0.42 0.39] sorted [3 4 1]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.67 0.39] sorted [0 6 5]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [0.28 0.19 0.2  0.91 0.31 0.34 0.42 0.39] sorted [3 6 7]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [  0.28   0.19   0.09   0.91   0.89   0.42   0.42 -10.  ] sorted [3 4 6]\n",
      "instance 2, ep 28, state [1 0 0 0 1 1 1 0]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [0.28 0.73 0.2  0.91 0.31 0.34 0.42 0.39] sorted [3 1 6]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.89 0.42 0.42 0.39] sorted [4 0 6]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.34 0.42 0.39] sorted [1 6 7]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [  0.28   0.73   0.09   0.91   0.89   0.42   0.42 -10.  ] sorted [3 4 1]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [  0.28   0.19   0.09   0.91   0.31   0.42   0.42 -10.  ] sorted [3 6 5]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [0.28 0.73 0.09 0.91 0.89 0.34 0.42 0.39] sorted [3 4 1]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.42 0.67 0.39] sorted [0 6 5]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 1 1 1 0 1 1 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 6 7]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [0.83 0.19 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 0 6]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [0.83 0.73 0.09 0.91 0.31 0.34 0.42 0.39] sorted [3 0 1]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [0.28 0.19 0.2  0.91 0.89 0.34 0.67 0.39] sorted [3 4 6]\n",
      "   state [1 1 1 1 0 1 0 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.34 0.67 0.39] sorted [4 6 7]\n",
      "   state [1 0 1 1 0 1 1 1] state_WI [  0.28   0.73   0.09   0.18   0.89   0.34   0.42 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [0.28 0.19 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 6 5]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [0.83 0.73 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 0 1]\n",
      "   state [0 1 1 1 1 1 1 1] state_WI [  0.83   0.19   0.09   0.18   0.31   0.34   0.42 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [0.28 0.73 0.09 0.91 0.89 0.42 0.42 0.39] sorted [3 4 1]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "instance 2, ep 29, state [0 1 0 0 1 1 1 1]\n",
      "   state [0 1 0 0 1 1 1 1] state_WI [  0.83   0.19   0.2    0.91   0.31   0.34   0.42 -10.  ] sorted [3 0 6]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.83   0.19   0.2    0.18   0.31   0.42   0.42 -10.  ] sorted [0 6 5]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [0.28 0.19 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 6 5]\n",
      "   state [1 0 0 1 1 1 1 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.34 0.42 0.39] sorted [1 6 7]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [  0.28   0.19   0.2    0.18   0.31   0.42   0.42 -10.  ] sorted [6 5 4]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.42 0.39] sorted [0 6 5]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.42 0.42 0.39] sorted [4 6 5]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [0.28 0.73 0.09 0.91 0.31 0.34 0.42 0.39] sorted [3 1 6]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [0.83 0.73 0.2  0.18 0.31 0.42 0.42 0.39] sorted [0 1 6]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [0.83 0.19 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 0 6]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [0.28 0.73 0.09 0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [0.83 0.19 0.2  0.91 0.31 0.42 0.42 0.39] sorted [3 0 6]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [0.28 0.73 0.09 0.91 0.31 0.42 0.42 0.39] sorted [3 1 6]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [0.28 0.73 0.2  0.18 0.31 0.42 0.42 0.39] sorted [1 6 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [0.83 0.19 0.2  0.91 0.89 0.34 0.42 0.39] sorted [3 4 0]\n",
      "   state [1 1 1 1 1 0 0 0] state_WI [0.28 0.19 0.09 0.18 0.31 0.42 0.67 0.39] sorted [6 5 7]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [0.83 0.19 0.09 0.18 0.31 0.42 0.67 0.39] sorted [0 6 5]\n",
      "   state [1 1 0 1 0 1 1 0] state_WI [0.28 0.19 0.2  0.18 0.89 0.34 0.42 0.39] sorted [4 6 7]\n",
      "   state [1 1 1 1 0 1 1 0] state_WI [0.28 0.19 0.09 0.18 0.89 0.34 0.42 0.39] sorted [4 6 7]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [0.83 0.19 0.2  0.18 0.31 0.34 0.42 0.39] sorted [0 6 7]\n",
      "first state [1 1 1 1 1 1 1 0]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [  0.39   0.28 -10.     0.39 -10.   -10.   -10.     0.84] sorted [7 3 0]\n",
      "   state [1 0 0 1 1 1 1 0] state_WI [  0.39   0.67   0.55   0.39 -10.   -10.   -10.     0.84] sorted [7 1 2]\n",
      "   state [1 0 1 1 0 1 1 1] state_WI [  0.39   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [1 1 1 1 0 1 0 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.38   0.28 -10.     0.39 -10.   -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.38   0.67   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 2 3]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 2 3]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.39   0.67   0.55   0.61 -10.   -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [1 0 0 1 1 0 1 1] state_WI [  0.39   0.67   0.55   0.39 -10.   -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "instance 3, ep 1, state [1 0 1 1 1 0 0 0]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [  0.39   0.67 -10.     0.39 -10.   -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 4]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [  0.39   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [  0.39   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [1 1 0 1 0 0 1 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [1 1 0 1 0 0 1 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 1 1 1 0 0 1] state_WI [  0.38   0.28 -10.     0.39 -10.   -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "instance 3, ep 2, state [1 0 0 0 1 1 0 0]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.39   0.67   0.55   0.61 -10.   -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [  0.39   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 0]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [  0.39   0.28 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 3 7]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [  0.39   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [  0.38   0.28 -10.     0.39 -10.   -10.   -10.     0.84] sorted [7 3 0]\n",
      "   state [1 0 1 1 0 0 0 1] state_WI [  0.39   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [  0.39   0.28 -10.     0.61 -10.   -10.   -10.     0.44] sorted [3 7 0]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.38   0.28 -10.     0.61 -10.   -10.   -10.     0.44] sorted [3 7 0]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [  0.39   0.28 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 3 7]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 1 2]\n",
      "instance 3, ep 3, state [1 1 1 0 1 0 1 1]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [  0.39   0.28 -10.     0.61 -10.   -10.   -10.     0.44] sorted [3 7 0]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [  0.39   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 0]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.39   0.28   0.55   0.39 -10.   -10.     0.7    0.84] sorted [7 6 2]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [1 1 1 1 0 0 1 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 2]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [1 1 0 0 0 0 0 1] state_WI [  0.39   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 2 3]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.84] sorted [7 3 2]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "instance 3, ep 4, state [0 0 1 1 1 1 1 1]\n",
      "   state [0 0 1 1 1 1 1 1] state_WI [  0.38   0.67 -10.     0.39 -10.   -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [1 0 0 1 0 1 1 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 2]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.38   0.67   0.55   0.39 -10.   -10.   -10.     0.84] sorted [7 1 2]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [  0.39   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [1 1 0 1 0 0 1 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 3 0]\n",
      "   state [1 0 1 1 0 1 1 1] state_WI [  0.39   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "instance 3, ep 5, state [0 1 0 0 1 0 0 0]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.38   0.28   0.55   0.61 -10.   -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 2]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 3 4]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 2 3]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 4]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.39   0.28   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.38   0.67   0.55   0.39 -10.   -10.   -10.     0.84] sorted [7 1 2]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.38   0.67 -10.     0.61 -10.   -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 4]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [1 1 0 1 0 0 1 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [1 1 1 1 0 0 1 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "instance 3, ep 6, state [1 0 0 0 0 0 0 1]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 4]\n",
      "   state [1 1 1 1 0 0 1 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 3 0]\n",
      "   state [1 1 1 1 0 0 0 0] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 2 3]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [  0.39   0.67 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 1 1 1 1 0 0 1] state_WI [  0.38   0.28 -10.     0.39 -10.   -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 2 7]\n",
      "instance 3, ep 7, state [0 0 0 0 1 1 0 0]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.38   0.67   0.55   0.61 -10.   -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.38   0.67   0.55   0.61 -10.   -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.38   0.28   0.55   0.61 -10.   -10.   -10.     0.84] sorted [7 3 2]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [  0.39   0.28   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [  0.39   0.28   0.55   0.61 -10.   -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [  0.39   0.28   0.55   0.61 -10.   -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [1 1 1 1 0 0 1 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [  0.38   0.28 -10.     0.39 -10.   -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [  0.39   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.39   0.28   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [  0.39   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [  0.39   0.28 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 3 7]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.38   0.28   0.55   0.61 -10.   -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 2 3]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "instance 3, ep 8, state [0 1 1 1 0 1 0 0]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.38   0.67   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.38   0.28 -10.     0.39 -10.   -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.38   0.28 -10.     0.39 -10.   -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.38   0.67 -10.     0.61 -10.   -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "instance 3, ep 9, state [0 0 1 1 0 1 1 1]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 4]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 2 3]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 4]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.38   0.67   0.55   0.61 -10.   -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [  0.39   0.67 -10.     0.39 -10.   -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "instance 3, ep 10, state [1 1 1 1 0 0 1 0]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 3 0]\n",
      "   state [1 1 1 1 0 0 1 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [1 1 0 1 0 1 1 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.38   0.67 -10.     0.61 -10.   -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [  0.39   0.67 -10.     0.61   0.39 -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.38   0.28   0.55   0.61 -10.   -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.38   0.28 -10.     0.39 -10.   -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.38   0.67   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 1 2]\n",
      "instance 3, ep 11, state [1 0 0 0 0 1 1 1]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.39   0.28   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 2]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 2]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [1 0 0 1 1 1 1 0] state_WI [  0.39   0.67   0.55   0.39 -10.   -10.   -10.     0.84] sorted [7 1 2]\n",
      "   state [1 1 1 1 1 0 0 1] state_WI [  0.39   0.28 -10.     0.39 -10.   -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.38   0.28   0.55   0.61 -10.   -10.   -10.     0.84] sorted [7 3 2]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 3 4]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.38   0.28 -10.     0.61 -10.   -10.   -10.     0.44] sorted [3 7 0]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "instance 3, ep 12, state [1 0 1 1 1 0 1 0]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [  0.39   0.67 -10.     0.39 -10.   -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [  0.39   0.67 -10.     0.61   0.39 -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.38   0.28   0.55   0.61 -10.   -10.   -10.     0.84] sorted [7 3 2]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.39   0.67 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.39   0.67 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [1 1 1 1 0 1 1 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 0]\n",
      "instance 3, ep 13, state [1 1 0 1 1 0 1 1]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [  0.39   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 4]\n",
      "   state [1 1 1 0 1 0 0 1] state_WI [  0.39   0.28 -10.     0.61 -10.   -10.     0.7    0.44] sorted [6 3 7]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.38   0.28   0.55   0.61 -10.   -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 2]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 2 3]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 3 7]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "instance 3, ep 14, state [0 0 0 0 0 1 0 0]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 0 0 1 1 1 1 1] state_WI [  0.38   0.67   0.55   0.39 -10.   -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 1 1 1 1 1 1 1] state_WI [  0.38   0.28 -10.     0.39 -10.   -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [1 1 0 0 0 0 0 1] state_WI [  0.39   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 1 0 0 0 1 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [0 1 1 1 1 0 0 1] state_WI [  0.38   0.28 -10.     0.39 -10.   -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.38   0.28   0.55   0.61 -10.   -10.     0.7    0.44] sorted [6 3 2]\n",
      "instance 3, ep 15, state [1 1 0 0 0 1 0 1]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.39   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 2]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [1 1 0 1 0 0 1 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 1 2]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 4]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 1 1 0 1 1 0] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 3 4]\n",
      "   state [1 0 0 1 1 0 0 1] state_WI [  0.39   0.67   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 3 7]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [1 1 0 1 0 1 1 0] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 2 3]\n",
      "instance 3, ep 16, state [1 0 1 1 0 1 1 1]\n",
      "   state [1 0 1 1 0 1 1 1] state_WI [  0.39   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [1 1 1 1 0 1 1 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.38   0.67   0.55   0.61 -10.   -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 2 3]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [1 1 0 0 0 0 0 1] state_WI [  0.39   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.38   0.67   0.55   0.61 -10.   -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [1 1 0 0 0 0 0 1] state_WI [  0.39   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 3 0]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 1 2]\n",
      "instance 3, ep 17, state [1 1 1 1 1 1 1 0]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [  0.39   0.28 -10.     0.39 -10.   -10.   -10.     0.84] sorted [7 3 0]\n",
      "   state [1 1 0 1 0 0 1 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [1 0 1 1 0 0 0 1] state_WI [  0.39   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 3 7]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 2 3]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [  0.39   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "instance 3, ep 18, state [0 0 0 0 1 0 1 0]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.38   0.67   0.55   0.61 -10.   -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 3 4]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 4]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [1 1 0 0 0 0 0 1] state_WI [  0.39   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [1 1 1 1 0 0 0 0] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 1 1 1 1 1 1 1] state_WI [  0.38   0.28 -10.     0.39 -10.   -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.38   0.67   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "instance 3, ep 19, state [1 1 0 1 0 1 0 1]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [1 1 1 1 1 0 1 1] state_WI [  0.39   0.28 -10.     0.39 -10.   -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 1 2]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.84] sorted [7 3 2]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [  0.39   0.67 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [  0.39   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 0]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 2]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 2 3]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "instance 3, ep 20, state [0 1 1 0 0 0 0 1]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 3 7]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.38   0.28   0.55   0.61 -10.   -10.   -10.     0.84] sorted [7 3 2]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [  0.38   0.67 -10.     0.39 -10.   -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 4]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 3 7]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 2]\n",
      "instance 3, ep 21, state [0 0 0 1 0 0 0 0]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.84] sorted [7 3 2]\n",
      "   state [0 1 1 0 0 1 1 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 4]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [1 0 0 1 1 1 0 1] state_WI [  0.39   0.67   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.84] sorted [7 3 4]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.38   0.67   0.55   0.39 -10.   -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.84] sorted [7 3 4]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.38   0.28 -10.     0.39 -10.   -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 1 2]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.38   0.28 -10.     0.39 -10.   -10.   -10.     0.44] sorted [7 3 0]\n",
      "instance 3, ep 22, state [1 0 0 1 1 0 1 1]\n",
      "   state [1 0 0 1 1 0 1 1] state_WI [  0.39   0.67   0.55   0.39 -10.   -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.38   0.67 -10.     0.39 -10.   -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 1 1 1 1 1 0 1] state_WI [  0.38   0.28 -10.     0.39 -10.   -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [  0.39   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.38   0.28 -10.     0.61 -10.   -10.   -10.     0.44] sorted [3 7 0]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [1 1 1 1 0 0 1 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [1 1 1 1 0 0 1 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.84] sorted [7 3 4]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.38   0.67   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.38   0.28   0.55   0.61 -10.   -10.   -10.     0.84] sorted [7 3 2]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.38   0.67   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "instance 3, ep 23, state [0 1 1 0 0 0 1 1]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 4]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.38   0.28   0.55   0.61 -10.   -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [  0.39   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 0]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 2]\n",
      "   state [1 1 1 1 0 0 1 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [  0.39   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 0]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [  0.39   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [  0.39   0.28 -10.     0.61   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.84] sorted [7 3 4]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.38   0.67 -10.     0.39 -10.   -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.39   0.28   0.55   0.39 -10.   -10.     0.7    0.84] sorted [7 6 2]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [  0.38   0.28 -10.     0.61 -10.   -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.38   0.28 -10.     0.61 -10.   -10.   -10.     0.44] sorted [3 7 0]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.38   0.67   0.55   0.61 -10.   -10.   -10.     0.44] sorted [1 3 2]\n",
      "instance 3, ep 24, state [1 0 1 1 0 0 1 0]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [  0.39   0.67 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 3 4]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [  0.39   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 0]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 4]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 2]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.44] sorted [3 7 4]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [1 1 1 1 1 0 0 0] state_WI [  0.39   0.28 -10.     0.39 -10.   -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 2]\n",
      "instance 3, ep 25, state [1 0 0 0 0 1 0 1]\n",
      "   state [1 0 0 0 0 1 0 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 1 2]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.   -10.     0.84] sorted [7 3 4]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [  0.38   0.67 -10.     0.39 -10.   -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 3 7]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [1 1 1 1 0 1 1 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.38   0.67 -10.     0.61 -10.   -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "instance 3, ep 26, state [1 1 0 1 1 0 0 1]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.39   0.28   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 3 4]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.38   0.28   0.55   0.61 -10.   -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 1 1 1 1 0 0 1] state_WI [  0.38   0.28 -10.     0.39 -10.   -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.38   0.67 -10.     0.39 -10.   -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [  0.39   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.38   0.28 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 3 7]\n",
      "   state [1 1 0 1 0 0 1 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "instance 3, ep 27, state [1 0 1 1 1 1 1 0]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [  0.39   0.67 -10.     0.39 -10.   -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [1 1 1 1 1 1 1 1] state_WI [  0.39   0.28 -10.     0.39 -10.   -10.   -10.     0.44] sorted [7 3 0]\n",
      "   state [1 1 0 1 0 0 1 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 2 3]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [1 1 1 0 0 0 1 0] state_WI [  0.39   0.28 -10.     0.61   0.39 -10.   -10.     0.84] sorted [7 3 0]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.39   0.67 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "instance 3, ep 28, state [0 0 1 1 0 1 1 1]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 0 0 1 0 1 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 3 4]\n",
      "   state [1 0 1 1 1 0 1 1] state_WI [  0.39   0.67 -10.     0.39 -10.   -10.   -10.     0.44] sorted [1 7 3]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 3 4]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.38   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [1 1 0 1 0 0 1 1] state_WI [  0.39   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.38   0.28   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 2 7]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.38   0.67 -10.     0.61   0.39 -10.   -10.     0.44] sorted [1 3 7]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [  0.39   0.28 -10.     0.61   0.39 -10.     0.7    0.44] sorted [6 3 7]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.38   0.67   0.55   0.39   0.39 -10.   -10.     0.44] sorted [1 2 7]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [  0.39   0.28   0.55   0.61 -10.   -10.   -10.     0.44] sorted [3 2 7]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.   -10.     0.44] sorted [7 3 4]\n",
      "instance 3, ep 29, state [0 1 0 0 0 0 0 1]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 2]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.44] sorted [2 7 3]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.38   0.67   0.55   0.61   0.39 -10.   -10.     0.84] sorted [7 1 3]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.84] sorted [7 6 3]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.   -10.     0.84] sorted [7 2 3]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [  0.39   0.28 -10.     0.39   0.39 -10.   -10.     0.84] sorted [7 3 0]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.39   0.67   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 1]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 1 3]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [  0.39   0.67   0.55   0.61   0.39 -10.   -10.     0.44] sorted [1 3 2]\n",
      "   state [1 0 0 1 1 0 0 1] state_WI [  0.39   0.67   0.55   0.39 -10.   -10.     0.7    0.44] sorted [6 1 2]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [  0.38   0.28 -10.     0.61 -10.   -10.   -10.     0.84] sorted [7 3 0]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.38   0.28   0.55   0.61   0.39 -10.     0.7    0.44] sorted [6 3 2]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.38   0.28 -10.     0.61 -10.   -10.   -10.     0.44] sorted [3 7 0]\n",
      "   state [1 0 1 1 0 0 0 1] state_WI [  0.39   0.67 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 1 7]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.38   0.28   0.55   0.39   0.39 -10.     0.7    0.84] sorted [7 6 2]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.38   0.28 -10.     0.39   0.39 -10.     0.7    0.44] sorted [6 7 3]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.38   0.67   0.55   0.39 -10.   -10.   -10.     0.44] sorted [1 2 7]\n",
      "first state [1 1 1 0 1 1 1 0]\n",
      "   state [1 1 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 1 1 1 1 1] state_WI [  0.51  -0.     0.27   0.05   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "instance 4, ep 1, state [0 0 0 1 0 1 0 0]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.51  -0.     0.77   0.05   0.61   0.42   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.41   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [  0.22  -0.     0.27   0.05   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [  0.22  -0.     0.77   0.05   0.32   0.41   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [  0.22  -0.     0.27   0.05   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "instance 4, ep 2, state [1 1 0 1 1 0 1 1]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [  0.22  -0.     0.77   0.05   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [  0.22  -0.     0.27   0.05   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [  0.51  -0.     0.77   0.05   0.61   0.42   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [  0.51  -0.     0.77   0.05   0.61   0.41   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [  0.51  -0.     0.27   0.05   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "instance 4, ep 3, state [1 0 1 0 0 0 0 1]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 1 1 1] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [  0.51  -0.     0.77   0.05   0.61   0.41   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [  0.22  -0.     0.77   0.05   0.61   0.41   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [1 0 1 0 1 1 1 1] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "instance 4, ep 4, state [1 1 0 0 0 1 0 1]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 1 0 0 1 0 1] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 1 0 1 1 0 1] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 1 0 1] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.41   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [  0.22  -0.     0.27   0.05   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "instance 4, ep 5, state [1 0 1 0 1 1 0 0]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.41   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.51  -0.     0.77   0.05   0.32   0.42   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.51  -0.     0.27   0.05   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [  0.22  -0.     0.27   0.05   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "instance 4, ep 6, state [1 1 0 1 1 1 0 1]\n",
      "   state [1 1 0 1 1 1 0 1] state_WI [  0.22  -0.     0.77   0.05   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 1 1 1 0 0] state_WI [  0.51  -0.     0.27   0.05   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "instance 4, ep 7, state [1 0 0 1 0 1 0 0]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.22  -0.     0.77   0.05   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 1 0 1 1 1 1] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "instance 4, ep 8, state [1 0 1 0 1 0 0 1]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [  0.22  -0.     0.27   0.05   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [  0.22  -0.     0.77   0.05   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 6]\n",
      "instance 4, ep 9, state [0 1 0 1 0 1 0 0]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.51  -0.     0.77   0.05   0.61   0.42   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [  0.51  -0.     0.27   0.05   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.22  -0.     0.77   0.05   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [  0.22  -0.     0.27   0.05   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "instance 4, ep 10, state [0 0 1 0 1 0 0 1]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.41   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 1 1 1] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "instance 4, ep 11, state [1 0 0 0 1 1 0 1]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.22  -0.     0.77   0.05   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "instance 4, ep 12, state [1 1 1 0 0 0 0 1]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.51  -0.     0.77   0.05   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "instance 4, ep 13, state [1 0 0 0 1 0 1 0]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "instance 4, ep 14, state [0 1 1 0 1 1 1 0]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "instance 4, ep 15, state [1 0 1 0 0 0 1 0]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [  0.22  -0.     0.27   0.05   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 1 0 1 0 0] state_WI [  0.22  -0.     0.27   0.05   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 1 0 0 1 0 1] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.51  -0.     0.77   0.05   0.61   0.42   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 6]\n",
      "instance 4, ep 16, state [1 1 0 1 0 1 0 1]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [  0.22  -0.     0.77   0.05   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [  0.22  -0.     0.27   0.05   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [  0.22  -0.     0.27   0.05   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 1 0 1 0 0] state_WI [  0.22  -0.     0.27   0.05   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "instance 4, ep 17, state [1 1 1 0 1 1 1 0]\n",
      "   state [1 1 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.22  -0.     0.77   0.05   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [  0.51  -0.     0.27   0.05   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "instance 4, ep 18, state [1 1 1 0 1 0 1 0]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.41   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.51  -0.     0.77   0.05   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.51  -0.     0.77   0.05   0.61   0.42   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.41   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "instance 4, ep 19, state [1 1 0 1 0 1 1 1]\n",
      "   state [1 1 0 1 0 1 1 1] state_WI [  0.22  -0.     0.77   0.05   0.61   0.42   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [  0.22  -0.     0.27   0.05   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 1 0 1 0 0] state_WI [  0.22  -0.     0.27   0.05   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [  0.22  -0.     0.27   0.05   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 0 1 0 1 1 0] state_WI [  0.22  -0.     0.77   0.05   0.61   0.42   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "instance 4, ep 20, state [1 1 0 0 1 1 1 1]\n",
      "   state [1 1 0 0 1 1 1 1] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "instance 4, ep 21, state [0 1 0 1 0 0 0 0]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.51  -0.     0.77   0.05   0.61   0.41   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.51  -0.     0.77   0.05   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.51  -0.     0.77   0.05   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "instance 4, ep 22, state [1 0 0 0 0 0 0 1]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.22  -0.     0.77   0.14   0.61   0.41   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.51  -0.     0.77   0.05   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [  0.51  -0.     0.27   0.05   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 1 0 1] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "instance 4, ep 23, state [1 1 0 0 1 1 0 0]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 1 1 1 1] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 0 1 1 1] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [  0.51  -0.     0.27   0.05   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [0 0 1 0 1 1 1 1] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "instance 4, ep 24, state [0 0 0 1 1 1 1 1]\n",
      "   state [0 0 0 1 1 1 1 1] state_WI [  0.51  -0.     0.77   0.05   0.32   0.42   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.51  -0.     0.77   0.05   0.61   0.42   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "instance 4, ep 25, state [1 1 0 0 0 1 1 0]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [1 0 1 1 1 1 0 0] state_WI [  0.22  -0.     0.27   0.05   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [  0.51  -0.     0.27   0.05   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [  0.22  -0.     0.27   0.05   0.61   0.42   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.51  -0.     0.27   0.05   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 5]\n",
      "   state [1 0 1 1 1 1 0 0] state_WI [  0.22  -0.     0.27   0.05   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "instance 4, ep 26, state [1 0 1 0 0 0 0 0]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 5 6]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.51  -0.     0.27   0.05   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [  0.51  -0.     0.27   0.05   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 6]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "instance 4, ep 27, state [0 1 1 0 1 1 0 0]\n",
      "   state [0 1 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.51  -0.     0.27   0.05   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 0 1 1 1 1 0] state_WI [  0.22  -0.     0.77   0.05   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.51  -0.     0.27   0.05   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.51  -0.     0.27   0.05   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 0 5]\n",
      "instance 4, ep 28, state [0 0 1 0 1 1 0 1]\n",
      "   state [0 0 1 0 1 1 0 1] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 0 5]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "instance 4, ep 29, state [0 1 0 1 1 0 1 1]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.51  -0.     0.77   0.05   0.32   0.41   0.47 -10.  ] sorted [2 0 6]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [5 6 4]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.42   0.38 -10.  ] sorted [4 5 6]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.42   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.22  -0.     0.77   0.14   0.32   0.41   0.47 -10.  ] sorted [2 6 5]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.38 -10.  ] sorted [2 4 0]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.51  -0.     0.77   0.14   0.32   0.42   0.38 -10.  ] sorted [2 0 5]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.42   0.38 -10.  ] sorted [0 5 6]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.51  -0.     0.27   0.14   0.61   0.42   0.47 -10.  ] sorted [4 0 6]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.51  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [0 6 5]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.42   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.32   0.41   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.51  -0.     0.77   0.14   0.61   0.41   0.47 -10.  ] sorted [2 4 0]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.22  -0.     0.27   0.14   0.61   0.41   0.47 -10.  ] sorted [4 6 5]\n",
      "first state [0 0 1 1 0 1 0 1]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.84   0.32   0.22   0.45   0.47 -10.     0.83   0.28] sorted [0 6 4]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [0.33 0.32 0.51 0.45 0.42 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [0.33 0.32 0.51 0.45 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [0 0 0 1 0 1 1 1] state_WI [  0.84   0.32   0.51   0.45   0.47 -10.     0.28   0.28] sorted [0 2 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [0.84 0.32 0.51 0.44 0.42 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.84   0.34   0.51   0.44   0.47 -10.     0.28   0.28] sorted [0 2 4]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.84   0.32   0.51   0.44   0.42 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.28   0.67] sorted [7 2 3]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [0.84 0.32 0.22 0.45 0.47 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [1 0 1 1 1 1 0 1] state_WI [  0.33   0.32   0.22   0.45   0.42 -10.     0.83   0.28] sorted [6 3 4]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [0.84 0.32 0.22 0.45 0.47 0.91 0.28 0.28] sorted [5 0 4]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [0.33 0.32 0.22 0.45 0.47 0.91 0.28 0.28] sorted [5 4 3]\n",
      "   state [1 0 1 1 1 1 1 1] state_WI [  0.33   0.32   0.22   0.45   0.42 -10.     0.28   0.28] sorted [3 4 0]\n",
      "instance 5, ep 1, state [0 0 1 0 1 1 1 0]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.84   0.32   0.22   0.44   0.42 -10.     0.28   0.67] sorted [0 7 3]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [0.84 0.32 0.22 0.45 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.28   0.67] sorted [7 2 3]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [0.33 0.34 0.51 0.45 0.47 0.91 0.83 0.28] sorted [5 6 2]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [0.84 0.34 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.33   0.34   0.51   0.44   0.42 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.84   0.34   0.51   0.44   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [0.33 0.34 0.22 0.44 0.47 0.91 0.28 0.28] sorted [5 4 3]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [0.84 0.34 0.51 0.44 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [0 1 0 0 1 1 1 1] state_WI [  0.84   0.34   0.51   0.44   0.42 -10.     0.28   0.28] sorted [0 2 3]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [0.33 0.32 0.22 0.45 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 0 0 1 0 1 1 0] state_WI [  0.33   0.32   0.51   0.45   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [0.84 0.32 0.51 0.45 0.42 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [0.33 0.34 0.22 0.44 0.47 0.91 0.83 0.28] sorted [5 6 4]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.84   0.34   0.51   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "instance 5, ep 2, state [0 0 1 1 1 1 1 1]\n",
      "   state [0 0 1 1 1 1 1 1] state_WI [  0.84   0.32   0.22   0.45   0.42 -10.     0.28   0.28] sorted [0 3 4]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [  0.33   0.34   0.22   0.45   0.42 -10.     0.28   0.67] sorted [7 3 4]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [0.84 0.32 0.51 0.45 0.42 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [0.33 0.32 0.22 0.44 0.47 0.91 0.83 0.28] sorted [5 6 4]\n",
      "   state [1 1 1 0 0 1 1 0] state_WI [  0.33   0.34   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [1 0 1 1 0 0 0 1] state_WI [0.33 0.32 0.22 0.45 0.47 0.91 0.83 0.28] sorted [5 6 4]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.84   0.32   0.22   0.45   0.47 -10.     0.28   0.67] sorted [0 7 4]\n",
      "   state [1 1 1 1 1 1 0 0] state_WI [  0.33   0.34   0.22   0.45   0.42 -10.     0.83   0.67] sorted [6 7 3]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [0.84 0.32 0.22 0.45 0.47 0.91 0.28 0.28] sorted [5 0 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.28 0.67] sorted [5 7 3]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.84   0.32   0.51   0.45   0.47 -10.     0.83   0.28] sorted [0 6 2]\n",
      "   state [1 1 1 0 0 1 1 0] state_WI [  0.33   0.34   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [0.84 0.34 0.22 0.45 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 1 1 0 0 1 0 0] state_WI [  0.33   0.34   0.22   0.44   0.47 -10.     0.83   0.67] sorted [6 7 4]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [0.33 0.34 0.22 0.44 0.47 0.91 0.28 0.28] sorted [5 4 3]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [0.33 0.32 0.22 0.44 0.47 0.91 0.28 0.67] sorted [5 7 4]\n",
      "instance 5, ep 3, state [0 1 0 1 1 1 0 0]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.84   0.34   0.51   0.45   0.42 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.28 0.67] sorted [5 7 3]\n",
      "   state [1 0 0 0 1 1 1 1] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.28   0.28] sorted [2 3 4]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.33   0.32   0.22   0.44   0.42 -10.     0.83   0.67] sorted [6 7 3]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.28 0.28] sorted [5 3 4]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.42 -10.     0.28   0.67] sorted [7 3 4]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [0.33 0.32 0.51 0.44 0.42 0.91 0.28 0.28] sorted [5 2 3]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.28] sorted [4 3 0]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.84   0.32   0.51   0.44   0.42 -10.     0.28   0.28] sorted [0 2 3]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.84   0.32   0.22   0.45   0.47 -10.     0.28   0.28] sorted [0 4 3]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [  0.84   0.34   0.22   0.44   0.42 -10.     0.28   0.67] sorted [0 7 3]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [0.33 0.32 0.22 0.45 0.47 0.91 0.28 0.28] sorted [5 4 3]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.28   0.67] sorted [7 2 3]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [0.33 0.32 0.51 0.45 0.47 0.91 0.83 0.28] sorted [5 6 2]\n",
      "instance 5, ep 4, state [0 0 0 1 1 0 0 0]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [0.84 0.32 0.51 0.45 0.42 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [1 0 0 1 0 1 1 0] state_WI [  0.33   0.32   0.51   0.45   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [1 1 1 1 1 1 0 1] state_WI [  0.33   0.34   0.22   0.45   0.42 -10.     0.83   0.28] sorted [6 3 4]\n",
      "   state [1 0 1 1 1 1 1 1] state_WI [  0.33   0.32   0.22   0.45   0.42 -10.     0.28   0.28] sorted [3 4 0]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [0.33 0.32 0.22 0.45 0.42 0.91 0.28 0.67] sorted [5 7 3]\n",
      "   state [1 0 1 1 0 1 1 1] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.28   0.28] sorted [4 3 0]\n",
      "   state [1 0 0 1 1 1 0 1] state_WI [  0.33   0.32   0.51   0.45   0.42 -10.     0.83   0.28] sorted [6 2 3]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.33   0.32   0.51   0.45   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [0.33 0.32 0.22 0.44 0.47 0.91 0.83 0.28] sorted [5 6 4]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.83 0.28] sorted [5 6 3]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [0.84 0.32 0.22 0.44 0.42 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [0.84 0.32 0.22 0.45 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [0.33 0.32 0.22 0.45 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.83   0.28] sorted [0 6 2]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [1 1 0 0 1 1 0 1] state_WI [  0.33   0.34   0.51   0.44   0.42 -10.     0.83   0.28] sorted [6 2 3]\n",
      "instance 5, ep 5, state [1 1 1 0 1 1 0 1]\n",
      "   state [1 1 1 0 1 1 0 1] state_WI [  0.33   0.34   0.22   0.44   0.42 -10.     0.83   0.28] sorted [6 3 4]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [0.33 0.34 0.51 0.45 0.42 0.91 0.28 0.28] sorted [5 2 3]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.84   0.34   0.51   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [1 1 1 0 0 1 1 1] state_WI [  0.33   0.34   0.22   0.44   0.47 -10.     0.28   0.28] sorted [4 3 1]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [0.33 0.32 0.22 0.45 0.42 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.83   0.28] sorted [6 2 3]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [0.84 0.32 0.51 0.45 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.84   0.32   0.51   0.45   0.47 -10.     0.83   0.28] sorted [0 6 2]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [  0.84   0.32   0.51   0.45   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [1 1 1 0 0 1 0 0] state_WI [  0.33   0.34   0.22   0.44   0.47 -10.     0.83   0.67] sorted [6 7 4]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [0.33 0.34 0.51 0.44 0.42 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.33   0.32   0.22   0.44   0.42 -10.     0.83   0.67] sorted [6 7 3]\n",
      "   state [1 0 1 0 1 1 0 1] state_WI [  0.33   0.32   0.22   0.44   0.42 -10.     0.83   0.28] sorted [6 3 4]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "instance 5, ep 6, state [0 1 0 1 1 1 1 0]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.84   0.34   0.51   0.45   0.42 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.33   0.34   0.51   0.44   0.42 -10.     0.28   0.67] sorted [7 2 3]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.83   0.67] sorted [6 7 4]\n",
      "   state [1 0 1 0 1 1 0 1] state_WI [  0.33   0.32   0.22   0.44   0.42 -10.     0.83   0.28] sorted [6 3 4]\n",
      "   state [0 0 1 0 0 1 1 1] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.28   0.28] sorted [0 4 3]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 2 4]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.84   0.32   0.51   0.44   0.42 -10.     0.28   0.28] sorted [0 2 3]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [  0.33   0.32   0.22   0.45   0.42 -10.     0.28   0.67] sorted [7 3 4]\n",
      "   state [1 1 1 1 1 0 0 1] state_WI [0.33 0.34 0.22 0.45 0.42 0.91 0.83 0.28] sorted [5 6 3]\n",
      "   state [0 0 1 1 1 1 1 1] state_WI [  0.84   0.32   0.22   0.45   0.42 -10.     0.28   0.28] sorted [0 3 4]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.33   0.32   0.51   0.45   0.42 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "   state [1 1 1 0 0 1 0 0] state_WI [  0.33   0.34   0.22   0.44   0.47 -10.     0.83   0.67] sorted [6 7 4]\n",
      "   state [1 1 1 0 0 1 1 1] state_WI [  0.33   0.34   0.22   0.44   0.47 -10.     0.28   0.28] sorted [4 3 1]\n",
      "   state [0 1 1 1 1 0 0 1] state_WI [0.84 0.34 0.22 0.45 0.42 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [  0.33   0.34   0.51   0.45   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [0.84 0.34 0.51 0.44 0.42 0.91 0.28 0.67] sorted [5 0 7]\n",
      "instance 5, ep 7, state [0 0 0 1 0 1 1 1]\n",
      "   state [0 0 0 1 0 1 1 1] state_WI [  0.84   0.32   0.51   0.45   0.47 -10.     0.28   0.28] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.84   0.32   0.22   0.44   0.42 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [0.33 0.34 0.51 0.44 0.42 0.91 0.28 0.28] sorted [5 2 3]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [0.33 0.34 0.51 0.44 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 0 0 0 0 1 0 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "   state [0 0 1 0 0 1 0 1] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.83   0.28] sorted [0 6 4]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [0.84 0.32 0.51 0.45 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [0.33 0.32 0.51 0.45 0.47 0.91 0.28 0.28] sorted [5 2 4]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [0.84 0.32 0.51 0.45 0.42 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.84   0.32   0.22   0.44   0.42 -10.     0.28   0.67] sorted [0 7 3]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [0.84 0.34 0.51 0.45 0.42 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [  0.33   0.34   0.51   0.45   0.42 -10.     0.28   0.67] sorted [7 2 3]\n",
      "   state [0 1 1 1 1 1 1 1] state_WI [  0.84   0.34   0.22   0.45   0.42 -10.     0.28   0.28] sorted [0 3 4]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [0.33 0.34 0.22 0.44 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [0.33 0.34 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [1 0 0 0 0 1 0 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [0.33 0.34 0.51 0.44 0.42 0.91 0.28 0.28] sorted [5 2 3]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.33   0.32   0.51   0.45   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.83   0.28] sorted [0 6 2]\n",
      "instance 5, ep 8, state [0 1 1 0 1 1 0 1]\n",
      "   state [0 1 1 0 1 1 0 1] state_WI [  0.84   0.34   0.22   0.44   0.42 -10.     0.83   0.28] sorted [0 6 3]\n",
      "   state [1 1 1 1 0 1 0 1] state_WI [  0.33   0.34   0.22   0.45   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [0.33 0.32 0.51 0.44 0.42 0.91 0.28 0.28] sorted [5 2 3]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.84   0.32   0.51   0.45   0.42 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.84   0.34   0.51   0.44   0.42 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [0.33 0.34 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [0.84 0.32 0.51 0.44 0.42 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.28] sorted [4 3 0]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [0.33 0.32 0.22 0.44 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [0.84 0.32 0.51 0.45 0.42 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.33   0.32   0.51   0.45   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [0.84 0.32 0.22 0.45 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 0 1 1 0 1 1 1] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.28   0.28] sorted [4 3 0]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [0.33 0.32 0.51 0.45 0.47 0.91 0.28 0.28] sorted [5 2 4]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "instance 5, ep 9, state [0 0 0 0 0 0 1 1]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.84   0.34   0.22   0.44   0.47 -10.     0.83   0.28] sorted [0 6 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.28 0.28] sorted [5 3 4]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.28 0.67] sorted [5 7 3]\n",
      "   state [1 0 1 1 0 1 1 1] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.28   0.28] sorted [4 3 0]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [0.84 0.32 0.22 0.44 0.42 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [1 1 0 1 0 1 1 1] state_WI [  0.33   0.34   0.51   0.45   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [1 1 1 0 0 1 1 1] state_WI [  0.33   0.34   0.22   0.44   0.47 -10.     0.28   0.28] sorted [4 3 1]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [0.84 0.34 0.22 0.44 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.28] sorted [4 3 0]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [0.84 0.32 0.51 0.44 0.42 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [0 7 4]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 2 4]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "instance 5, ep 10, state [1 0 0 1 0 0 1 0]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [0.33 0.32 0.51 0.45 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [0 0 1 0 0 1 1 1] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.28   0.28] sorted [0 4 3]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.83   0.28] sorted [6 2 3]\n",
      "   state [0 1 1 0 1 0 0 1] state_WI [0.84 0.34 0.22 0.44 0.42 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [0.33 0.32 0.22 0.44 0.47 0.91 0.83 0.28] sorted [5 6 4]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [0.84 0.32 0.22 0.44 0.42 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.84   0.34   0.51   0.44   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [1 0 1 1 0 1 0 1] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [0.33 0.32 0.22 0.45 0.47 0.91 0.28 0.28] sorted [5 4 3]\n",
      "   state [1 0 1 1 0 1 0 0] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.83   0.67] sorted [6 7 4]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [0.33 0.34 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 2 4]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.33   0.34   0.51   0.44   0.42 -10.     0.28   0.67] sorted [7 2 3]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [0 2 4]\n",
      "instance 5, ep 11, state [1 1 0 0 1 0 0 1]\n",
      "   state [1 1 0 0 1 0 0 1] state_WI [0.33 0.34 0.51 0.44 0.42 0.91 0.83 0.28] sorted [5 6 2]\n",
      "   state [0 1 0 0 1 1 1 1] state_WI [  0.84   0.34   0.51   0.44   0.42 -10.     0.28   0.28] sorted [0 2 3]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [  0.33   0.34   0.22   0.45   0.42 -10.     0.28   0.67] sorted [7 3 4]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [0.84 0.34 0.22 0.45 0.42 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [0 2 4]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [0.33 0.32 0.51 0.45 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 1 0 0 0 1 1 1] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [1 1 1 0 0 1 1 0] state_WI [  0.33   0.34   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [0.33 0.34 0.51 0.44 0.42 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.84   0.34   0.22   0.44   0.47 -10.     0.28   0.67] sorted [0 7 4]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.28] sorted [4 3 0]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [0.33 0.34 0.51 0.45 0.42 0.91 0.83 0.28] sorted [5 6 2]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.28] sorted [4 3 0]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.33 0.34 0.51 0.45 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "instance 5, ep 12, state [0 1 1 0 0 0 0 0]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [0.84 0.34 0.22 0.44 0.47 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [0.84 0.32 0.22 0.45 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [1 1 1 0 0 1 1 0] state_WI [  0.33   0.34   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.84   0.34   0.51   0.44   0.42 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [0.84 0.34 0.22 0.44 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [1 1 1 1 0 1 0 1] state_WI [  0.33   0.34   0.22   0.45   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "   state [1 0 0 0 0 1 0 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "   state [0 0 1 0 1 1 0 1] state_WI [  0.84   0.32   0.22   0.44   0.42 -10.     0.83   0.28] sorted [0 6 3]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [0.84 0.32 0.22 0.44 0.42 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 0 0 0 1 1 1 1] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.28   0.28] sorted [2 3 4]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.84   0.32   0.51   0.45   0.47 -10.     0.83   0.28] sorted [0 6 2]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.84   0.34   0.51   0.45   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.84   0.34   0.22   0.44   0.47 -10.     0.28   0.67] sorted [0 7 4]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [0.33 0.34 0.51 0.44 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.84   0.34   0.51   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "instance 5, ep 13, state [1 0 1 1 1 1 0 1]\n",
      "   state [1 0 1 1 1 1 0 1] state_WI [  0.33   0.32   0.22   0.45   0.42 -10.     0.83   0.28] sorted [6 3 4]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [0.33 0.32 0.22 0.45 0.42 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 1 0 1 1 1 0 0] state_WI [  0.33   0.34   0.51   0.45   0.42 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [0.84 0.34 0.22 0.44 0.47 0.91 0.28 0.28] sorted [5 0 4]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [0.33 0.34 0.51 0.44 0.42 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [1 1 1 0 0 1 0 1] state_WI [  0.33   0.34   0.22   0.44   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.84   0.34   0.51   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 1 0 0 0 0 0 1] state_WI [0.33 0.34 0.51 0.44 0.47 0.91 0.83 0.28] sorted [5 6 2]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [0.33 0.34 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [1 0 0 0 0 1 0 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [0.84 0.34 0.22 0.44 0.42 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [1 1 1 0 0 1 0 0] state_WI [  0.33   0.34   0.22   0.44   0.47 -10.     0.83   0.67] sorted [6 7 4]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.33   0.34   0.51   0.44   0.42 -10.     0.28   0.67] sorted [7 2 3]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.33 0.34 0.51 0.45 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "instance 5, ep 14, state [1 0 0 1 0 0 0 0]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [0.33 0.32 0.51 0.45 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [0.33 0.32 0.22 0.44 0.47 0.91 0.28 0.28] sorted [5 4 3]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.33   0.32   0.51   0.45   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [0.84 0.32 0.51 0.45 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.84   0.32   0.22   0.45   0.47 -10.     0.28   0.67] sorted [0 7 4]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.84   0.32   0.51   0.45   0.42 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.84   0.32   0.51   0.44   0.42 -10.     0.28   0.28] sorted [0 2 3]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [0.33 0.32 0.51 0.45 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [0 7 4]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.83 0.28] sorted [5 6 2]\n",
      "   state [1 0 0 0 0 1 0 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [0 2 4]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.84   0.32   0.51   0.44   0.42 -10.     0.28   0.28] sorted [0 2 3]\n",
      "   state [1 0 1 1 0 1 0 0] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.83   0.67] sorted [6 7 4]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [0.33 0.32 0.22 0.45 0.47 0.91 0.28 0.67] sorted [5 7 4]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.84   0.32   0.51   0.44   0.42 -10.     0.83   0.28] sorted [0 6 2]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.28   0.67] sorted [7 2 3]\n",
      "instance 5, ep 15, state [1 1 1 0 0 0 0 0]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [0.33 0.34 0.22 0.44 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [0.33 0.32 0.51 0.45 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.84   0.34   0.51   0.44   0.42 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.84   0.32   0.51   0.44   0.42 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.28 0.28] sorted [5 0 4]\n",
      "   state [1 1 1 0 0 0 1 0] state_WI [0.33 0.34 0.22 0.44 0.47 0.91 0.28 0.67] sorted [5 7 4]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [0.33 0.34 0.22 0.44 0.42 0.91 0.28 0.28] sorted [5 3 4]\n",
      "   state [1 0 0 1 0 1 1 0] state_WI [  0.33   0.32   0.51   0.45   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [0.84 0.32 0.22 0.45 0.42 0.91 0.28 0.28] sorted [5 0 3]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [0.84 0.32 0.22 0.45 0.42 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.33 0.34 0.51 0.45 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [0 1 0 0 0 1 0 1] state_WI [  0.84   0.34   0.51   0.44   0.47 -10.     0.83   0.28] sorted [0 6 2]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [0.33 0.32 0.22 0.44 0.47 0.91 0.28 0.28] sorted [5 4 3]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [0.33 0.32 0.22 0.44 0.47 0.91 0.83 0.28] sorted [5 6 4]\n",
      "instance 5, ep 16, state [1 0 1 0 0 0 1 1]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [0.33 0.32 0.22 0.44 0.47 0.91 0.28 0.28] sorted [5 4 3]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.28 0.28] sorted [5 3 4]\n",
      "   state [1 0 1 1 0 1 0 1] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [0.33 0.32 0.22 0.45 0.47 0.91 0.28 0.28] sorted [5 4 3]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.84   0.32   0.51   0.44   0.42 -10.     0.28   0.28] sorted [0 2 3]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [0.33 0.32 0.22 0.44 0.47 0.91 0.83 0.28] sorted [5 6 4]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [0.33 0.32 0.22 0.44 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [0 0 1 0 0 1 1 1] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.28   0.28] sorted [0 4 3]\n",
      "   state [0 0 1 0 0 1 0 1] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.83   0.28] sorted [0 6 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.28 0.67] sorted [5 7 3]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.84   0.32   0.51   0.44   0.42 -10.     0.83   0.28] sorted [0 6 2]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [0.33 0.32 0.22 0.45 0.47 0.91 0.28 0.67] sorted [5 7 4]\n",
      "   state [0 0 1 0 1 1 0 1] state_WI [  0.84   0.32   0.22   0.44   0.42 -10.     0.83   0.28] sorted [0 6 3]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [0.84 0.32 0.22 0.44 0.42 0.91 0.28 0.28] sorted [5 0 3]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [0 2 4]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [0.33 0.34 0.22 0.44 0.47 0.91 0.28 0.28] sorted [5 4 3]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [  0.33   0.34   0.51   0.45   0.42 -10.     0.28   0.67] sorted [7 2 3]\n",
      "instance 5, ep 17, state [1 0 0 1 0 1 0 0]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.33   0.32   0.51   0.45   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [  0.33   0.32   0.22   0.45   0.42 -10.     0.28   0.67] sorted [7 3 4]\n",
      "   state [0 1 1 1 1 1 0 0] state_WI [  0.84   0.34   0.22   0.45   0.42 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 1 0 0 0 1 1 1] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.84   0.34   0.22   0.44   0.47 -10.     0.83   0.28] sorted [0 6 4]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [0.84 0.32 0.51 0.45 0.42 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [0 2 4]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [0.33 0.34 0.22 0.44 0.42 0.91 0.28 0.28] sorted [5 3 4]\n",
      "   state [1 1 1 0 1 1 1 1] state_WI [  0.33   0.34   0.22   0.44   0.42 -10.     0.28   0.28] sorted [3 4 1]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.83 0.28] sorted [5 6 3]\n",
      "   state [1 0 1 1 0 1 0 1] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.84   0.32   0.22   0.45   0.47 -10.     0.28   0.28] sorted [0 4 3]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [0 2 4]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [0.33 0.32 0.51 0.44 0.42 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [0 7 4]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.84   0.34   0.22   0.44   0.47 -10.     0.28   0.67] sorted [0 7 4]\n",
      "instance 5, ep 18, state [0 0 1 0 0 0 0 1]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.84   0.32   0.22   0.45   0.47 -10.     0.83   0.28] sorted [0 6 4]\n",
      "   state [1 1 0 0 0 1 1 1] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.28   0.67] sorted [7 2 3]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [0.84 0.32 0.22 0.45 0.47 0.91 0.28 0.28] sorted [5 0 4]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [0.84 0.34 0.51 0.45 0.47 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.33 0.34 0.51 0.45 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 2 4]\n",
      "   state [0 0 1 0 0 1 1 1] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.28   0.28] sorted [0 4 3]\n",
      "   state [1 0 1 0 1 1 0 1] state_WI [  0.33   0.32   0.22   0.44   0.42 -10.     0.83   0.28] sorted [6 3 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [0.84 0.32 0.51 0.44 0.42 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [0.33 0.34 0.51 0.44 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.83   0.28] sorted [0 6 2]\n",
      "   state [1 1 1 0 0 0 1 0] state_WI [0.33 0.34 0.22 0.44 0.47 0.91 0.28 0.67] sorted [5 7 4]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.84   0.32   0.22   0.45   0.47 -10.     0.28   0.67] sorted [0 7 4]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.28 0.28] sorted [5 0 4]\n",
      "   state [1 1 0 0 1 1 0 1] state_WI [  0.33   0.34   0.51   0.44   0.42 -10.     0.83   0.28] sorted [6 2 3]\n",
      "   state [1 1 1 1 1 1 1 1] state_WI [  0.33   0.34   0.22   0.45   0.42 -10.     0.28   0.28] sorted [3 4 1]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [0.84 0.32 0.51 0.45 0.47 0.91 0.83 0.67] sorted [5 0 6]\n",
      "instance 5, ep 19, state [1 1 1 0 1 0 0 1]\n",
      "   state [1 1 1 0 1 0 0 1] state_WI [0.33 0.34 0.22 0.44 0.42 0.91 0.83 0.28] sorted [5 6 3]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [0.84 0.34 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [1 1 1 0 0 1 0 1] state_WI [  0.33   0.34   0.22   0.44   0.47 -10.     0.83   0.28] sorted [6 4 3]\n",
      "   state [1 1 1 0 1 1 0 1] state_WI [  0.33   0.34   0.22   0.44   0.42 -10.     0.83   0.28] sorted [6 3 4]\n",
      "   state [1 1 1 0 1 1 0 1] state_WI [  0.33   0.34   0.22   0.44   0.42 -10.     0.83   0.28] sorted [6 3 4]\n",
      "   state [0 1 0 0 1 1 1 1] state_WI [  0.84   0.34   0.51   0.44   0.42 -10.     0.28   0.28] sorted [0 2 3]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.84   0.32   0.51   0.45   0.47 -10.     0.83   0.28] sorted [0 6 2]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [0.33 0.34 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [0.84 0.34 0.51 0.44 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.84   0.34   0.51   0.44   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 2 4]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.84   0.34   0.22   0.44   0.47 -10.     0.83   0.28] sorted [0 6 4]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.84   0.32   0.22   0.45   0.47 -10.     0.83   0.28] sorted [0 6 4]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "instance 5, ep 20, state [0 1 0 1 1 1 1 1]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.84   0.34   0.51   0.45   0.42 -10.     0.28   0.28] sorted [0 2 3]\n",
      "   state [0 1 1 1 1 1 0 1] state_WI [  0.84   0.34   0.22   0.45   0.42 -10.     0.83   0.28] sorted [0 6 3]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [0.33 0.34 0.51 0.45 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.83   0.28] sorted [0 6 2]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.83   0.28] sorted [0 6 2]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.28 0.28] sorted [5 0 4]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [0.84 0.34 0.51 0.44 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 1 0 0 0 1 1 1] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.84   0.32   0.22   0.45   0.47 -10.     0.83   0.28] sorted [0 6 4]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [1 0 0 0 0 1 0 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "   state [1 0 1 1 1 0 0 1] state_WI [0.33 0.32 0.22 0.45 0.42 0.91 0.83 0.28] sorted [5 6 3]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [  0.33   0.34   0.51   0.45   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [0 2 4]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [0.33 0.32 0.51 0.45 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.84   0.32   0.51   0.45   0.47 -10.     0.83   0.28] sorted [0 6 2]\n",
      "instance 5, ep 21, state [0 1 0 1 1 1 0 0]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.84   0.34   0.51   0.45   0.42 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [0.33 0.32 0.22 0.45 0.47 0.91 0.28 0.28] sorted [5 4 3]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.84   0.32   0.22   0.45   0.47 -10.     0.28   0.67] sorted [0 7 4]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [0.33 0.32 0.22 0.44 0.47 0.91 0.83 0.28] sorted [5 6 4]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [0.33 0.32 0.51 0.45 0.47 0.91 0.28 0.28] sorted [5 2 4]\n",
      "   state [0 0 1 1 1 1 1 1] state_WI [  0.84   0.32   0.22   0.45   0.42 -10.     0.28   0.28] sorted [0 3 4]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [0.33 0.32 0.51 0.45 0.42 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.33   0.32   0.51   0.45   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "   state [1 0 1 0 1 1 1 1] state_WI [  0.33   0.32   0.22   0.44   0.42 -10.     0.28   0.28] sorted [3 4 0]\n",
      "   state [1 0 1 1 1 1 1 1] state_WI [  0.33   0.32   0.22   0.45   0.42 -10.     0.28   0.28] sorted [3 4 0]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [  0.33   0.32   0.22   0.45   0.42 -10.     0.28   0.67] sorted [7 3 4]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [0.84 0.32 0.22 0.45 0.42 0.91 0.28 0.28] sorted [5 0 3]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.84   0.32   0.22   0.45   0.47 -10.     0.83   0.28] sorted [0 6 4]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.84   0.34   0.51   0.45   0.47 -10.     0.28   0.28] sorted [0 2 4]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [0.33 0.34 0.22 0.44 0.42 0.91 0.28 0.28] sorted [5 3 4]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.83 0.28] sorted [5 6 2]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.83   0.28] sorted [6 2 3]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.83   0.67] sorted [6 7 4]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.84   0.34   0.51   0.44   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "instance 5, ep 22, state [1 0 0 0 1 1 0 0]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [1 1 0 0 1 1 1 1] state_WI [  0.33   0.34   0.51   0.44   0.42 -10.     0.28   0.28] sorted [2 3 4]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [0.84 0.34 0.51 0.44 0.42 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [0 1 1 0 1 1 1 1] state_WI [  0.84   0.34   0.22   0.44   0.42 -10.     0.28   0.28] sorted [0 3 4]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.84   0.32   0.51   0.45   0.47 -10.     0.83   0.28] sorted [0 6 2]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [0 2 4]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.83   0.28] sorted [6 2 3]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [0.84 0.32 0.22 0.45 0.47 0.91 0.28 0.28] sorted [5 0 4]\n",
      "   state [1 0 1 1 0 1 0 0] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.83   0.67] sorted [6 7 4]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.28 0.28] sorted [5 0 4]\n",
      "   state [1 0 1 1 0 1 1 1] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.28   0.28] sorted [4 3 0]\n",
      "   state [1 0 0 1 1 0 1 1] state_WI [0.33 0.32 0.51 0.45 0.42 0.91 0.28 0.28] sorted [5 2 3]\n",
      "   state [0 0 0 1 0 1 1 1] state_WI [  0.84   0.32   0.51   0.45   0.47 -10.     0.28   0.28] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 1 1 1] state_WI [  0.33   0.32   0.22   0.44   0.42 -10.     0.28   0.28] sorted [3 4 0]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [1 1 1 0 0 1 1 0] state_WI [  0.33   0.34   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [0.84 0.32 0.22 0.45 0.47 0.91 0.28 0.28] sorted [5 0 4]\n",
      "   state [1 1 1 1 1 1 0 0] state_WI [  0.33   0.34   0.22   0.45   0.42 -10.     0.83   0.67] sorted [6 7 3]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.42 -10.     0.28   0.67] sorted [7 3 4]\n",
      "instance 5, ep 23, state [0 1 1 0 0 0 1 1]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [0.84 0.34 0.22 0.44 0.47 0.91 0.28 0.28] sorted [5 0 4]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [0.33 0.34 0.22 0.44 0.42 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.84   0.32   0.22   0.45   0.47 -10.     0.28   0.67] sorted [0 7 4]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [0.33 0.34 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 2 4]\n",
      "   state [1 0 1 0 1 1 1 1] state_WI [  0.33   0.32   0.22   0.44   0.42 -10.     0.28   0.28] sorted [3 4 0]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [0.33 0.32 0.22 0.45 0.42 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [0.84 0.34 0.22 0.44 0.42 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [0.33 0.34 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.33   0.32   0.51   0.45   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [0.84 0.32 0.22 0.45 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.84   0.32   0.51   0.44   0.42 -10.     0.83   0.28] sorted [0 6 2]\n",
      "   state [0 0 1 0 0 1 1 1] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.28   0.28] sorted [0 4 3]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.83   0.28] sorted [6 2 3]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [0.84 0.32 0.51 0.44 0.42 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [1 1 0 0 0 1 1 1] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [0.33 0.34 0.22 0.44 0.42 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.84   0.32   0.51   0.44   0.42 -10.     0.28   0.67] sorted [0 7 2]\n",
      "instance 5, ep 24, state [0 0 0 1 0 1 1 0]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [  0.84   0.32   0.51   0.45   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.33   0.32   0.51   0.45   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [0.84 0.34 0.51 0.45 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 0 0 1 0 1 1 1] state_WI [  0.33   0.32   0.51   0.45   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.84   0.34   0.51   0.45   0.47 -10.     0.83   0.28] sorted [0 6 2]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.84   0.32   0.22   0.45   0.47 -10.     0.28   0.67] sorted [0 7 4]\n",
      "   state [1 0 1 1 0 0 0 1] state_WI [0.33 0.32 0.22 0.45 0.47 0.91 0.83 0.28] sorted [5 6 4]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.42 -10.     0.28   0.67] sorted [7 3 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.83 0.28] sorted [5 6 3]\n",
      "   state [1 0 0 1 0 0 1 0] state_WI [0.33 0.32 0.51 0.45 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [  0.33   0.32   0.51   0.45   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.84   0.32   0.22   0.44   0.42 -10.     0.28   0.67] sorted [0 7 3]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.83   0.28] sorted [0 6 2]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [0.33 0.34 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 2 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "instance 5, ep 25, state [0 0 1 1 1 1 0 1]\n",
      "   state [0 0 1 1 1 1 0 1] state_WI [  0.84   0.32   0.22   0.45   0.42 -10.     0.83   0.28] sorted [0 6 3]\n",
      "   state [1 0 1 1 1 0 1 1] state_WI [0.33 0.32 0.22 0.45 0.42 0.91 0.28 0.28] sorted [5 3 4]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [0.84 0.32 0.22 0.45 0.42 0.91 0.28 0.28] sorted [5 0 3]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.84   0.32   0.51   0.44   0.42 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [0.33 0.32 0.51 0.44 0.42 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [0.33 0.34 0.22 0.44 0.47 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.28] sorted [4 3 0]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [0.33 0.34 0.51 0.44 0.42 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [0.33 0.32 0.51 0.44 0.42 0.91 0.28 0.28] sorted [5 2 3]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [0.33 0.34 0.22 0.44 0.42 0.91 0.28 0.28] sorted [5 3 4]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.28] sorted [4 3 0]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [0.84 0.34 0.51 0.44 0.42 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [0.33 0.34 0.22 0.44 0.42 0.91 0.28 0.28] sorted [5 3 4]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.42 -10.     0.28   0.67] sorted [7 3 4]\n",
      "instance 5, ep 26, state [1 0 1 1 1 1 1 1]\n",
      "   state [1 0 1 1 1 1 1 1] state_WI [  0.33   0.32   0.22   0.45   0.42 -10.     0.28   0.28] sorted [3 4 0]\n",
      "   state [1 1 1 1 0 1 1 0] state_WI [  0.33   0.34   0.22   0.45   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [1 1 1 1 1 0 0 1] state_WI [0.33 0.34 0.22 0.45 0.42 0.91 0.83 0.28] sorted [5 6 3]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.84   0.32   0.22   0.45   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.84   0.34   0.51   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.84   0.34   0.22   0.45   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.83 0.28] sorted [5 6 2]\n",
      "   state [0 0 1 0 0 1 0 1] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.83   0.28] sorted [0 6 4]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [  0.84   0.32   0.22   0.45   0.42 -10.     0.28   0.67] sorted [0 7 3]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [0.84 0.34 0.22 0.45 0.47 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [0 7 4]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [0.33 0.34 0.22 0.45 0.47 0.91 0.83 0.28] sorted [5 6 4]\n",
      "   state [1 1 0 1 1 1 1 1] state_WI [  0.33   0.34   0.51   0.45   0.42 -10.     0.28   0.28] sorted [2 3 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [0.84 0.32 0.22 0.44 0.42 0.91 0.83 0.67] sorted [5 0 6]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.28   0.67] sorted [7 2 3]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.33   0.32   0.51   0.45   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [0.84 0.32 0.22 0.45 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.84   0.34   0.22   0.45   0.47 -10.     0.28   0.28] sorted [0 4 3]\n",
      "instance 5, ep 27, state [0 0 1 0 0 0 0 1]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [0.84 0.32 0.22 0.44 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [1 1 0 0 0 1 1 1] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [1 0 0 1 1 1 1 1] state_WI [  0.33   0.32   0.51   0.45   0.42 -10.     0.28   0.28] sorted [2 3 4]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [0.33 0.32 0.51 0.45 0.47 0.91 0.28 0.28] sorted [5 2 4]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.84   0.32   0.51   0.44   0.42 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.84   0.34   0.51   0.44   0.47 -10.     0.28   0.28] sorted [0 2 4]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.84   0.34   0.51   0.44   0.47 -10.     0.28   0.28] sorted [0 2 4]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.83   0.67] sorted [6 7 2]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [0.84 0.34 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 2 4]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [0.33 0.32 0.22 0.44 0.47 0.91 0.83 0.28] sorted [5 6 4]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.84   0.32   0.22   0.44   0.42 -10.     0.28   0.67] sorted [0 7 3]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [0.33 0.32 0.51 0.45 0.42 0.91 0.83 0.67] sorted [5 6 7]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [1 1 0 0 0 1 1 1] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [0.33 0.32 0.51 0.44 0.42 0.91 0.28 0.28] sorted [5 2 3]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [0 7 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.83 0.28] sorted [5 6 3]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.84   0.34   0.22   0.45   0.47 -10.     0.83   0.28] sorted [0 6 4]\n",
      "instance 5, ep 28, state [1 0 0 0 1 1 0 1]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.33   0.32   0.51   0.44   0.42 -10.     0.83   0.28] sorted [6 2 3]\n",
      "   state [0 0 1 0 0 1 1 1] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.28   0.28] sorted [0 4 3]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [0.33 0.32 0.22 0.45 0.47 0.91 0.28 0.28] sorted [5 4 3]\n",
      "   state [0 1 1 1 1 1 1 1] state_WI [  0.84   0.34   0.22   0.45   0.42 -10.     0.28   0.28] sorted [0 3 4]\n",
      "   state [1 1 0 1 0 1 1 1] state_WI [  0.33   0.34   0.51   0.45   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.28   0.67] sorted [7 2 4]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [0.84 0.34 0.22 0.44 0.47 0.91 0.28 0.67] sorted [5 0 7]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.84   0.34   0.22   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [1 0 1 1 0 1 1 1] state_WI [  0.33   0.32   0.22   0.45   0.47 -10.     0.28   0.28] sorted [4 3 0]\n",
      "   state [1 0 0 1 1 0 1 1] state_WI [0.33 0.32 0.51 0.45 0.42 0.91 0.28 0.28] sorted [5 2 3]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [0.33 0.32 0.51 0.45 0.47 0.91 0.83 0.28] sorted [5 6 2]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.83   0.67] sorted [6 7 4]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [0.33 0.32 0.51 0.44 0.47 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.84   0.34   0.22   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [0.84 0.32 0.22 0.44 0.42 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 1 1 0 1 1 0 1] state_WI [  0.33   0.34   0.22   0.44   0.42 -10.     0.83   0.28] sorted [6 3 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.28 0.28] sorted [5 3 4]\n",
      "instance 5, ep 29, state [1 1 1 0 1 0 1 1]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [0.33 0.34 0.22 0.44 0.42 0.91 0.28 0.28] sorted [5 3 4]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.83   0.67] sorted [6 7 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.83 0.28] sorted [5 6 3]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.84   0.34   0.22   0.44   0.47 -10.     0.83   0.67] sorted [0 6 7]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [0.33 0.34 0.51 0.44 0.42 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.33   0.34   0.51   0.44   0.47 -10.     0.83   0.28] sorted [6 2 4]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [0.84 0.32 0.51 0.44 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [0.84 0.34 0.51 0.44 0.47 0.91 0.28 0.28] sorted [5 0 2]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [0.84 0.34 0.51 0.44 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [  0.33   0.32   0.51   0.44   0.47 -10.     0.28   0.28] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.84   0.32   0.22   0.44   0.42 -10.     0.28   0.67] sorted [0 7 3]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [0.84 0.32 0.51 0.45 0.47 0.91 0.83 0.28] sorted [5 0 6]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [0.33 0.32 0.22 0.45 0.42 0.91 0.28 0.67] sorted [5 7 3]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [0.33 0.34 0.51 0.45 0.42 0.91 0.28 0.67] sorted [5 7 2]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.33   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [7 4 3]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [0.33 0.32 0.22 0.44 0.42 0.91 0.28 0.28] sorted [5 3 4]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.84   0.32   0.51   0.44   0.47 -10.     0.28   0.67] sorted [0 7 2]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.84   0.32   0.22   0.44   0.47 -10.     0.28   0.67] sorted [0 7 4]\n",
      "first state [0 1 0 1 0 1 0 1]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [  0.26   0.89   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [  0.26   0.89   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 1 1 1 0 1 1 0] state_WI [  0.26   0.31   0.34   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [1 1 1 1 1 1 0 0] state_WI [  0.26   0.31   0.34   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.39   0.89   0.34   0.48   0.91   0.39   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 1 0 1 1 0 1] state_WI [  0.39   0.89   0.34   0.48   0.38   0.39   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.39   0.89   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 1 3]\n",
      "instance 6, ep 1, state [1 1 1 1 1 0 1 0]\n",
      "   state [1 1 1 1 1 0 1 0] state_WI [  0.26   0.31   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.39   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 1 1 1 0 0 0 0] state_WI [  0.26   0.31   0.34   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26   0.31   0.32   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 1 1 0 1 0] state_WI [  0.39   0.89   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.26   0.89   0.34   0.48   0.91   0.39   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.39   0.31   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 1 1 1 0 0 1 1] state_WI [  0.26   0.31   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "instance 6, ep 2, state [0 0 0 1 1 1 1 0]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.26   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [  0.39   0.89   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [  0.26   0.31   0.34   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.39   0.89   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [  0.39   0.31   0.34   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.39   0.89   0.34   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [  0.39   0.31   0.34   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "instance 6, ep 3, state [0 0 0 0 0 1 1 1]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.39   0.89   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [  0.26   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 1 1 1 0 1 1 0] state_WI [  0.26   0.31   0.34   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [1 1 1 1 1 1 1 1] state_WI [  0.26   0.31   0.34   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 1 1 0 1 1 0] state_WI [  0.39   0.31   0.34   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.39   0.89   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.39   0.89   0.32   0.3    0.91   0.39   0.47 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [  0.26   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [  0.26   0.89   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [  0.26   0.31   0.32   0.3    0.91   0.39   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "instance 6, ep 4, state [1 1 0 1 1 0 0 1]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.26   0.31   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.39   0.89   0.34   0.3    0.91   0.39   0.47 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 1 0 1 1 1 1] state_WI [  0.39   0.89   0.34   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.39   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.39   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.39   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [  0.39   0.89   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "instance 6, ep 5, state [0 1 1 0 0 0 0 0]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.26   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.39   0.89   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [  0.26   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [  0.39   0.31   0.34   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [  0.39   0.31   0.34   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [0 0 1 1 1 1 0 0] state_WI [  0.39   0.89   0.34   0.3    0.38   0.39   0.47 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26   0.31   0.32   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "instance 6, ep 6, state [1 0 1 0 1 0 0 1]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [  0.26   0.89   0.34   0.48   0.38   0.47   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [  0.26   0.31   0.34   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [  0.26   0.89   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [  0.26   0.89   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [  0.39   0.31   0.34   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [  0.26   0.89   0.34   0.3    0.91   0.47   0.47 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.39   0.89   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 0 1 0 1 1 0] state_WI [  0.26   0.89   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [1 0 0 1 0 1 1 1] state_WI [  0.26   0.89   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "instance 6, ep 7, state [1 0 1 0 0 0 0 1]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [  0.26   0.89   0.34   0.48   0.91   0.47   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [  0.26   0.89   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.26   0.89   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.39   0.89   0.32   0.3    0.91   0.39   0.47 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.26   0.31   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [1 1 1 1 1 0 1 0] state_WI [  0.26   0.31   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [  0.26   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [  0.39   0.89   0.34   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.39   0.89   0.34   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [  0.39   0.31   0.34   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "instance 6, ep 8, state [0 0 1 1 0 1 0 1]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.39   0.89   0.34   0.3    0.91   0.39   0.47 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [  0.39   0.31   0.34   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.26   0.89   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [  0.26   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [  0.26   0.89   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 1 1 1 0 1 0] state_WI [  0.39   0.89   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.26   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [  0.26   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 1 1 1 0 1 0] state_WI [  0.39   0.89   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.39   0.89   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.39   0.89   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 0 0 1 0 0 1] state_WI [  0.26   0.31   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "instance 6, ep 9, state [1 1 0 0 0 0 0 1]\n",
      "   state [1 1 0 0 0 0 0 1] state_WI [  0.26   0.31   0.32   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [  0.26   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [  0.26   0.31   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [  0.26   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [1 1 1 0 1 0 0 1] state_WI [  0.26   0.31   0.34   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [  0.39   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.39   0.31   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.39   0.89   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [  0.26   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "instance 6, ep 10, state [0 0 1 0 1 0 0 0]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.47   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [  0.39   0.31   0.34   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.47   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [1 1 0 0 1 0 0 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.26   0.89   0.32   0.3    0.91   0.39   0.47 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.26   0.89   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 1 1 1 0 0] state_WI [  0.26   0.89   0.34   0.3    0.38   0.39   0.47 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.39   0.89   0.32   0.3    0.91   0.47   0.47 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [  0.39   0.89   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [  0.26   0.31   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [  0.26   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.47 -10.  ] sorted [4 6 5]\n",
      "instance 6, ep 11, state [0 1 0 1 0 0 1 0]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.39   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 0 1 1 1 0 1 0] state_WI [  0.39   0.89   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.39   0.31   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [  0.26   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 0 1 0 1 1 0] state_WI [  0.26   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.39   0.89   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 1 0 1 1 1 0 1] state_WI [  0.26   0.31   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 1 0 1 0 1 1 0] state_WI [  0.26   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [  0.26   0.89   0.34   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 0 0 0 1 1 1] state_WI [  0.26   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "instance 6, ep 12, state [1 1 1 1 0 0 0 1]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.26   0.31   0.34   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 1 1 1 1 0 1 0] state_WI [  0.26   0.31   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [  0.26   0.89   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.39   0.89   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.39   0.89   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 1 0 1 1 1] state_WI [  0.39   0.89   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [1 0 0 1 1 1 0 0] state_WI [  0.26   0.89   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [1 6 5]\n",
      "instance 6, ep 13, state [1 0 1 0 1 0 1 1]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [  0.26   0.89   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [  0.26   0.89   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [  0.26   0.31   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 0 1 1 1 1] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.39   0.89   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 1 1 1 1 0 1 1] state_WI [  0.26   0.31   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [  0.26   0.31   0.34   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [  0.26   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "instance 6, ep 14, state [0 0 0 0 0 1 1 1]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.39   0.89   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.39   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.39   0.89   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [  0.26   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 0 0 1 0 1 1 1] state_WI [  0.39   0.89   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [  0.26   0.31   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [1 1 0 1 0 0 0 1] state_WI [  0.26   0.31   0.32   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [  0.39   0.89   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "instance 6, ep 15, state [0 1 1 0 1 1 0 0]\n",
      "   state [0 1 1 0 1 1 0 0] state_WI [  0.39   0.31   0.34   0.48   0.38   0.39   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [  0.39   0.31   0.34   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.26   0.89   0.34   0.48   0.91   0.39   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [  0.26   0.89   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.26   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.39   0.89   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "instance 6, ep 16, state [0 0 1 1 1 0 0 1]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.39   0.89   0.34   0.3    0.38   0.47   0.47 -10.  ] sorted [1 6 5]\n",
      "   state [0 0 0 1 1 1 0 1] state_WI [  0.39   0.89   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [  0.39   0.89   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.39   0.31   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [1 1 1 0 1 1 1 0] state_WI [  0.26   0.31   0.34   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [  0.26   0.89   0.34   0.48   0.91   0.39   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [0 1 1 1 1 1 0 0] state_WI [  0.39   0.31   0.34   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [1 1 1 0 0 1 0 0] state_WI [  0.26   0.31   0.34   0.48   0.91   0.39   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [  0.26   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [  0.39   0.31   0.34   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [  0.26   0.89   0.34   0.48   0.91   0.47   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "instance 6, ep 17, state [1 0 1 1 0 0 1 0]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [  0.26   0.89   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [  0.39   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.39   0.89   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [  0.39   0.31   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 0 0 1 1 1 1 0] state_WI [  0.26   0.89   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [  0.39   0.31   0.34   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.26   0.89   0.34   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.39   0.89   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "instance 6, ep 18, state [0 0 0 1 1 0 1 1]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.39   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [  0.39   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 1 1 0 0 0 1 0] state_WI [  0.26   0.31   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.39   0.31   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 1 1 0 0 0 0] state_WI [  0.26   0.31   0.34   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 1 1 1 1 1 0 0] state_WI [  0.26   0.31   0.34   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.26   0.31   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.26   0.31   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.26   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [1 1 1 0 1 1 0 0] state_WI [  0.26   0.31   0.34   0.48   0.38   0.39   0.47 -10.  ] sorted [3 6 5]\n",
      "instance 6, ep 19, state [1 0 0 1 1 0 0 0]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [  0.26   0.89   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26   0.31   0.32   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [  0.26   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.39   0.31   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.39   0.89   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.26   0.89   0.34   0.48   0.38   0.39   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 0 1 1 1 1 0 0] state_WI [  0.39   0.89   0.34   0.3    0.38   0.39   0.47 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [  0.26   0.31   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.26   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.47   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.47   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.39   0.89   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "instance 6, ep 20, state [1 1 0 0 1 1 0 1]\n",
      "   state [1 1 0 0 1 1 0 1] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [1 0 1 1 0 1 0 1] state_WI [  0.26   0.89   0.34   0.3    0.91   0.39   0.47 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [  0.39   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [  0.39   0.31   0.34   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 0]\n",
      "instance 6, ep 21, state [1 0 1 0 1 1 1 1]\n",
      "   state [1 0 1 0 1 1 1 1] state_WI [  0.26   0.89   0.34   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [  0.26   0.89   0.34   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [  0.26   0.89   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [1 1 0 0 1 0 0 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 1 1 0 0 0 1 0] state_WI [  0.26   0.31   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [  0.26   0.31   0.34   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [  0.26   0.89   0.34   0.48   0.38   0.39   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [1 0 0 0 0 1 0 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [  0.26   0.89   0.34   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 1 0 1 1 0 0] state_WI [  0.39   0.31   0.34   0.48   0.38   0.39   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [  0.39   0.31   0.34   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "instance 6, ep 22, state [0 1 1 0 1 1 0 1]\n",
      "   state [0 1 1 0 1 1 0 1] state_WI [  0.39   0.31   0.34   0.48   0.38   0.39   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.39   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [  0.39   0.31   0.34   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.26   0.31   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [  0.39   0.89   0.32   0.48   0.91   0.47   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.39   0.89   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.39   0.31   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.39   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.39   0.31   0.34   0.3    0.91   0.39   0.47 -10.  ] sorted [4 6 5]\n",
      "instance 6, ep 23, state [1 0 1 0 0 0 1 1]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [  0.26   0.89   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.39   0.89   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.39   0.31   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.26   0.89   0.32   0.48   0.91   0.47   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [1 1 1 1 1 0 0 0] state_WI [  0.26   0.31   0.34   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [  0.39   0.31   0.34   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.39   0.89   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [  0.26   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 1 0 1 1 1 0 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [  0.26   0.89   0.34   0.3    0.38   0.47   0.47 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [  0.26   0.31   0.34   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.26   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 1 1 1 0 1 1 0] state_WI [  0.26   0.31   0.34   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "instance 6, ep 24, state [0 0 1 0 1 1 1 1]\n",
      "   state [0 0 1 0 1 1 1 1] state_WI [  0.39   0.89   0.34   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [  0.39   0.89   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [  0.39   0.31   0.34   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 0 0 0 1 1 1 0] state_WI [  0.26   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.39   0.89   0.34   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.39   0.31   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 0 1 1 1 0 1 0] state_WI [  0.39   0.89   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [  0.26   0.31   0.32   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [  0.26   0.89   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "instance 6, ep 25, state [0 1 1 1 0 1 0 0]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.39   0.31   0.34   0.3    0.91   0.39   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.39   0.89   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [  0.26   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.39   0.89   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [  0.26   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [  0.26   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [  0.39   0.31   0.34   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 1 1 1 1 0 1 0] state_WI [  0.26   0.31   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.39   0.89   0.34   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "instance 6, ep 26, state [0 1 1 1 1 0 1 0]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [  0.39   0.31   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [  0.26   0.31   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [  0.39   0.89   0.34   0.3    0.38   0.47   0.47 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 1 1 0 0 0 0] state_WI [  0.26   0.31   0.34   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [  0.39   0.31   0.34   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [  0.39   0.89   0.32   0.3    0.91   0.39   0.47 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.26   0.31   0.32   0.3    0.91   0.47   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.47   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.26   0.31   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [  0.39   0.89   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 0 1 1 0 1 1] state_WI [  0.26   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [  0.26   0.89   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [  0.39   0.31   0.34   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.26   0.89   0.32   0.3    0.91   0.39   0.47 -10.  ] sorted [4 1 6]\n",
      "instance 6, ep 27, state [1 1 1 1 0 0 1 0]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [  0.26   0.31   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [1 6 5]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [  0.39   0.89   0.34   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 0 0 1 0 1 1 0] state_WI [  0.26   0.89   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [  0.26   0.89   0.32   0.3    0.38   0.47   0.47 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [  0.26   0.31   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [  0.26   0.89   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [  0.26   0.31   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 4]\n",
      "   state [1 0 0 1 1 1 1 0] state_WI [  0.26   0.89   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 1 0 0 1 1 0] state_WI [  0.26   0.31   0.34   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [  0.26   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "instance 6, ep 28, state [0 0 1 0 0 1 1 0]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.39   0.89   0.34   0.48   0.91   0.39   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.39   0.89   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [  0.39   0.89   0.32   0.48   0.91   0.47   0.47 -10.  ] sorted [4 1 3]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [  0.26   0.31   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.26   0.89   0.32   0.3    0.91   0.47   0.47 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [  0.39   0.31   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.47 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.39   0.47 -10.  ] sorted [1 3 6]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.39   0.31   0.34   0.3    0.91   0.47   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.39   0.89   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.39   0.89   0.32   0.3    0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.47   0.47 -10.  ] sorted [3 6 5]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.39   0.89   0.34   0.48   0.91   0.47   0.49 -10.  ] sorted [4 1 6]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.39   0.89   0.34   0.48   0.38   0.47   0.47 -10.  ] sorted [1 3 6]\n",
      "instance 6, ep 29, state [0 0 0 0 1 1 1 0]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.39   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.39   0.31   0.32   0.3    0.91   0.39   0.49 -10.  ] sorted [4 6 5]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.39   0.31   0.32   0.3    0.38   0.39   0.47 -10.  ] sorted [6 5 0]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.38   0.39   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [  0.26   0.89   0.32   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [  0.26   0.31   0.32   0.48   0.91   0.47   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [  0.39   0.31   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.39   0.31   0.34   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.39   0.89   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 0 0 0 1 0 1] state_WI [  0.39   0.31   0.32   0.48   0.91   0.39   0.47 -10.  ] sorted [4 3 6]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.39   0.89   0.32   0.48   0.38   0.47   0.49 -10.  ] sorted [1 6 3]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [  0.26   0.31   0.34   0.48   0.38   0.47   0.49 -10.  ] sorted [6 3 5]\n",
      "   state [1 0 0 1 1 1 1 0] state_WI [  0.26   0.89   0.32   0.3    0.38   0.39   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [  0.39   0.31   0.34   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [  0.26   0.31   0.32   0.48   0.91   0.39   0.49 -10.  ] sorted [4 6 3]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [  0.26   0.89   0.34   0.3    0.38   0.47   0.49 -10.  ] sorted [1 6 5]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [  0.39   0.31   0.34   0.3    0.38   0.39   0.49 -10.  ] sorted [6 5 0]\n",
      "first state [1 0 1 1 1 1 1 0]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.05   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 1 1 0 0 1] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 1 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.05   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.7   -0.15   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [-10.    -0.15   0.4    0.29   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.29   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 1 1 0 1 1] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.29  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "instance 7, ep 1, state [0 0 1 0 1 1 1 1]\n",
      "   state [0 0 1 0 1 1 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.05   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.7   -0.04   0.59   0.32   0.33   0.05   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [ 0.7  -0.04  0.4   0.29  0.66  0.14  0.09  0.53] sorted [0 4 7]\n",
      "   state [1 0 0 1 1 0 0 1] state_WI [-10.    -0.04   0.59   0.29   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "instance 7, ep 2, state [0 1 1 0 0 1 1 1]\n",
      "   state [0 1 1 0 0 1 1 1] state_WI [  0.7   -0.15   0.4    0.32   0.66   0.05   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [-10.    -0.15   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [ 0.7  -0.04  0.4   0.29  0.66  0.14  0.2   0.53] sorted [0 4 7]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.7   -0.04   0.59   0.29   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09   0.53] sorted [2 7 4]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [ 0.7  -0.15  0.4   0.32  0.66  0.14  0.2   0.53] sorted [0 4 7]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.7   -0.04   0.59   0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [-10.    -0.04   0.4    0.29   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "instance 7, ep 3, state [1 1 1 0 0 0 1 1]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [-10.    -0.15   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [ 0.7  -0.15  0.4   0.29  0.66  0.14  0.2   0.53] sorted [0 4 7]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [-10.    -0.04   0.59   0.29   0.33   0.14   0.2    0.53] sorted [2 7 4]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2    0.53] sorted [2 7 4]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.29   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 1 1 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.29  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.7   -0.04   0.4    0.29   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [ 0.7  -0.04  0.59  0.29  0.66  0.14  0.2   0.53] sorted [0 4 2]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.09  0.53] sorted [0 4 7]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.2   0.53] sorted [0 2 7]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.2   0.53] sorted [0 4 7]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [-10.    -0.04   0.59   0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "instance 7, ep 4, state [1 0 1 1 1 1 0 1]\n",
      "   state [1 0 1 1 1 1 0 1] state_WI [-10.    -0.04   0.4    0.29   0.33   0.05   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.7   -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [-10.    -0.15   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [-10.    -0.04   0.4    0.29   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.29  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.05   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [-10.    -0.04   0.4    0.29   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.05  0.09  0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 0 1 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.05   0.2  -10.  ] sorted [0 4 2]\n",
      "instance 7, ep 5, state [0 0 0 1 1 1 1 1]\n",
      "   state [0 0 0 1 1 1 1 1] state_WI [  0.7   -0.04   0.59   0.29   0.33   0.05   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.05  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [ 0.7  -0.04  0.4   0.29  0.66  0.14  0.09  0.53] sorted [0 4 7]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09   0.53] sorted [2 7 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.2   0.53] sorted [0 2 7]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.09  0.53] sorted [0 4 7]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.7   -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2    0.53] sorted [2 7 4]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "instance 7, ep 6, state [1 0 0 0 0 0 0 0]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [-10.    -0.04   0.59   0.32   0.66   0.14   0.2    0.53] sorted [4 2 7]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.7   -0.15   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.2   0.53] sorted [0 4 7]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09   0.53] sorted [2 7 4]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2    0.53] sorted [2 7 4]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [-10.    -0.04   0.59   0.32   0.66   0.14   0.2    0.53] sorted [4 2 7]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 1 1 0 0 1] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.29  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "instance 7, ep 7, state [1 0 0 0 1 0 0 1]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.09  0.53] sorted [0 2 7]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.29   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [-10.    -0.04   0.59   0.29   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [1 1 1 1 0 0 1 1] state_WI [-10.    -0.15   0.4    0.29   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.7   -0.04   0.59   0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [-10.    -0.04   0.4    0.29   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.2   0.53] sorted [0 2 7]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [-10.    -0.04   0.4    0.29   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 1 0 0 0 1] state_WI [-10.    -0.04   0.4    0.29   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [-10.    -0.04   0.59   0.29   0.66   0.14   0.2    0.53] sorted [4 2 7]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "instance 7, ep 8, state [0 0 0 0 0 0 1 1]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.7   -0.04   0.59   0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 1 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.05   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.2   0.53] sorted [0 4 7]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.2   0.53] sorted [0 2 7]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [ 0.7  -0.04  0.59  0.32  0.66  0.14  0.2   0.53] sorted [0 4 2]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.09  0.53] sorted [0 4 7]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "instance 7, ep 9, state [1 0 1 0 0 1 0 0]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.05   0.2    0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [  0.7   -0.04   0.59   0.32   0.66   0.05   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.05   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09   0.53] sorted [2 7 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.7   -0.15   0.59   0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.7   -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 1 1 0 1 0 0 1] state_WI [  0.7   -0.15   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "instance 7, ep 10, state [1 1 0 1 1 0 0 0]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [-10.    -0.15   0.59   0.29   0.33   0.14   0.2    0.53] sorted [2 7 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [-10.    -0.04   0.59   0.32   0.66   0.14   0.2    0.53] sorted [4 2 7]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.2   0.53] sorted [0 2 7]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2    0.53] sorted [2 7 4]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 1 1 0 0 1] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.2   0.53] sorted [0 2 7]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [-10.    -0.04   0.59   0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [-10.    -0.04   0.4    0.29   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "instance 7, ep 11, state [0 0 1 1 1 0 1 1]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.29   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.7   -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [-10.    -0.04   0.59   0.32   0.66   0.14   0.09   0.53] sorted [4 2 7]\n",
      "   state [1 0 1 0 1 1 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.05   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 1 1 1 1 1] state_WI [  0.7   -0.04   0.4    0.29   0.33   0.05   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.29   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [-10.    -0.04   0.4    0.29   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.09  0.53] sorted [0 4 7]\n",
      "instance 7, ep 12, state [1 0 1 0 0 0 1 1]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [-10.    -0.04   0.59   0.32   0.66   0.14   0.2    0.53] sorted [4 2 7]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.2   0.53] sorted [0 2 7]\n",
      "instance 7, ep 13, state [0 0 0 0 0 0 1 0]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [ 0.7  -0.04  0.59  0.32  0.66  0.14  0.09  0.53] sorted [0 4 2]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.05  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [-10.    -0.15   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 1 1 0 1 1 0 1] state_WI [-10.    -0.15   0.4    0.32   0.33   0.05   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.29   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 1 1 0 1 1] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.7   -0.04   0.59   0.29   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.2   0.53] sorted [0 4 7]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [ 0.7  -0.15  0.4   0.32  0.66  0.14  0.2   0.53] sorted [0 4 7]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "instance 7, ep 14, state [0 0 1 1 1 0 1 0]\n",
      "   state [0 0 1 1 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.29  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.09  0.53] sorted [0 4 7]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [ 0.7  -0.15  0.4   0.32  0.66  0.14  0.2   0.53] sorted [0 4 7]\n",
      "   state [1 1 1 0 0 0 1 0] state_WI [-10.    -0.15   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.29  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 1 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.05   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 1 1 1 0 1 1] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.29   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 1 0 0 1 0 0 1] state_WI [-10.    -0.15   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.7   -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "instance 7, ep 15, state [1 1 1 1 1 0 1 0]\n",
      "   state [1 1 1 1 1 0 1 0] state_WI [-10.    -0.15   0.4    0.29   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.05   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [ 0.7  -0.15  0.4   0.29  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 1 1 0 0 1] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "instance 7, ep 16, state [1 0 0 0 0 0 1 0]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [-10.    -0.04   0.59   0.32   0.66   0.14   0.09   0.53] sorted [4 2 7]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [1 1 1 0 1 1 1 0] state_WI [-10.    -0.15   0.4    0.32   0.33   0.05   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [-10.    -0.15   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [-10.    -0.15   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 1 1 0 1 1] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.7   -0.04   0.59   0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "instance 7, ep 17, state [0 1 0 1 1 1 1 0]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [ 0.7  -0.15  0.59  0.29  0.33  0.05  0.09  0.53] sorted [0 2 7]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09   0.53] sorted [2 7 4]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.09  0.53] sorted [0 4 7]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [ 0.7  -0.04  0.59  0.32  0.66  0.05  0.09  0.53] sorted [0 4 2]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.05   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.29   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.29   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [-10.    -0.15   0.4    0.29   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.09  0.53] sorted [0 4 7]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [-10.    -0.04   0.59   0.32   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.7   -0.04   0.59   0.32   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "instance 7, ep 18, state [1 0 0 1 0 1 1 1]\n",
      "   state [1 0 0 1 0 1 1 1] state_WI [-10.    -0.04   0.59   0.29   0.66   0.05   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.7   -0.04   0.4    0.29   0.66   0.05   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.7   -0.04   0.59   0.32   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [1 1 0 0 1 0 0 1] state_WI [-10.    -0.15   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2    0.53] sorted [2 7 4]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.09  0.53] sorted [0 4 7]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.2   0.53] sorted [0 2 7]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [-10.    -0.04   0.59   0.32   0.66   0.14   0.09   0.53] sorted [4 2 7]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [ 0.7  -0.15  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [ 0.7  -0.15  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [-10.    -0.04   0.59   0.32   0.66   0.05   0.09 -10.  ] sorted [4 2 3]\n",
      "instance 7, ep 19, state [1 0 0 1 0 1 1 1]\n",
      "   state [1 0 0 1 0 1 1 1] state_WI [-10.    -0.04   0.59   0.29   0.66   0.05   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.09  0.53] sorted [0 2 7]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 1 1 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.29  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [-10.    -0.15   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.7   -0.04   0.59   0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.7   -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "instance 7, ep 20, state [0 0 0 0 1 0 0 0]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.2   0.53] sorted [0 2 7]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [ 0.7  -0.04  0.4   0.29  0.33  0.05  0.09  0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.09  0.53] sorted [0 2 7]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.2   0.53] sorted [0 2 7]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.2   0.53] sorted [0 4 7]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [-10.    -0.04   0.59   0.29   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.05  0.09  0.53] sorted [0 2 7]\n",
      "   state [0 0 0 1 0 1 1 1] state_WI [  0.7   -0.04   0.59   0.29   0.66   0.05   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 1 1 0 0 1] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.7   -0.04   0.59   0.29   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [-10.    -0.04   0.59   0.32   0.66   0.14   0.09   0.53] sorted [4 2 7]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "instance 7, ep 21, state [1 1 0 0 0 0 1 1]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [-10.    -0.15   0.59   0.32   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2    0.53] sorted [2 7 4]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09   0.53] sorted [2 7 4]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.09  0.53] sorted [0 2 7]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.2   0.53] sorted [0 4 7]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [ 0.7  -0.15  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.05  0.2   0.53] sorted [0 4 7]\n",
      "instance 7, ep 22, state [0 0 1 0 1 0 0 0]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.2   0.53] sorted [0 4 7]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.29  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 1 1 0 0 1] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.05   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.29  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.2   0.53] sorted [0 2 7]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [-10.    -0.04   0.59   0.32   0.66   0.14   0.09   0.53] sorted [4 2 7]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2    0.53] sorted [2 7 4]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [-10.    -0.15   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "instance 7, ep 23, state [1 1 0 0 0 0 0 0]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [-10.    -0.15   0.59   0.32   0.66   0.14   0.2    0.53] sorted [4 2 7]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.7   -0.15   0.59   0.29   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.7   -0.04   0.4    0.29   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [ 0.7  -0.15  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [ 0.7  -0.15  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [ 0.7  -0.04  0.4   0.29  0.66  0.14  0.09  0.53] sorted [0 4 7]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "instance 7, ep 24, state [1 0 0 1 0 1 0 1]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [-10.    -0.04   0.59   0.29   0.66   0.05   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [-10.    -0.04   0.4    0.29   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.7   -0.04   0.59   0.29   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 1 1 0 1 1] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 0 1 1 0 1 0] state_WI [-10.    -0.04   0.59   0.29   0.33   0.14   0.09   0.53] sorted [2 7 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 1 1 0 1 1] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 1 0 1 0 0] state_WI [-10.    -0.04   0.4    0.29   0.66   0.05   0.2    0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [ 0.7  -0.04  0.4   0.29  0.66  0.14  0.2   0.53] sorted [0 4 7]\n",
      "   state [1 0 1 1 1 0 1 1] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.29   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [ 0.7  -0.04  0.4   0.29  0.66  0.05  0.09  0.53] sorted [0 4 7]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.29  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "instance 7, ep 25, state [1 1 1 0 1 0 0 0]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [-10.    -0.15   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [ 0.7  -0.15  0.59  0.32  0.33  0.14  0.2   0.53] sorted [0 2 7]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.7   -0.04   0.59   0.32   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2    0.53] sorted [2 7 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 1 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.29  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.29   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [ 0.7  -0.04  0.4   0.29  0.33  0.05  0.09  0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "instance 7, ep 26, state [1 0 1 1 1 1 0 0]\n",
      "   state [1 0 1 1 1 1 0 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.05   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [ 0.7  -0.15  0.4   0.29  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [ 0.7  -0.15  0.4   0.29  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 1 0 0 1 0] state_WI [-10.    -0.04   0.4    0.29   0.66   0.14   0.09   0.53] sorted [4 7 2]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.05   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 1 1 1 1 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.05   0.09   0.53] sorted [7 2 4]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.09  0.53] sorted [0 4 7]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.7   -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.09  0.53] sorted [0 2 7]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.09 -10.  ] sorted [0 4 2]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 1 0 0 0 1] state_WI [-10.    -0.04   0.4    0.29   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "instance 7, ep 27, state [0 0 0 0 0 1 1 0]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [ 0.7  -0.04  0.59  0.32  0.66  0.05  0.09  0.53] sorted [0 4 2]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.7   -0.04   0.59   0.32   0.33   0.05   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [ 0.7  -0.04  0.59  0.32  0.33  0.14  0.2   0.53] sorted [0 2 7]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.09  0.53] sorted [0 4 7]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [ 0.7  -0.15  0.4   0.32  0.66  0.14  0.2   0.53] sorted [0 4 7]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09   0.53] sorted [2 7 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.7   -0.04   0.59   0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.29  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.2   0.53] sorted [0 4 7]\n",
      "instance 7, ep 28, state [1 0 0 1 0 0 1 1]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [-10.    -0.04   0.59   0.29   0.66   0.14   0.09 -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [  0.7   -0.04   0.4    0.29   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [-10.    -0.04   0.4    0.29   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 1 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.05   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 1 1 0 1 0 0 1] state_WI [  0.7   -0.15   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.7   -0.04   0.59   0.32   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [-10.    -0.04   0.59   0.32   0.66   0.14   0.2    0.53] sorted [4 2 7]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "instance 7, ep 29, state [1 1 1 0 0 0 0 1]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [-10.    -0.15   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.66   0.14   0.2  -10.  ] sorted [0 4 2]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09   0.53] sorted [2 7 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.2   0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.66  0.14  0.09  0.53] sorted [0 4 7]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [-10.    -0.04   0.59   0.32   0.66   0.14   0.2  -10.  ] sorted [4 2 3]\n",
      "   state [1 0 0 0 1 0 1 0] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09   0.53] sorted [2 7 4]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.14  0.09  0.53] sorted [0 7 2]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.7   -0.15   0.4    0.32   0.33   0.14   0.09 -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.66   0.14   0.2    0.53] sorted [4 7 2]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2    0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 0 0 1] state_WI [  0.7   -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [0 2 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.09   0.53] sorted [7 2 4]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [ 0.7  -0.04  0.4   0.32  0.33  0.05  0.09  0.53] sorted [0 7 2]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "   state [1 0 1 0 1 1 1 1] state_WI [-10.    -0.04   0.4    0.32   0.33   0.05   0.09 -10.  ] sorted [2 4 3]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [-10.    -0.04   0.59   0.32   0.33   0.14   0.2  -10.  ] sorted [2 4 3]\n",
      "first state [1 0 0 1 0 1 0 0]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [  0.12   0.44 -10.     0.3    0.67 -10.     0.53   0.83] sorted [7 4 6]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [  0.12   0.44 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34 -10.     0.83] sorted [3 7 4]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.15   0.44 -10.     0.95   0.42 -10.     0.53   0.28] sorted [3 6 1]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [  0.12   0.44 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [1 0 0 1 0 0 1 1] state_WI [  0.12   0.44 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "instance 8, ep 1, state [1 1 1 1 0 0 1 1]\n",
      "   state [1 1 1 1 0 0 1 1] state_WI [  0.12   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [  0.12   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [  0.12   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [  0.12   0.43 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.12   0.43 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67 -10.     0.53   0.83] sorted [7 4 6]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.15   0.44 -10.     0.95   0.42 -10.     0.53   0.28] sorted [3 6 1]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67 -10.     0.53   0.28] sorted [4 6 1]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.15   0.44 -10.     0.95   0.42 -10.     0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67 -10.     0.53   0.83] sorted [7 4 6]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 1 0 1 1 1 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.     0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "instance 8, ep 2, state [0 1 0 0 0 1 1 0]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.15   0.43 -10.     0.95   0.67 -10.   -10.     0.83] sorted [3 7 4]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 1 1 1 1 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.     0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42 -10.   -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "instance 8, ep 3, state [1 0 0 0 0 0 1 1]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [  0.12   0.44 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.12   0.44 -10.     0.95   0.67   0.34   0.53   0.83] sorted [3 7 4]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.15   0.43 -10.     0.95   0.67 -10.     0.53   0.83] sorted [3 7 4]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34 -10.     0.83] sorted [3 7 4]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [  0.12   0.43 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "instance 8, ep 4, state [1 0 0 0 0 1 0 1]\n",
      "   state [1 0 0 0 0 1 0 1] state_WI [  0.12   0.44 -10.     0.95   0.67 -10.     0.53   0.28] sorted [3 4 6]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.15   0.44 -10.     0.95   0.67 -10.   -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 0 0 0 1 0 1] state_WI [  0.15   0.43 -10.     0.95   0.67 -10.     0.53   0.28] sorted [3 4 6]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.   -10.     0.28] sorted [1 4 3]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [  0.12   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 1 1 1 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.     0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "instance 8, ep 5, state [1 0 1 1 1 1 0 0]\n",
      "   state [1 0 1 1 1 1 0 0] state_WI [  0.12   0.44 -10.     0.3    0.42 -10.     0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67 -10.     0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67 -10.     0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [1 0 1 1 0 0 1 1] state_WI [  0.12   0.44 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.   -10.     0.28] sorted [1 4 3]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [  0.12   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "instance 8, ep 6, state [0 0 1 0 1 1 0 0]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.15   0.44 -10.     0.95   0.42 -10.     0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.12   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.15   0.43 -10.     0.95   0.67 -10.   -10.     0.28] sorted [3 4 1]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34   0.53   0.83] sorted [3 7 4]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [  0.12   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [1 0 0 1 1 0 1 1] state_WI [  0.12   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "instance 8, ep 7, state [1 1 1 0 0 0 0 1]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [  0.12   0.43 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42 -10.   -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 1 0 1 1 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42 -10.     0.53   0.83] sorted [3 7 6]\n",
      "   state [0 1 1 1 1 1 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.     0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42 -10.   -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [  0.15   0.44 -10.     0.95   0.42 -10.     0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "instance 8, ep 8, state [1 1 1 1 0 0 1 0]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [  0.12   0.43 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [  0.12   0.44 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 1 1 0 1 1 0] state_WI [  0.15   0.43 -10.     0.3    0.67 -10.   -10.     0.83] sorted [7 4 1]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.   -10.     0.28] sorted [1 4 3]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.12   0.43 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "instance 8, ep 9, state [1 1 0 1 1 1 1 1]\n",
      "   state [1 1 0 1 1 1 1 1] state_WI [  0.12   0.43 -10.     0.3    0.42 -10.   -10.     0.28] sorted [1 4 3]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.   -10.     0.28] sorted [1 4 3]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [  0.12   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.     0.53   0.83] sorted [7 6 1]\n",
      "   state [1 1 0 0 1 1 0 1] state_WI [  0.12   0.43 -10.     0.95   0.42 -10.     0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34   0.53   0.83] sorted [3 7 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "instance 8, ep 10, state [0 0 1 1 0 0 1 1]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42 -10.   -10.     0.83] sorted [7 1 4]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42 -10.   -10.     0.83] sorted [7 1 4]\n",
      "   state [0 0 1 1 1 1 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42 -10.   -10.     0.28] sorted [1 4 3]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [1 1 0 1 1 0 0 0] state_WI [  0.12   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67 -10.   -10.     0.28] sorted [4 1 3]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [1 1 0 1 1 1 0 1] state_WI [  0.12   0.43 -10.     0.3    0.42 -10.     0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "instance 8, ep 11, state [1 1 0 0 1 0 0 0]\n",
      "   state [1 1 0 0 1 0 0 0] state_WI [  0.12   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34 -10.     0.83] sorted [3 7 4]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 0 1 1 1 1 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42 -10.     0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "instance 8, ep 12, state [1 1 0 0 1 1 0 0]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.12   0.43 -10.     0.95   0.42 -10.     0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42 -10.     0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [1 1 1 1 1 0 0 0] state_WI [  0.12   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 1 0 1 1 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42 -10.   -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 1 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "instance 8, ep 13, state [0 1 0 0 1 1 0 1]\n",
      "   state [0 1 0 0 1 1 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42 -10.     0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [  0.15   0.43 -10.     0.95   0.67 -10.     0.53   0.83] sorted [3 7 4]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67 -10.     0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.15   0.43 -10.     0.95   0.67 -10.   -10.     0.83] sorted [3 7 4]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [  0.12   0.44 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 0 1 1 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42 -10.   -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 0 1 1 1 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 1 1 1 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42 -10.     0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "instance 8, ep 14, state [0 1 0 1 0 1 1 1]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67 -10.   -10.     0.28] sorted [4 1 3]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [  0.12   0.44 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [  0.12   0.43 -10.     0.95   0.42 -10.     0.53   0.83] sorted [3 7 6]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.12   0.44 -10.     0.95   0.67   0.34 -10.     0.83] sorted [3 7 4]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [  0.12   0.44 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [  0.12   0.44 -10.     0.95   0.42 -10.     0.53   0.28] sorted [3 6 1]\n",
      "   state [1 0 0 1 0 1 1 1] state_WI [  0.12   0.44 -10.     0.3    0.67 -10.   -10.     0.28] sorted [4 1 3]\n",
      "instance 8, ep 15, state [1 1 0 0 1 0 1 1]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [  0.12   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 1 1 0 1 1 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42 -10.   -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 1 1 1 1 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.     0.53   0.83] sorted [7 6 1]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [  0.12   0.43 -10.     0.95   0.67   0.34   0.53   0.83] sorted [3 7 4]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [  0.12   0.43 -10.     0.95   0.67   0.34   0.53   0.83] sorted [3 7 4]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [  0.12   0.43 -10.     0.95   0.67 -10.     0.53   0.28] sorted [3 4 6]\n",
      "instance 8, ep 16, state [0 1 0 1 0 0 1 1]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34   0.53   0.83] sorted [3 7 4]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [1 1 1 1 1 0 1 0] state_WI [  0.12   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [1 1 1 1 1 0 0 1] state_WI [  0.12   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [  0.12   0.43 -10.     0.95   0.67   0.34 -10.     0.83] sorted [3 7 4]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.15   0.44 -10.     0.95   0.42 -10.     0.53   0.28] sorted [3 6 1]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34 -10.     0.83] sorted [3 7 4]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "instance 8, ep 17, state [1 1 0 1 0 1 1 1]\n",
      "   state [1 1 0 1 0 1 1 1] state_WI [  0.12   0.43 -10.     0.3    0.67 -10.   -10.     0.28] sorted [4 1 3]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 1 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [1 1 1 0 1 0 0 1] state_WI [  0.12   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 1 1 1 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42 -10.   -10.     0.28] sorted [1 4 3]\n",
      "instance 8, ep 18, state [1 0 1 0 1 0 1 1]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [  0.12   0.44 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34   0.53   0.83] sorted [3 7 4]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.     0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [  0.12   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [  0.12   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [  0.12   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34 -10.     0.83] sorted [3 7 4]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [  0.12   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [1 1 0 0 1 0 0 1] state_WI [  0.12   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "instance 8, ep 19, state [0 0 1 0 0 0 0 1]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 0 1 1 1 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.15   0.43 -10.     0.95   0.67 -10.   -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67 -10.     0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42 -10.   -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 0 1 1 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42 -10.   -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 0 1 1 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42 -10.   -10.     0.28] sorted [3 1 4]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.12   0.44 -10.     0.95   0.67   0.34   0.53   0.83] sorted [3 7 4]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42 -10.     0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [  0.12   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "instance 8, ep 20, state [1 0 0 0 0 0 0 0]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [  0.12   0.44 -10.     0.95   0.67   0.34   0.53   0.83] sorted [3 7 4]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [1 0 0 1 1 0 0 0] state_WI [  0.12   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [  0.12   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [  0.12   0.44 -10.     0.95   0.67   0.34 -10.     0.83] sorted [3 7 4]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.12   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67 -10.     0.53   0.83] sorted [7 4 6]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [  0.12   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42 -10.   -10.     0.28] sorted [3 1 4]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67 -10.     0.53   0.28] sorted [4 6 1]\n",
      "instance 8, ep 21, state [1 0 1 1 1 1 1 1]\n",
      "   state [1 0 1 1 1 1 1 1] state_WI [  0.12   0.44 -10.     0.3    0.42 -10.   -10.     0.28] sorted [1 4 3]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [  0.12   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 1 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42 -10.   -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 1 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "instance 8, ep 22, state [1 1 1 1 0 0 0 1]\n",
      "   state [1 1 1 1 0 0 0 1] state_WI [  0.12   0.43 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [  0.12   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [1 1 1 1 1 1 1 1] state_WI [  0.12   0.43 -10.     0.3    0.42 -10.   -10.     0.28] sorted [1 4 3]\n",
      "   state [0 1 1 1 1 1 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.     0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [  0.12   0.44 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 0 0 1 0 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 1 1 1 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42 -10.     0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42 -10.   -10.     0.83] sorted [3 7 1]\n",
      "instance 8, ep 23, state [1 1 1 0 0 1 1 1]\n",
      "   state [1 1 1 0 0 1 1 1] state_WI [  0.12   0.43 -10.     0.95   0.67 -10.   -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 0 0 1 0 1 1 1] state_WI [  0.15   0.44 -10.     0.3    0.67 -10.   -10.     0.28] sorted [4 1 3]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [1 1 0 1 1 1 0 1] state_WI [  0.12   0.43 -10.     0.3    0.42 -10.     0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42 -10.     0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 0 1 1 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42 -10.   -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.15   0.43 -10.     0.95   0.67 -10.     0.53   0.83] sorted [3 7 4]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34 -10.     0.83] sorted [3 7 4]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "instance 8, ep 24, state [0 1 1 1 1 1 0 1]\n",
      "   state [0 1 1 1 1 1 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.     0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 0 0 1 1 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.   -10.     0.28] sorted [1 4 3]\n",
      "   state [1 0 0 1 1 0 0 1] state_WI [  0.12   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [  0.12   0.44 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 1 1 0 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 1 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [1 1 1 1 1 1 0 1] state_WI [  0.12   0.43 -10.     0.3    0.42 -10.     0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "instance 8, ep 25, state [1 1 1 0 0 1 1 1]\n",
      "   state [1 1 1 0 0 1 1 1] state_WI [  0.12   0.43 -10.     0.95   0.67 -10.   -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 1 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67 -10.     0.53   0.83] sorted [7 4 6]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67 -10.   -10.     0.28] sorted [4 1 3]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 1 0 1 1 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42 -10.     0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.15   0.43 -10.     0.3    0.67 -10.   -10.     0.83] sorted [7 4 1]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42 -10.   -10.     0.28] sorted [3 1 4]\n",
      "   state [1 1 1 1 1 0 1 1] state_WI [  0.12   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "instance 8, ep 26, state [0 1 1 1 0 1 1 0]\n",
      "   state [0 1 1 1 0 1 1 0] state_WI [  0.15   0.43 -10.     0.3    0.67 -10.   -10.     0.83] sorted [7 4 1]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 1 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67 -10.     0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.   -10.     0.83] sorted [7 1 4]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [  0.12   0.43 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "instance 8, ep 27, state [1 1 1 0 0 0 0 0]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [  0.12   0.43 -10.     0.95   0.67   0.34   0.53   0.83] sorted [3 7 4]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67 -10.     0.53   0.28] sorted [4 6 1]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [  0.12   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [  0.12   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34   0.53   0.83] sorted [3 7 4]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34 -10.     0.28] sorted [3 4 1]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "instance 8, ep 28, state [1 0 1 1 1 1 1 1]\n",
      "   state [1 0 1 1 1 1 1 1] state_WI [  0.12   0.44 -10.     0.3    0.42 -10.   -10.     0.28] sorted [1 4 3]\n",
      "   state [1 1 1 1 1 0 0 0] state_WI [  0.12   0.43 -10.     0.3    0.42   0.34   0.53   0.83] sorted [7 6 1]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [  0.15   0.44 -10.     0.95   0.42 -10.     0.53   0.28] sorted [3 6 1]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.   -10.     0.28] sorted [1 4 3]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42 -10.   -10.     0.28] sorted [1 4 3]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.42   0.34 -10.     0.83] sorted [3 7 1]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.15   0.43 -10.     0.95   0.67 -10.   -10.     0.83] sorted [3 7 4]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34   0.53   0.28] sorted [3 4 6]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.83] sorted [7 1 4]\n",
      "instance 8, ep 29, state [0 0 1 1 0 1 1 0]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67 -10.   -10.     0.83] sorted [7 4 1]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.15   0.43 -10.     0.95   0.67   0.34 -10.     0.83] sorted [3 7 4]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.15   0.43 -10.     0.3    0.67 -10.   -10.     0.28] sorted [4 1 3]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.28] sorted [3 6 1]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.15   0.44 -10.     0.95   0.42 -10.   -10.     0.28] sorted [3 1 4]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.15   0.44 -10.     0.3    0.42 -10.   -10.     0.83] sorted [7 1 4]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.28] sorted [4 6 1]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [  0.15   0.43 -10.     0.3    0.67   0.34   0.53   0.83] sorted [7 4 6]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [  0.15   0.44 -10.     0.3    0.42   0.34   0.53   0.28] sorted [6 1 4]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.15   0.44 -10.     0.95   0.67   0.34 -10.     0.83] sorted [3 7 4]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.28] sorted [4 1 5]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.15   0.44 -10.     0.3    0.67   0.34 -10.     0.83] sorted [7 4 1]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.15   0.43 -10.     0.3    0.42   0.34 -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34   0.53   0.83] sorted [3 7 6]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.15   0.43 -10.     0.95   0.42   0.34 -10.     0.28] sorted [3 1 4]\n",
      "first state [0 1 0 0 0 0 1 0]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.49   0.17   0.27   0.39   0.47   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [0.49 0.17 0.27 0.39 0.47 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.49   0.72 -10.     0.39   0.47   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4    0.69   0.28] sorted [6 0 4]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [1 1 1 0 0 1 1 0] state_WI [-10.     0.17 -10.     0.39   0.47   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4    0.69   0.28] sorted [6 0 4]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [0.49 0.17 0.27 0.39 0.42 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [1 1 1 0 0 1 1 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.4  -10.     0.28] sorted [4 5 3]\n",
      "   state [1 0 1 1 0 1 0 0] state_WI [-10.     0.72 -10.     0.26   0.47   0.4    0.69   0.67] sorted [1 6 7]\n",
      "   state [0 0 1 0 0 1 0 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.4    0.69   0.28] sorted [1 6 0]\n",
      "   state [0 1 0 0 0 1 0 1] state_WI [0.49 0.17 0.27 0.39 0.47 0.4  0.69 0.28] sorted [6 0 4]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [-10.     0.17 -10.     0.39   0.42   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [0 1 1 0 1 1 0 0] state_WI [  0.49   0.17 -10.     0.39   0.42   0.4    0.69   0.67] sorted [6 7 0]\n",
      "   state [1 1 1 0 1 1 0 0] state_WI [-10.     0.17 -10.     0.39   0.42   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [1 0 0 0 0 0 0 0] state_WI [-10.     0.72   0.27   0.39   0.47   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [0 1 0 0 1 1 1 1] state_WI [  0.49   0.17   0.27   0.39   0.42   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.4    0.69   0.67] sorted [6 7 4]\n",
      "instance 9, ep 1, state [1 1 0 1 1 1 0 0]\n",
      "   state [1 1 0 1 1 1 0 0] state_WI [-10.     0.17   0.27   0.26   0.42   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [  0.49   0.17 -10.     0.26   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52   0.69   0.28] sorted [6 5 0]\n",
      "   state [1 1 0 0 1 1 0 1] state_WI [-10.     0.17   0.27   0.39   0.42   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.49   0.72 -10.     0.39   0.42   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [-10.     0.17 -10.     0.39   0.42   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 0 1 0 0 1 1 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [1 0 0 0 0 1 0 1] state_WI [-10.     0.72   0.27   0.39   0.47   0.4    0.69   0.28] sorted [1 6 4]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [0.49 0.17 0.27 0.39 0.42 0.52 0.69 0.67] sorted [6 7 5]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.49   0.17   0.27   0.26   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [0.49 0.72 0.27 0.26 0.42 0.52 0.69 0.28] sorted [1 6 5]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.49   0.17 -10.     0.26   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 1 0 1 1 1 1 1] state_WI [-10.     0.17   0.27   0.26   0.42   0.4  -10.     0.28] sorted [4 5 7]\n",
      "   state [1 1 1 0 1 1 1 1] state_WI [-10.     0.17 -10.     0.39   0.42   0.4  -10.     0.28] sorted [4 5 3]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [-10.     0.17   0.27   0.26   0.42   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [-10.     0.72 -10.     0.39   0.47   0.4  -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [-10.     0.17   0.27   0.39   0.42   0.52 -10.     0.28] sorted [5 4 3]\n",
      "instance 9, ep 2, state [1 1 1 0 1 0 0 0]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [-10.     0.17 -10.     0.39   0.42   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 1 1 0 1 1 1 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 1 0 0 1 1 0 1] state_WI [0.49 0.17 0.27 0.39 0.42 0.4  0.69 0.28] sorted [6 0 4]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [-10.     0.72   0.27   0.39   0.47   0.52 -10.     0.28] sorted [1 5 4]\n",
      "   state [1 1 0 1 1 1 0 1] state_WI [-10.     0.17   0.27   0.26   0.42   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.49   0.72 -10.     0.26   0.47   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [0 0 1 0 0 1 1 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [1 1 1 0 1 1 0 1] state_WI [-10.     0.17 -10.     0.39   0.42   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [1 1 0 1 1 1 0 0] state_WI [-10.     0.17   0.27   0.26   0.42   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [0 1 0 1 0 1 0 0] state_WI [0.49 0.17 0.27 0.26 0.47 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [1 1 1 0 0 1 1 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.4  -10.     0.28] sorted [4 5 3]\n",
      "   state [0 1 0 0 0 0 0 0] state_WI [0.49 0.17 0.27 0.39 0.47 0.52 0.69 0.67] sorted [6 7 5]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.49   0.17 -10.     0.26   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 1 1 0 1 1 0] state_WI [  0.49   0.17 -10.     0.26   0.47   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [0 0 0 1 0 1 1 0] state_WI [  0.49   0.72   0.27   0.26   0.47   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.49   0.17   0.27   0.39   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [-10.     0.17   0.27   0.39   0.42   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.49   0.72   0.27   0.39   0.42   0.4  -10.     0.67] sorted [1 7 0]\n",
      "instance 9, ep 3, state [1 0 0 1 0 0 0 1]\n",
      "   state [1 0 0 1 0 0 0 1] state_WI [-10.     0.72   0.27   0.26   0.47   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [1 0 0 0 0 0 1 0] state_WI [-10.     0.72   0.27   0.39   0.47   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [0.49 0.17 0.27 0.39 0.42 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [-10.     0.17 -10.     0.26   0.47   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.49   0.72   0.27   0.26   0.42   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [1 1 1 1 0 1 0 1] state_WI [-10.     0.17 -10.     0.26   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [1 1 0 1 1 1 0 0] state_WI [-10.     0.17   0.27   0.26   0.42   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.49   0.72   0.27   0.26   0.42   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.49   0.17   0.27   0.39   0.47   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.52 -10.     0.28] sorted [1 5 0]\n",
      "   state [0 0 1 0 0 1 1 0] state_WI [  0.49   0.72 -10.     0.39   0.47   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [0.49 0.72 0.27 0.39 0.42 0.4  0.69 0.28] sorted [1 6 0]\n",
      "   state [0 1 1 0 1 1 1 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [0.49 0.72 0.27 0.39 0.42 0.52 0.69 0.28] sorted [1 6 5]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.49   0.72   0.27   0.39   0.42   0.52 -10.     0.28] sorted [1 5 0]\n",
      "   state [1 0 0 1 0 1 0 0] state_WI [-10.     0.72   0.27   0.26   0.47   0.4    0.69   0.67] sorted [1 6 7]\n",
      "instance 9, ep 4, state [1 0 1 1 0 1 1 1]\n",
      "   state [1 0 1 1 0 1 1 1] state_WI [-10.     0.72 -10.     0.26   0.47   0.4  -10.     0.28] sorted [1 4 5]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.49   0.17   0.27   0.39   0.47   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [1 1 0 0 1 1 0 1] state_WI [-10.     0.17   0.27   0.39   0.42   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [1 1 1 0 1 1 1 0] state_WI [-10.     0.17 -10.     0.39   0.42   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [0.49 0.72 0.27 0.39 0.42 0.4  0.69 0.28] sorted [1 6 0]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [-10.     0.72   0.27   0.39   0.42   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [1 1 0 1 0 0 0 0] state_WI [-10.     0.17   0.27   0.26   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [-10.     0.17   0.27   0.39   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [1 0 1 0 1 1 0 0] state_WI [-10.     0.72 -10.     0.39   0.42   0.4    0.69   0.67] sorted [1 6 7]\n",
      "   state [1 0 1 0 0 1 1 0] state_WI [-10.     0.72 -10.     0.39   0.47   0.4  -10.     0.67] sorted [1 7 4]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [-10.     0.72   0.27   0.39   0.42   0.52 -10.     0.28] sorted [1 5 4]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [0.49 0.17 0.27 0.39 0.47 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [1 1 0 0 0 1 1 1] state_WI [-10.     0.17   0.27   0.39   0.47   0.4  -10.     0.28] sorted [4 5 3]\n",
      "   state [1 0 1 1 0 0 0 0] state_WI [-10.     0.72 -10.     0.26   0.47   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [-10.     0.17   0.27   0.39   0.42   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [-10.     0.17   0.27   0.39   0.42   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.52 -10.     0.67] sorted [7 5 4]\n",
      "instance 9, ep 5, state [0 1 1 0 0 0 0 1]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52   0.69   0.28] sorted [6 5 0]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.49   0.17   0.27   0.39   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [1 0 0 1 1 1 1 0] state_WI [-10.     0.72   0.27   0.26   0.42   0.4  -10.     0.67] sorted [1 7 4]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 1 0 0 1 0 0 1] state_WI [-10.     0.17   0.27   0.39   0.42   0.52   0.69   0.28] sorted [6 5 4]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [0.49 0.17 0.27 0.39 0.42 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.49   0.72 -10.     0.39   0.42   0.4    0.69   0.67] sorted [1 6 7]\n",
      "   state [0 0 1 0 1 1 0 1] state_WI [  0.49   0.72 -10.     0.39   0.42   0.4    0.69   0.28] sorted [1 6 0]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.     0.72 -10.     0.39   0.47   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 0 1 0 0 1 0 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.4    0.69   0.28] sorted [1 6 0]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4    0.69   0.28] sorted [6 0 4]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [-10.     0.17   0.27   0.39   0.47   0.52 -10.     0.28] sorted [5 4 3]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [1 1 1 0 1 0 1 0] state_WI [-10.     0.17 -10.     0.39   0.42   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [1 0 1 1 1 0 0 1] state_WI [-10.     0.72 -10.     0.26   0.42   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [0.49 0.72 0.27 0.26 0.47 0.4  0.69 0.28] sorted [1 6 0]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.49   0.17   0.27   0.39   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [  0.49   0.17 -10.     0.26   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [0.49 0.17 0.27 0.26 0.47 0.52 0.69 0.28] sorted [6 5 0]\n",
      "instance 9, ep 6, state [0 0 1 0 1 0 0 0]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.49   0.72 -10.     0.39   0.42   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [0.49 0.17 0.27 0.26 0.47 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [0 1 1 0 0 1 1 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.49   0.17   0.27   0.26   0.42   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [0.49 0.17 0.27 0.39 0.47 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.52 -10.     0.28] sorted [5 4 3]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [-10.     0.72 -10.     0.39   0.47   0.4    0.69   0.28] sorted [1 6 4]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [0.49 0.17 0.27 0.39 0.47 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [0 1 0 0 0 1 0 1] state_WI [0.49 0.17 0.27 0.39 0.47 0.4  0.69 0.28] sorted [6 0 4]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4    0.69   0.28] sorted [6 0 4]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [0.49 0.17 0.27 0.39 0.47 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [1 0 1 0 0 0 1 1] state_WI [-10.     0.72 -10.     0.39   0.47   0.52 -10.     0.28] sorted [1 5 4]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [0.49 0.17 0.27 0.39 0.42 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [1 1 0 0 1 0 0 0] state_WI [-10.     0.17   0.27   0.39   0.42   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [1 1 1 0 1 0 0 1] state_WI [-10.     0.17 -10.     0.39   0.42   0.52   0.69   0.28] sorted [6 5 4]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [  0.49   0.17 -10.     0.39   0.42   0.52   0.69   0.67] sorted [6 7 5]\n",
      "instance 9, ep 7, state [0 0 1 1 0 1 1 1]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.49   0.72 -10.     0.26   0.47   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [-10.     0.17   0.27   0.26   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.49   0.17 -10.     0.26   0.47   0.4    0.69   0.67] sorted [6 7 0]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4    0.69   0.67] sorted [6 7 0]\n",
      "   state [0 1 0 1 1 1 0 1] state_WI [0.49 0.17 0.27 0.26 0.42 0.4  0.69 0.28] sorted [6 0 4]\n",
      "   state [1 0 0 1 1 0 1 1] state_WI [-10.     0.72   0.27   0.26   0.42   0.52 -10.     0.28] sorted [1 5 4]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.49   0.72 -10.     0.39   0.42   0.4    0.69   0.67] sorted [1 6 7]\n",
      "   state [0 1 1 0 1 1 1 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [-10.     0.17   0.27   0.39   0.42   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [0.49 0.72 0.27 0.39 0.42 0.52 0.69 0.28] sorted [1 6 5]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.49   0.17   0.27   0.39   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 1 1 0 1 1 0 0] state_WI [  0.49   0.17 -10.     0.39   0.42   0.4    0.69   0.67] sorted [6 7 0]\n",
      "   state [1 1 1 0 0 0 1 0] state_WI [-10.     0.17 -10.     0.39   0.47   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [0 0 1 1 1 1 0 1] state_WI [  0.49   0.72 -10.     0.26   0.42   0.4    0.69   0.28] sorted [1 6 0]\n",
      "   state [1 1 1 1 1 1 0 1] state_WI [-10.     0.17 -10.     0.26   0.42   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [1 1 0 1 1 0 1 1] state_WI [-10.     0.17   0.27   0.26   0.42   0.52 -10.     0.28] sorted [5 4 7]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.49   0.17 -10.     0.26   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "instance 9, ep 8, state [0 0 0 1 1 0 0 1]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [0.49 0.72 0.27 0.26 0.42 0.52 0.69 0.28] sorted [1 6 5]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.49   0.72   0.27   0.39   0.42   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.52 -10.     0.28] sorted [5 4 3]\n",
      "   state [0 0 0 1 0 1 1 1] state_WI [  0.49   0.72   0.27   0.26   0.47   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [1 0 0 1 1 0 1 1] state_WI [-10.     0.72   0.27   0.26   0.42   0.52 -10.     0.28] sorted [1 5 4]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.49   0.17   0.27   0.39   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 0 0 1 1 0 1] state_WI [0.49 0.17 0.27 0.39 0.42 0.4  0.69 0.28] sorted [6 0 4]\n",
      "   state [1 0 1 0 0 1 0 1] state_WI [-10.     0.72 -10.     0.39   0.47   0.4    0.69   0.28] sorted [1 6 4]\n",
      "   state [0 0 1 0 0 1 1 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4    0.69   0.67] sorted [6 7 0]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4    0.69   0.28] sorted [6 0 4]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [0.49 0.17 0.27 0.39 0.42 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [1 0 1 0 1 0 0 1] state_WI [-10.     0.72 -10.     0.39   0.42   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [0.49 0.17 0.27 0.39 0.42 0.52 0.69 0.67] sorted [6 7 5]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.49   0.72   0.27   0.39   0.42   0.52 -10.     0.28] sorted [1 5 0]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.49   0.72   0.27   0.39   0.42   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [1 1 1 0 0 1 1 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.4  -10.     0.28] sorted [4 5 3]\n",
      "   state [0 1 1 0 0 1 1 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "instance 9, ep 9, state [1 1 1 0 1 1 0 1]\n",
      "   state [1 1 1 0 1 1 0 1] state_WI [-10.     0.17 -10.     0.39   0.42   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [1 1 1 0 0 1 1 0] state_WI [-10.     0.17 -10.     0.39   0.47   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [1 1 1 0 1 0 0 1] state_WI [-10.     0.17 -10.     0.39   0.42   0.52   0.69   0.28] sorted [6 5 4]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.49   0.17   0.27   0.39   0.42   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.49   0.17 -10.     0.26   0.47   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.     0.72 -10.     0.39   0.47   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.49   0.72   0.27   0.39   0.47   0.52 -10.     0.28] sorted [1 5 0]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.52   0.69   0.28] sorted [6 5 4]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [-10.     0.72 -10.     0.39   0.47   0.4  -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52   0.69   0.28] sorted [6 5 0]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.49   0.72   0.27   0.39   0.42   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.49   0.72   0.27   0.39   0.42   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.49   0.17   0.27   0.39   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.49   0.72   0.27   0.39   0.42   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [0 0 1 0 0 0 1 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.52 -10.     0.28] sorted [1 5 0]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4    0.69   0.28] sorted [6 0 4]\n",
      "instance 9, ep 10, state [1 0 1 1 1 0 0 1]\n",
      "   state [1 0 1 1 1 0 0 1] state_WI [-10.     0.72 -10.     0.26   0.42   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [1 1 0 1 0 0 1 0] state_WI [-10.     0.17   0.27   0.26   0.47   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [1 0 1 1 1 0 1 1] state_WI [-10.     0.72 -10.     0.26   0.42   0.52 -10.     0.28] sorted [1 5 4]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [-10.     0.72 -10.     0.26   0.42   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [0 0 1 1 0 1 1 1] state_WI [  0.49   0.72 -10.     0.26   0.47   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [1 1 0 1 0 1 1 0] state_WI [-10.     0.17   0.27   0.26   0.47   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [-10.     0.72   0.27   0.39   0.42   0.52 -10.     0.28] sorted [1 5 4]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [1 1 1 0 1 1 1 1] state_WI [-10.     0.17 -10.     0.39   0.42   0.4  -10.     0.28] sorted [4 5 3]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.49   0.72   0.27   0.26   0.47   0.52 -10.     0.28] sorted [1 5 0]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.49   0.17   0.27   0.26   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 0 0 1 1 1 1 1] state_WI [-10.     0.72   0.27   0.26   0.42   0.4  -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 1 1 1 1 0 0] state_WI [  0.49   0.17 -10.     0.26   0.42   0.4    0.69   0.67] sorted [6 7 0]\n",
      "   state [1 1 0 0 0 0 0 1] state_WI [-10.     0.17   0.27   0.39   0.47   0.52   0.69   0.28] sorted [6 5 4]\n",
      "   state [0 1 0 1 1 0 1 0] state_WI [  0.49   0.17   0.27   0.26   0.42   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [1 1 1 0 0 1 0 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [0.49 0.72 0.27 0.26 0.42 0.52 0.69 0.67] sorted [1 6 7]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.49   0.17 -10.     0.26   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 0 1 1 1 0 0 0] state_WI [-10.     0.72 -10.     0.26   0.42   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.52 -10.     0.28] sorted [5 4 3]\n",
      "instance 9, ep 11, state [0 1 1 0 1 1 0 1]\n",
      "   state [0 1 1 0 1 1 0 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.4    0.69   0.28] sorted [6 0 4]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [-10.     0.72   0.27   0.39   0.42   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 0 0 0 1 1 0 1] state_WI [0.49 0.72 0.27 0.39 0.42 0.4  0.69 0.28] sorted [1 6 0]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.49   0.17 -10.     0.26   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.49   0.17 -10.     0.26   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [0.49 0.17 0.27 0.39 0.47 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [0.49 0.72 0.27 0.26 0.47 0.52 0.69 0.28] sorted [1 6 5]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [0.49 0.72 0.27 0.39 0.47 0.52 0.69 0.28] sorted [1 6 5]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.49   0.72   0.27   0.39   0.47   0.52 -10.     0.28] sorted [1 5 0]\n",
      "   state [1 0 0 1 0 1 1 1] state_WI [-10.     0.72   0.27   0.26   0.47   0.4  -10.     0.28] sorted [1 4 5]\n",
      "   state [0 1 1 1 1 1 1 0] state_WI [  0.49   0.17 -10.     0.26   0.42   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [  0.49   0.17 -10.     0.26   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [0.49 0.72 0.27 0.26 0.42 0.52 0.69 0.28] sorted [1 6 5]\n",
      "   state [1 1 0 0 0 0 0 1] state_WI [-10.     0.17   0.27   0.39   0.47   0.52   0.69   0.28] sorted [6 5 4]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [0.49 0.17 0.27 0.39 0.42 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.49   0.17   0.27   0.39   0.47   0.52 -10.     0.67] sorted [7 5 0]\n",
      "instance 9, ep 12, state [1 1 1 0 1 1 1 1]\n",
      "   state [1 1 1 0 1 1 1 1] state_WI [-10.     0.17 -10.     0.39   0.42   0.4  -10.     0.28] sorted [4 5 3]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [-10.     0.17 -10.     0.39   0.42   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 0 1 1 0 0 1 1] state_WI [  0.49   0.72 -10.     0.26   0.47   0.52 -10.     0.28] sorted [1 5 0]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.52   0.69   0.28] sorted [6 5 4]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [1 1 1 0 1 1 1 1] state_WI [-10.     0.17 -10.     0.39   0.42   0.4  -10.     0.28] sorted [4 5 3]\n",
      "   state [1 1 0 1 1 0 0 1] state_WI [-10.     0.17   0.27   0.26   0.42   0.52   0.69   0.28] sorted [6 5 4]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.49   0.72 -10.     0.39   0.42   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [-10.     0.17 -10.     0.39   0.42   0.52 -10.     0.28] sorted [5 4 3]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.49   0.17   0.27   0.39   0.42   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [0 1 0 0 1 1 1 1] state_WI [  0.49   0.17   0.27   0.39   0.42   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [-10.     0.17   0.27   0.39   0.42   0.52 -10.     0.28] sorted [5 4 3]\n",
      "   state [0 0 0 0 1 0 1 0] state_WI [  0.49   0.72   0.27   0.39   0.42   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 0 0 0 0 1 1 0] state_WI [  0.49   0.72   0.27   0.39   0.47   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.49   0.17   0.27   0.39   0.47   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.49   0.72   0.27   0.39   0.47   0.52 -10.     0.67] sorted [1 7 5]\n",
      "instance 9, ep 13, state [0 1 0 0 0 1 1 1]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.49   0.17   0.27   0.39   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [0.49 0.72 0.27 0.39 0.47 0.4  0.69 0.28] sorted [1 6 0]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.4    0.69   0.67] sorted [1 6 7]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [0 0 1 1 0 1 1 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [1 0 1 0 0 0 1 0] state_WI [-10.     0.72 -10.     0.39   0.47   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.     0.72 -10.     0.39   0.47   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [-10.     0.17 -10.     0.39   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [1 0 0 0 0 0 0 1] state_WI [-10.     0.72   0.27   0.39   0.47   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.49   0.17   0.27   0.39   0.47   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.49   0.17   0.27   0.26   0.47   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [-10.     0.17   0.27   0.39   0.42   0.52 -10.     0.28] sorted [5 4 3]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.49   0.17   0.27   0.26   0.42   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [0 1 1 0 1 1 0 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.4    0.69   0.28] sorted [6 0 4]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [0.49 0.17 0.27 0.39 0.47 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [0.49 0.72 0.27 0.39 0.47 0.4  0.69 0.28] sorted [1 6 0]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [0.49 0.17 0.27 0.39 0.47 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [1 1 0 0 1 0 0 0] state_WI [-10.     0.17   0.27   0.39   0.42   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.49   0.72 -10.     0.39   0.47   0.4    0.69   0.67] sorted [1 6 7]\n",
      "instance 9, ep 14, state [1 1 1 0 0 0 1 1]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.52 -10.     0.28] sorted [5 4 3]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [0.49 0.17 0.27 0.39 0.42 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 0 1 0 0 0 0 0] state_WI [  0.49   0.72 -10.     0.39   0.47   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52   0.69   0.28] sorted [6 5 0]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 0 0 0 0 1 0 0] state_WI [0.49 0.72 0.27 0.39 0.47 0.4  0.69 0.67] sorted [1 6 7]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.49   0.17   0.27   0.26   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 1 0 1 0 0 0] state_WI [  0.49   0.17 -10.     0.39   0.42   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 0 1 0 1 0 1 1] state_WI [  0.49   0.72 -10.     0.39   0.42   0.52 -10.     0.28] sorted [1 5 0]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.52   0.69   0.28] sorted [6 5 4]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [0.49 0.17 0.27 0.39 0.47 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 1 1 1 1 1 1 0] state_WI [-10.     0.17 -10.     0.26   0.42   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [-10.     0.17   0.27   0.39   0.42   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [1 0 0 1 0 1 0 1] state_WI [-10.     0.72   0.27   0.26   0.47   0.4    0.69   0.28] sorted [1 6 4]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.49   0.72 -10.     0.39   0.42   0.4    0.69   0.67] sorted [1 6 7]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [0.49 0.17 0.27 0.39 0.42 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.49   0.17   0.27   0.26   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "instance 9, ep 15, state [0 0 1 0 1 1 0 0]\n",
      "   state [0 0 1 0 1 1 0 0] state_WI [  0.49   0.72 -10.     0.39   0.42   0.4    0.69   0.67] sorted [1 6 7]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.49   0.72   0.27   0.39   0.42   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [-10.     0.72   0.27   0.39   0.47   0.4  -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 0 1 0 1 0 1] state_WI [0.49 0.72 0.27 0.26 0.47 0.4  0.69 0.28] sorted [1 6 0]\n",
      "   state [1 1 1 1 0 1 1 0] state_WI [-10.     0.17 -10.     0.26   0.47   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [-10.     0.17   0.27   0.26   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [0.49 0.72 0.27 0.39 0.42 0.52 0.69 0.28] sorted [1 6 5]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.49   0.72   0.27   0.39   0.42   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [1 0 0 0 0 1 0 1] state_WI [-10.     0.72   0.27   0.39   0.47   0.4    0.69   0.28] sorted [1 6 4]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.49   0.72   0.27   0.39   0.42   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [0 0 1 0 0 1 0 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.4    0.69   0.28] sorted [1 6 0]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.     0.72 -10.     0.39   0.47   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 0 0 0 0 0 0 1] state_WI [0.49 0.72 0.27 0.39 0.47 0.52 0.69 0.28] sorted [1 6 5]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 1 0 0 1 1 1 0] state_WI [  0.49   0.17   0.27   0.39   0.42   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [1 0 1 0 1 1 0 1] state_WI [-10.     0.72 -10.     0.39   0.42   0.4    0.69   0.28] sorted [1 6 4]\n",
      "   state [0 1 1 0 1 0 1 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 1 0 0 1 1 0 0] state_WI [-10.     0.17   0.27   0.39   0.42   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [0 1 1 0 0 1 1 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [1 0 1 0 1 1 0 1] state_WI [-10.     0.72 -10.     0.39   0.42   0.4    0.69   0.28] sorted [1 6 4]\n",
      "instance 9, ep 16, state [1 1 1 1 0 1 1 1]\n",
      "   state [1 1 1 1 0 1 1 1] state_WI [-10.     0.17 -10.     0.26   0.47   0.4  -10.     0.28] sorted [4 5 7]\n",
      "   state [0 0 1 1 1 1 1 1] state_WI [  0.49   0.72 -10.     0.26   0.42   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [0.49 0.17 0.27 0.26 0.42 0.52 0.69 0.67] sorted [6 7 5]\n",
      "   state [0 0 1 1 1 1 1 0] state_WI [  0.49   0.72 -10.     0.26   0.42   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [1 0 0 1 0 0 0 0] state_WI [-10.     0.72   0.27   0.26   0.47   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [-10.     0.17 -10.     0.26   0.47   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [0 1 1 0 1 0 0 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.52   0.69   0.28] sorted [6 5 0]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [-10.     0.17 -10.     0.39   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 1 0 1 0 0 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.52   0.69   0.28] sorted [6 5 0]\n",
      "   state [1 0 1 1 1 0 1 1] state_WI [-10.     0.72 -10.     0.26   0.42   0.52 -10.     0.28] sorted [1 5 4]\n",
      "   state [1 1 0 0 1 1 1 1] state_WI [-10.     0.17   0.27   0.39   0.42   0.4  -10.     0.28] sorted [4 5 3]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [-10.     0.17 -10.     0.39   0.42   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [1 0 0 1 1 1 0 1] state_WI [-10.     0.72   0.27   0.26   0.42   0.4    0.69   0.28] sorted [1 6 4]\n",
      "   state [0 1 0 1 1 0 0 0] state_WI [0.49 0.17 0.27 0.26 0.42 0.52 0.69 0.67] sorted [6 7 5]\n",
      "   state [0 0 1 0 0 1 1 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.49   0.17   0.27   0.26   0.42   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [0.49 0.72 0.27 0.26 0.47 0.4  0.69 0.67] sorted [1 6 7]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.49   0.17   0.27   0.26   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [-10.     0.72 -10.     0.39   0.47   0.4    0.69   0.67] sorted [1 6 7]\n",
      "instance 9, ep 17, state [0 1 1 0 0 1 0 0]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4    0.69   0.67] sorted [6 7 0]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4    0.69   0.67] sorted [6 7 0]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.     0.72 -10.     0.39   0.47   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.49   0.72   0.27   0.26   0.47   0.52 -10.     0.28] sorted [1 5 0]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [-10.     0.17   0.27   0.39   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.49   0.17   0.27   0.39   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 1 0 0 0 1 0 1] state_WI [0.49 0.17 0.27 0.39 0.47 0.4  0.69 0.28] sorted [6 0 4]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [1 1 1 0 0 1 0 0] state_WI [-10.     0.17 -10.     0.39   0.47   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [-10.     0.72 -10.     0.39   0.47   0.4    0.69   0.67] sorted [1 6 7]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.     0.72 -10.     0.39   0.47   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [1 1 1 0 0 0 1 0] state_WI [-10.     0.17 -10.     0.39   0.47   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.49   0.17   0.27   0.39   0.47   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [1 1 0 0 0 0 1 1] state_WI [-10.     0.17   0.27   0.39   0.47   0.52 -10.     0.28] sorted [5 4 3]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [-10.     0.17   0.27   0.26   0.42   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [-10.     0.17   0.27   0.39   0.42   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [0 0 0 0 1 1 0 0] state_WI [0.49 0.72 0.27 0.39 0.42 0.4  0.69 0.67] sorted [1 6 7]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [-10.     0.72 -10.     0.39   0.47   0.4  -10.     0.28] sorted [1 4 5]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.49   0.17   0.27   0.39   0.47   0.4  -10.     0.67] sorted [7 0 4]\n",
      "instance 9, ep 18, state [0 1 1 1 0 1 1 1]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.49   0.17 -10.     0.26   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [1 1 1 0 0 1 0 0] state_WI [-10.     0.17 -10.     0.39   0.47   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [0 0 1 0 0 1 1 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [1 0 1 0 0 0 0 1] state_WI [-10.     0.72 -10.     0.39   0.47   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [1 1 1 0 0 1 1 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.4  -10.     0.28] sorted [4 5 3]\n",
      "   state [0 1 1 0 1 0 0 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.52   0.69   0.28] sorted [6 5 0]\n",
      "   state [1 1 1 0 0 0 1 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.52 -10.     0.28] sorted [5 4 3]\n",
      "   state [0 1 1 1 1 1 0 0] state_WI [  0.49   0.17 -10.     0.26   0.42   0.4    0.69   0.67] sorted [6 7 0]\n",
      "   state [0 1 1 0 1 1 1 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [-10.     0.17   0.27   0.39   0.42   0.52 -10.     0.28] sorted [5 4 3]\n",
      "   state [0 1 1 0 1 1 0 0] state_WI [  0.49   0.17 -10.     0.39   0.42   0.4    0.69   0.67] sorted [6 7 0]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.49   0.17   0.27   0.39   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [  0.49   0.17 -10.     0.39   0.42   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [1 1 1 0 0 0 0 0] state_WI [-10.     0.17 -10.     0.39   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 0 0 0 0 0 1 1] state_WI [  0.49   0.72   0.27   0.39   0.47   0.52 -10.     0.28] sorted [1 5 0]\n",
      "   state [0 0 0 1 0 0 1 1] state_WI [  0.49   0.72   0.27   0.26   0.47   0.52 -10.     0.28] sorted [1 5 0]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [0.49 0.17 0.27 0.26 0.47 0.4  0.69 0.28] sorted [6 0 4]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.49   0.72 -10.     0.26   0.42   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 1 1 1 0 0 1 1] state_WI [  0.49   0.17 -10.     0.26   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [-10.     0.17 -10.     0.39   0.42   0.52 -10.     0.28] sorted [5 4 3]\n",
      "instance 9, ep 19, state [1 0 1 0 1 0 0 0]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.     0.72 -10.     0.39   0.42   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [0.49 0.72 0.27 0.39 0.47 0.4  0.69 0.28] sorted [1 6 0]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.49   0.17   0.27   0.39   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [-10.     0.17   0.27   0.26   0.42   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [1 1 1 1 1 0 0 0] state_WI [-10.     0.17 -10.     0.26   0.42   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.     0.72 -10.     0.39   0.42   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [0 0 1 0 1 1 1 0] state_WI [  0.49   0.72 -10.     0.39   0.42   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [-10.     0.72   0.27   0.39   0.47   0.4  -10.     0.67] sorted [1 7 4]\n",
      "   state [0 1 0 0 0 1 1 0] state_WI [  0.49   0.17   0.27   0.39   0.47   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [1 0 1 0 1 0 1 0] state_WI [-10.     0.72 -10.     0.39   0.42   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 1 1 0 0 0 0 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 1 1 0 0 1 1 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [1 1 1 0 1 0 1 1] state_WI [-10.     0.17 -10.     0.39   0.42   0.52 -10.     0.28] sorted [5 4 3]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.49   0.17 -10.     0.26   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 0 0 1 1 0 0 0] state_WI [0.49 0.72 0.27 0.26 0.42 0.52 0.69 0.67] sorted [1 6 7]\n",
      "   state [0 1 1 1 1 0 0 1] state_WI [  0.49   0.17 -10.     0.26   0.42   0.52   0.69   0.28] sorted [6 5 0]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.49   0.17   0.27   0.26   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 1 1 0 1 0 0 0] state_WI [-10.     0.17 -10.     0.39   0.42   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [1 1 0 0 1 0 0 0] state_WI [-10.     0.17   0.27   0.39   0.42   0.52   0.69   0.67] sorted [6 7 5]\n",
      "instance 9, ep 20, state [1 0 1 0 0 1 0 0]\n",
      "   state [1 0 1 0 0 1 0 0] state_WI [-10.     0.72 -10.     0.39   0.47   0.4    0.69   0.67] sorted [1 6 7]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [0.49 0.17 0.27 0.39 0.47 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [-10.     0.72   0.27   0.39   0.47   0.4  -10.     0.67] sorted [1 7 4]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [0.49 0.17 0.27 0.39 0.42 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [1 1 1 0 0 1 0 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [0 1 1 0 1 1 0 0] state_WI [  0.49   0.17 -10.     0.39   0.42   0.4    0.69   0.67] sorted [6 7 0]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [-10.     0.17   0.27   0.39   0.42   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.49   0.17   0.27   0.39   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 1 0 1 0 1 0 0] state_WI [-10.     0.17   0.27   0.26   0.47   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [1 0 0 0 1 0 1 1] state_WI [-10.     0.72   0.27   0.39   0.42   0.52 -10.     0.28] sorted [1 5 4]\n",
      "   state [0 0 1 0 1 1 0 1] state_WI [  0.49   0.72 -10.     0.39   0.42   0.4    0.69   0.28] sorted [1 6 0]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.49   0.17   0.27   0.26   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.49   0.17   0.27   0.26   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 0 1 0 1 1 1 1] state_WI [-10.     0.72 -10.     0.39   0.42   0.4  -10.     0.28] sorted [1 4 5]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [1 1 0 0 0 0 0 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 1 0 0 0 1 0 1] state_WI [0.49 0.17 0.27 0.39 0.47 0.4  0.69 0.28] sorted [6 0 4]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [-10.     0.72   0.27   0.39   0.47   0.52 -10.     0.28] sorted [1 5 4]\n",
      "   state [0 1 1 0 0 1 0 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4    0.69   0.28] sorted [6 0 4]\n",
      "   state [0 0 0 1 1 1 1 0] state_WI [  0.49   0.72   0.27   0.26   0.42   0.4  -10.     0.67] sorted [1 7 0]\n",
      "instance 9, ep 21, state [1 0 0 0 1 1 1 1]\n",
      "   state [1 0 0 0 1 1 1 1] state_WI [-10.     0.72   0.27   0.39   0.42   0.4  -10.     0.28] sorted [1 4 5]\n",
      "   state [1 1 1 0 1 1 1 1] state_WI [-10.     0.17 -10.     0.39   0.42   0.4  -10.     0.28] sorted [4 5 3]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.49   0.72 -10.     0.39   0.42   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [0 0 1 0 0 0 1 0] state_WI [  0.49   0.72 -10.     0.39   0.47   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 1 1 0 1 1 0 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.4    0.69   0.28] sorted [6 0 4]\n",
      "   state [1 1 1 0 1 1 1 1] state_WI [-10.     0.17 -10.     0.39   0.42   0.4  -10.     0.28] sorted [4 5 3]\n",
      "   state [0 1 1 1 1 1 0 1] state_WI [  0.49   0.17 -10.     0.26   0.42   0.4    0.69   0.28] sorted [6 0 4]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.49   0.17 -10.     0.26   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 0 1 1 1 1 0 0] state_WI [-10.     0.72 -10.     0.26   0.42   0.4    0.69   0.67] sorted [1 6 7]\n",
      "   state [1 0 1 1 1 0 0 1] state_WI [-10.     0.72 -10.     0.26   0.42   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [1 1 0 1 0 1 0 1] state_WI [-10.     0.17   0.27   0.26   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [0.49 0.17 0.27 0.26 0.42 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [0 0 0 1 1 0 0 1] state_WI [0.49 0.72 0.27 0.26 0.42 0.52 0.69 0.28] sorted [1 6 5]\n",
      "   state [0 0 0 0 0 1 0 1] state_WI [0.49 0.72 0.27 0.39 0.47 0.4  0.69 0.28] sorted [1 6 0]\n",
      "   state [1 1 0 0 0 0 1 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [1 1 1 0 1 1 0 0] state_WI [-10.     0.17 -10.     0.39   0.42   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [0 1 0 0 0 1 1 1] state_WI [  0.49   0.17   0.27   0.39   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.49   0.17   0.27   0.39   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 0 0 1 0 0 0] state_WI [0.49 0.17 0.27 0.39 0.42 0.52 0.69 0.67] sorted [6 7 5]\n",
      "instance 9, ep 22, state [0 0 1 0 0 0 0 1]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 1 1 0 0 1 1 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 0 1 1 1 0 0 1] state_WI [  0.49   0.72 -10.     0.26   0.42   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.49   0.72 -10.     0.26   0.47   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [0 1 1 0 1 1 0 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.4    0.69   0.28] sorted [6 0 4]\n",
      "   state [1 0 1 1 1 0 1 0] state_WI [-10.     0.72 -10.     0.26   0.42   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 0 1 0 1 0 1 0] state_WI [  0.49   0.72 -10.     0.39   0.42   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 1 0 0 1 1 0 1] state_WI [0.49 0.17 0.27 0.39 0.42 0.4  0.69 0.28] sorted [6 0 4]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [-10.     0.72   0.27   0.39   0.42   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [0.49 0.17 0.27 0.39 0.42 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [1 0 0 0 1 1 1 1] state_WI [-10.     0.72   0.27   0.39   0.42   0.4  -10.     0.28] sorted [1 4 5]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [-10.     0.72 -10.     0.39   0.47   0.4  -10.     0.28] sorted [1 4 5]\n",
      "   state [1 0 0 0 0 1 0 1] state_WI [-10.     0.72   0.27   0.39   0.47   0.4    0.69   0.28] sorted [1 6 4]\n",
      "   state [1 1 1 0 0 1 1 0] state_WI [-10.     0.17 -10.     0.39   0.47   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [1 1 1 0 0 1 1 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.4  -10.     0.28] sorted [4 5 3]\n",
      "   state [0 0 1 0 1 0 0 0] state_WI [  0.49   0.72 -10.     0.39   0.42   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [0.49 0.72 0.27 0.39 0.47 0.52 0.69 0.67] sorted [1 6 7]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.49   0.17   0.27   0.39   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.49   0.17 -10.     0.26   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "instance 9, ep 23, state [0 1 0 1 0 0 1 1]\n",
      "   state [0 1 0 1 0 0 1 1] state_WI [  0.49   0.17   0.27   0.26   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.     0.72 -10.     0.39   0.42   0.52 -10.     0.28] sorted [1 5 4]\n",
      "   state [1 1 0 0 1 0 0 1] state_WI [-10.     0.17   0.27   0.39   0.42   0.52   0.69   0.28] sorted [6 5 4]\n",
      "   state [1 1 0 1 1 1 1 0] state_WI [-10.     0.17   0.27   0.26   0.42   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [0 1 0 1 1 1 1 0] state_WI [  0.49   0.17   0.27   0.26   0.42   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [0 1 1 1 1 1 0 1] state_WI [  0.49   0.17 -10.     0.26   0.42   0.4    0.69   0.28] sorted [6 0 4]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [-10.     0.17   0.27   0.39   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.49   0.72   0.27   0.39   0.42   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [0 0 1 1 1 0 1 1] state_WI [  0.49   0.72 -10.     0.26   0.42   0.52 -10.     0.28] sorted [1 5 0]\n",
      "   state [1 1 0 1 0 0 1 1] state_WI [-10.     0.17   0.27   0.26   0.47   0.52 -10.     0.28] sorted [5 4 7]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [-10.     0.72 -10.     0.39   0.47   0.4  -10.     0.28] sorted [1 4 5]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [0 1 0 0 0 1 0 1] state_WI [0.49 0.17 0.27 0.39 0.47 0.4  0.69 0.28] sorted [6 0 4]\n",
      "   state [1 1 1 0 0 1 0 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [0 0 1 0 1 1 1 1] state_WI [  0.49   0.72 -10.     0.39   0.42   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [0.49 0.72 0.27 0.39 0.47 0.52 0.69 0.67] sorted [1 6 7]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [0.49 0.17 0.27 0.26 0.47 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [0 1 1 1 0 1 0 1] state_WI [  0.49   0.17 -10.     0.26   0.47   0.4    0.69   0.28] sorted [6 0 4]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.49   0.17   0.27   0.39   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 0 1 1 0 1 0 0] state_WI [-10.     0.72 -10.     0.26   0.47   0.4    0.69   0.67] sorted [1 6 7]\n",
      "instance 9, ep 24, state [0 0 0 0 0 0 0 0]\n",
      "   state [0 0 0 0 0 0 0 0] state_WI [0.49 0.72 0.27 0.39 0.47 0.52 0.69 0.67] sorted [1 6 7]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [0.49 0.17 0.27 0.26 0.47 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [1 1 1 0 0 1 0 0] state_WI [-10.     0.17 -10.     0.39   0.47   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [0 0 0 1 0 1 0 0] state_WI [0.49 0.72 0.27 0.26 0.47 0.4  0.69 0.67] sorted [1 6 7]\n",
      "   state [0 1 0 1 0 0 0 0] state_WI [0.49 0.17 0.27 0.26 0.47 0.52 0.69 0.67] sorted [6 7 5]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52   0.69   0.28] sorted [6 5 0]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [-10.     0.17   0.27   0.39   0.42   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [-10.     0.17   0.27   0.39   0.42   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [0 1 0 0 1 1 1 1] state_WI [  0.49   0.17   0.27   0.39   0.42   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 1 0 0 0 1 0 0] state_WI [0.49 0.17 0.27 0.39 0.47 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [1 1 1 0 0 1 0 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [1 0 0 0 1 1 0 1] state_WI [-10.     0.72   0.27   0.39   0.42   0.4    0.69   0.28] sorted [1 6 4]\n",
      "   state [0 1 0 0 1 0 1 1] state_WI [  0.49   0.17   0.27   0.39   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 1 0 0 1 0 1 1] state_WI [-10.     0.17   0.27   0.39   0.42   0.52 -10.     0.28] sorted [5 4 3]\n",
      "   state [0 1 0 1 1 0 1 1] state_WI [  0.49   0.17   0.27   0.26   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [0.49 0.17 0.27 0.26 0.42 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [0 1 0 0 1 0 1 0] state_WI [  0.49   0.17   0.27   0.39   0.42   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [1 1 0 1 1 0 1 0] state_WI [-10.     0.17   0.27   0.26   0.42   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [0 1 0 0 1 1 1 1] state_WI [  0.49   0.17   0.27   0.39   0.42   0.4  -10.     0.28] sorted [0 4 5]\n",
      "instance 9, ep 25, state [1 1 1 0 0 1 0 0]\n",
      "   state [1 1 1 0 0 1 0 0] state_WI [-10.     0.17 -10.     0.39   0.47   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [1 1 1 0 0 1 0 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [0 1 0 0 1 0 0 1] state_WI [0.49 0.17 0.27 0.39 0.42 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [0 1 1 1 0 0 1 0] state_WI [  0.49   0.17 -10.     0.26   0.47   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [0 0 1 1 0 0 1 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.49   0.72   0.27   0.39   0.47   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [1 0 1 0 0 0 0 0] state_WI [-10.     0.72 -10.     0.39   0.47   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [1 1 1 0 0 0 1 0] state_WI [-10.     0.17 -10.     0.39   0.47   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.49   0.17   0.27   0.39   0.47   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [0 0 0 1 0 0 1 0] state_WI [  0.49   0.72   0.27   0.26   0.47   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 0 1 1 0 1 0 1] state_WI [  0.49   0.72 -10.     0.26   0.47   0.4    0.69   0.28] sorted [1 6 0]\n",
      "   state [0 0 0 0 0 0 1 0] state_WI [  0.49   0.72   0.27   0.39   0.47   0.52 -10.     0.67] sorted [1 7 5]\n",
      "   state [0 1 1 0 0 0 0 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52   0.69   0.28] sorted [6 5 0]\n",
      "   state [1 1 0 0 0 1 0 1] state_WI [-10.     0.17   0.27   0.39   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [1 0 0 0 1 1 0 0] state_WI [-10.     0.72   0.27   0.39   0.42   0.4    0.69   0.67] sorted [1 6 7]\n",
      "   state [0 0 0 0 1 0 1 1] state_WI [  0.49   0.72   0.27   0.39   0.42   0.52 -10.     0.28] sorted [1 5 0]\n",
      "   state [1 0 0 1 1 0 0 1] state_WI [-10.     0.72   0.27   0.26   0.42   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 1 1 0 1 0 1 0] state_WI [  0.49   0.17 -10.     0.39   0.42   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [0 1 0 1 0 0 0 1] state_WI [0.49 0.17 0.27 0.26 0.47 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [0.49 0.17 0.27 0.39 0.47 0.52 0.69 0.28] sorted [6 5 0]\n",
      "instance 9, ep 26, state [1 1 1 0 0 1 0 1]\n",
      "   state [1 1 1 0 0 1 0 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [1 1 0 0 0 1 1 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [1 0 0 0 0 1 1 0] state_WI [-10.     0.72   0.27   0.39   0.47   0.4  -10.     0.67] sorted [1 7 4]\n",
      "   state [0 1 1 1 0 1 0 0] state_WI [  0.49   0.17 -10.     0.26   0.47   0.4    0.69   0.67] sorted [6 7 0]\n",
      "   state [1 0 1 1 0 1 1 0] state_WI [-10.     0.72 -10.     0.26   0.47   0.4  -10.     0.67] sorted [1 7 4]\n",
      "   state [1 1 1 1 0 0 1 0] state_WI [-10.     0.17 -10.     0.26   0.47   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [1 1 1 1 1 1 1 1] state_WI [-10.     0.17 -10.     0.26   0.42   0.4  -10.     0.28] sorted [4 5 7]\n",
      "   state [0 1 0 1 0 1 0 1] state_WI [0.49 0.17 0.27 0.26 0.47 0.4  0.69 0.28] sorted [6 0 4]\n",
      "   state [0 1 0 1 0 0 1 0] state_WI [  0.49   0.17   0.27   0.26   0.47   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [0.49 0.17 0.27 0.39 0.47 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [0 0 1 0 0 1 0 0] state_WI [  0.49   0.72 -10.     0.39   0.47   0.4    0.69   0.67] sorted [1 6 7]\n",
      "   state [0 1 0 0 0 0 0 1] state_WI [0.49 0.17 0.27 0.39 0.47 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [0 1 1 0 0 1 1 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [0 0 0 0 1 0 0 1] state_WI [0.49 0.72 0.27 0.39 0.42 0.52 0.69 0.28] sorted [1 6 5]\n",
      "   state [0 1 0 0 0 0 1 1] state_WI [  0.49   0.17   0.27   0.39   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 0 0 0 1 0 1] state_WI [0.49 0.17 0.27 0.39 0.47 0.4  0.69 0.28] sorted [6 0 4]\n",
      "   state [0 1 1 0 1 0 0 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.52   0.69   0.28] sorted [6 5 0]\n",
      "   state [0 0 1 1 0 0 0 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [0 1 0 1 1 0 0 1] state_WI [0.49 0.17 0.27 0.26 0.42 0.52 0.69 0.28] sorted [6 5 0]\n",
      "   state [1 0 0 0 0 0 1 1] state_WI [-10.     0.72   0.27   0.39   0.47   0.52 -10.     0.28] sorted [1 5 4]\n",
      "instance 9, ep 27, state [1 1 0 0 1 1 1 0]\n",
      "   state [1 1 0 0 1 1 1 0] state_WI [-10.     0.17   0.27   0.39   0.42   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [0 1 0 0 1 1 0 1] state_WI [0.49 0.17 0.27 0.39 0.42 0.4  0.69 0.28] sorted [6 0 4]\n",
      "   state [0 0 0 0 1 1 1 0] state_WI [  0.49   0.72   0.27   0.39   0.42   0.4  -10.     0.67] sorted [1 7 0]\n",
      "   state [1 1 0 1 0 1 1 0] state_WI [-10.     0.17   0.27   0.26   0.47   0.4  -10.     0.67] sorted [7 4 5]\n",
      "   state [0 0 0 0 1 1 1 1] state_WI [  0.49   0.72   0.27   0.39   0.42   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [0.49 0.17 0.27 0.39 0.42 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [1 1 0 0 1 0 1 0] state_WI [-10.     0.17   0.27   0.39   0.42   0.52 -10.     0.67] sorted [7 5 4]\n",
      "   state [1 1 1 0 0 1 0 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [1 1 1 0 1 1 1 1] state_WI [-10.     0.17 -10.     0.39   0.42   0.4  -10.     0.28] sorted [4 5 3]\n",
      "   state [1 1 1 1 0 0 0 0] state_WI [-10.     0.17 -10.     0.26   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.52   0.69   0.28] sorted [6 5 4]\n",
      "   state [0 0 0 0 1 0 0 0] state_WI [0.49 0.72 0.27 0.39 0.42 0.52 0.69 0.67] sorted [1 6 7]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.49   0.17 -10.     0.26   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 1 0 1 1 1 1 1] state_WI [-10.     0.17   0.27   0.26   0.42   0.4  -10.     0.28] sorted [4 5 7]\n",
      "   state [0 0 1 1 1 1 0 1] state_WI [  0.49   0.72 -10.     0.26   0.42   0.4    0.69   0.28] sorted [1 6 0]\n",
      "   state [0 1 1 0 1 1 1 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [1 1 0 0 0 1 0 0] state_WI [-10.     0.17   0.27   0.39   0.47   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [0 1 0 1 1 1 1 1] state_WI [  0.49   0.17   0.27   0.26   0.42   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 1 0 1 0 1 1 1] state_WI [  0.49   0.17   0.27   0.26   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 1 1 0 1 1 1 0] state_WI [  0.49   0.17 -10.     0.39   0.42   0.4  -10.     0.67] sorted [7 0 4]\n",
      "instance 9, ep 28, state [0 1 1 1 0 1 1 1]\n",
      "   state [0 1 1 1 0 1 1 1] state_WI [  0.49   0.17 -10.     0.26   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 0 1 1 0 0 0 1] state_WI [  0.49   0.72 -10.     0.26   0.47   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 0 0 1 0 0 0 1] state_WI [0.49 0.72 0.27 0.26 0.47 0.52 0.69 0.28] sorted [1 6 5]\n",
      "   state [0 1 0 1 0 1 1 0] state_WI [  0.49   0.17   0.27   0.26   0.47   0.4  -10.     0.67] sorted [7 0 4]\n",
      "   state [1 0 1 1 1 1 1 1] state_WI [-10.     0.72 -10.     0.26   0.42   0.4  -10.     0.28] sorted [1 4 5]\n",
      "   state [1 0 0 0 0 1 1 1] state_WI [-10.     0.72   0.27   0.39   0.47   0.4  -10.     0.28] sorted [1 4 5]\n",
      "   state [1 1 1 1 0 1 0 1] state_WI [-10.     0.17 -10.     0.26   0.47   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [0 1 1 1 1 1 0 0] state_WI [  0.49   0.17 -10.     0.26   0.42   0.4    0.69   0.67] sorted [6 7 0]\n",
      "   state [0 0 1 1 0 1 0 0] state_WI [  0.49   0.72 -10.     0.26   0.47   0.4    0.69   0.67] sorted [1 6 7]\n",
      "   state [0 1 0 1 1 1 0 0] state_WI [0.49 0.17 0.27 0.26 0.42 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [1 1 1 1 1 1 0 1] state_WI [-10.     0.17 -10.     0.26   0.42   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [1 0 1 0 1 1 1 0] state_WI [-10.     0.72 -10.     0.39   0.42   0.4  -10.     0.67] sorted [1 7 4]\n",
      "   state [1 0 1 0 1 0 1 1] state_WI [-10.     0.72 -10.     0.39   0.42   0.52 -10.     0.28] sorted [1 5 4]\n",
      "   state [1 0 1 1 1 0 0 1] state_WI [-10.     0.72 -10.     0.26   0.42   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 1 1 0 0 1 0 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4    0.69   0.67] sorted [6 7 0]\n",
      "   state [1 0 1 1 1 0 1 1] state_WI [-10.     0.72 -10.     0.26   0.42   0.52 -10.     0.28] sorted [1 5 4]\n",
      "   state [0 0 0 1 1 0 1 1] state_WI [  0.49   0.72   0.27   0.26   0.42   0.52 -10.     0.28] sorted [1 5 0]\n",
      "   state [0 1 1 1 1 0 1 1] state_WI [  0.49   0.17 -10.     0.26   0.42   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [0 1 1 1 0 0 0 0] state_WI [  0.49   0.17 -10.     0.26   0.47   0.52   0.69   0.67] sorted [6 7 5]\n",
      "   state [0 1 1 0 0 1 1 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.4  -10.     0.28] sorted [0 4 5]\n",
      "instance 9, ep 29, state [0 0 1 0 0 1 0 1]\n",
      "   state [0 0 1 0 0 1 0 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.4    0.69   0.28] sorted [1 6 0]\n",
      "   state [0 1 1 1 1 1 1 1] state_WI [  0.49   0.17 -10.     0.26   0.42   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [0 1 1 1 1 1 1 1] state_WI [  0.49   0.17 -10.     0.26   0.42   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [1 1 1 1 1 1 0 1] state_WI [-10.     0.17 -10.     0.26   0.42   0.4    0.69   0.28] sorted [6 4 5]\n",
      "   state [0 1 0 0 1 1 0 1] state_WI [0.49 0.17 0.27 0.39 0.42 0.4  0.69 0.28] sorted [6 0 4]\n",
      "   state [0 1 0 0 1 1 0 0] state_WI [0.49 0.17 0.27 0.39 0.42 0.4  0.69 0.67] sorted [6 7 0]\n",
      "   state [1 1 1 0 0 0 0 1] state_WI [-10.     0.17 -10.     0.39   0.47   0.52   0.69   0.28] sorted [6 5 4]\n",
      "   state [1 0 0 0 1 0 0 1] state_WI [-10.     0.72   0.27   0.39   0.42   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 1 0 0 0 0 1 0] state_WI [  0.49   0.17   0.27   0.39   0.47   0.52 -10.     0.67] sorted [7 5 0]\n",
      "   state [0 0 0 0 0 1 1 1] state_WI [  0.49   0.72   0.27   0.39   0.47   0.4  -10.     0.28] sorted [1 0 4]\n",
      "   state [1 1 1 0 1 1 0 0] state_WI [-10.     0.17 -10.     0.39   0.42   0.4    0.69   0.67] sorted [6 7 4]\n",
      "   state [0 1 1 1 1 0 0 1] state_WI [  0.49   0.17 -10.     0.26   0.42   0.52   0.69   0.28] sorted [6 5 0]\n",
      "   state [1 0 1 0 0 1 1 1] state_WI [-10.     0.72 -10.     0.39   0.47   0.4  -10.     0.28] sorted [1 4 5]\n",
      "   state [0 0 1 0 0 0 0 1] state_WI [  0.49   0.72 -10.     0.39   0.47   0.52   0.69   0.28] sorted [1 6 5]\n",
      "   state [0 1 1 0 0 0 1 1] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52 -10.     0.28] sorted [5 0 4]\n",
      "   state [1 1 1 0 1 1 1 1] state_WI [-10.     0.17 -10.     0.39   0.42   0.4  -10.     0.28] sorted [4 5 3]\n",
      "   state [0 1 1 0 1 1 1 1] state_WI [  0.49   0.17 -10.     0.39   0.42   0.4  -10.     0.28] sorted [0 4 5]\n",
      "   state [1 0 1 0 1 0 0 0] state_WI [-10.     0.72 -10.     0.39   0.42   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [1 0 0 0 1 0 0 0] state_WI [-10.     0.72   0.27   0.39   0.42   0.52   0.69   0.67] sorted [1 6 7]\n",
      "   state [0 1 1 0 0 0 1 0] state_WI [  0.49   0.17 -10.     0.39   0.47   0.52 -10.     0.67] sorted [7 5 0]\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "3.5778333333333334"
      ]
     },
     "execution_count": 16,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.random.seed(seed)\n",
    "random.seed(seed)\n",
    "optimal_reward = optimal_whittle(simulator, n_episodes, n_epochs, discount)\n",
    "np.mean(optimal_reward)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Bundle the mean reward of every evaluated policy together with the\n",
    "# experiment settings, so the whole run can be serialized as one record.\n",
    "data = dict(\n",
    "    mean_reward_baseline=np.mean(rewards_without_norm),\n",
    "    mean_reward_norm=np.mean(rewards_with_norm),\n",
    "    mean_reward_perfect=np.mean(perfect_rewards),\n",
    "    mean_optimal_reward=np.mean(optimal_reward),\n",
    "    parameters=dict(\n",
    "        seed=seed,\n",
    "        n_arms=n_arms,\n",
    "        budget=budget,\n",
    "        discount=discount,\n",
    "        alpha=alpha,\n",
    "        n_episodes=n_episodes,\n",
    "        episode_len=episode_len,\n",
    "        n_epochs=n_epochs,\n",
    "        dataset=dataset,\n",
    "    ),\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 68,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Location of this run's results file; it is joined onto '../results/' when\n",
    "# the record is written out.\n",
    "save_path = get_save_path(\n",
    "    'better_bandit',\n",
    "    save_name,\n",
    "    seed,\n",
    "    use_date=save_with_date,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 69,
   "metadata": {},
   "outputs": [],
   "source": [
    "# NOTE(review): presumably removes previously saved results that duplicate\n",
    "# this run's record before the new file is written; confirm in rmab.utils.\n",
    "delete_duplicate_results(\n",
    "    'better_bandit',\n",
    "    save_name,\n",
    "    data,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 70,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Persist the results record as JSON under '../results/'. The context manager\n",
    "# closes (and therefore flushes) the file handle deterministically instead of\n",
    "# leaving it to garbage collection, which could leave a truncated file behind.\n",
    "with open('../results/'+save_path,'w') as results_file:\n",
    "    json.dump(data,results_file)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "food",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.12"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
