{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "%load_ext autoreload\n",
    "%autoreload 2\n",
    "\n",
    "# important libraries for running experiments\n",
    "from open_spiel_integration.experiment import run_gops_experiment\n",
    "from open_spiel_integration.open_spiel_bots import *\n",
    "import pyspiel"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "We first run MCTS against RandomBot"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 1: 8.8\n",
      "Player 2: 8.7\n",
      "Player 1 winrate: 0.5\n",
      "Player 2 winrate: 0.5\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "(8.8, 8.7, 0.5, 0.5)"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Load the gooftspiel game. remember to load the turn based version\n",
    "game = pyspiel.load_game_as_turn_based(\"goofspiel\", {\"num_cards\": 6})\n",
    "\n",
    "# Create random state\n",
    "random_state = np.random.RandomState(12)\n",
    "\n",
    "# Set up mcts bot\n",
    "mcts_bot1 = MCTSBot(game, player_id=0, rng=random_state, uct_c=2, max_simulations=100)\n",
    "\n",
    "# Set up random bot\n",
    "random_bot = RandomBot(game, player_id=1, rng=random_state)\n",
    "\n",
    "# Run the experiment\n",
    "run_gops_experiment(game, [mcts_bot1, random_bot], num_episodes=10, rng=random_state)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Next we run AlphaBeta against Random"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 1: 8.3\n",
      "Player 2: 9.4\n",
      "Player 1 winrate: 0.5\n",
      "Player 2 winrate: 0.5\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "(8.3, 9.4, 0.5, 0.5)"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Load the gooftspiel game. remember to load the turn based version\n",
    "game = pyspiel.load_game_as_turn_based(\"goofspiel\", {\"num_cards\": 6})\n",
    "\n",
    "# Create random state\n",
    "random_state = np.random.RandomState(12)\n",
    "\n",
    "# Set up alpha beta bot\n",
    "alpha_beta_bot = AlphaBetaBot(game, player_id=0, rng=random_state)\n",
    "\n",
    "# Set up random bot\n",
    "random_bot = RandomBot(game, player_id=1, rng=random_state)\n",
    "\n",
    "# Run the experiment\n",
    "run_gops_experiment(game, [alpha_beta_bot, random_bot], num_episodes=10, rng=random_state)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 1: 10.98\n",
      "Player 2: 6.37\n",
      "Player 1 winrate: 0.76\n",
      "Player 2 winrate: 0.24\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "(10.98, 6.37, 0.76, 0.24)"
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# custom SMMiniMaxBot vs random bot\n",
    "\n",
    "# Load the gooftspiel game. remember to load the turn based version\n",
    "game = pyspiel.load_game_as_turn_based(\"goofspiel\", {\"num_cards\": 6})\n",
    "\n",
    "# Create random state\n",
    "random_state = np.random.RandomState(12)\n",
    "\n",
    "# Set up SMMiniMaxBot\n",
    "sm_minimax_bot = SMMinimaxCustomBot(player_id=0, rng=random_state)\n",
    "\n",
    "# Set up random bot\n",
    "random_bot = RandomBot(game, player_id=1, rng=random_state)\n",
    "\n",
    "# Run the experiment\n",
    "run_gops_experiment(game, [sm_minimax_bot, random_bot], num_episodes=100, rng=random_state)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 1: 8.24\n",
      "Player 2: 8.71\n",
      "Player 1 winrate: 0.42\n",
      "Player 2 winrate: 0.58\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "(8.24, 8.71, 0.42, 0.58)"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# custom SMMiniMaxBot vs alpha beta bot\n",
    "\n",
    "# Load the gooftspiel game. remember to load the turn based version\n",
    "game = pyspiel.load_game_as_turn_based(\"goofspiel\", {\"num_cards\": 6})\n",
    "\n",
    "# Create random state\n",
    "random_state = np.random.RandomState(6)\n",
    "\n",
    "# Set up SMMiniMaxBot\n",
    "sm_minimax_bot = SMMinimaxCustomBot(player_id=0, rng=random_state)\n",
    "\n",
    "# Set up alpha beta bot\n",
    "alpha_beta_bot = AlphaBetaBot(game, player_id=1, rng=random_state)\n",
    "\n",
    "# Run the experiment\n",
    "run_gops_experiment(game, [sm_minimax_bot, alpha_beta_bot], num_episodes=100, rng=random_state)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 1: 8.24\n",
      "Player 2: 8.88\n",
      "Player 1 winrate: 0.42\n",
      "Player 2 winrate: 0.58\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "(8.24, 8.88, 0.42, 0.58)"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Load the gooftspiel game. remember to load the turn based version\n",
    "game = pyspiel.load_game_as_turn_based(\"goofspiel\", {\"num_cards\": 6})\n",
    "\n",
    "# Create random state\n",
    "random_state = np.random.RandomState(12)\n",
    "\n",
    "# Set up alpha beta bot\n",
    "alpha_beta_bot = AlphaBetaBot(game, player_id=1, rng=random_state)\n",
    "\n",
    "# Set up random bot\n",
    "random_bot = RandomBot(game, player_id=0, rng=random_state)\n",
    "\n",
    "# Run the experiment\n",
    "run_gops_experiment(game, [random_bot, alpha_beta_bot], num_episodes=100, rng=random_state)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 100/100 [02:22<00:00,  1.42s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 1: 6.32\n",
      "Player 2: 10.59\n",
      "Player 1 winrate: 0.17\n",
      "Player 2 winrate: 0.83\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "(6.32, 10.59, 0.17, 0.83)"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Load the gooftspiel game. remember to load the turn based version\n",
    "game = pyspiel.load_game_as_turn_based(\"goofspiel\", {\"num_cards\": 6})\n",
    "\n",
    "# Create random state\n",
    "random_state = np.random.RandomState(12)\n",
    "\n",
    "# Set up alpha beta bot\n",
    "alpha_beta_bot = AlphaBetaBot(game, player_id=1, rng=random_state, depth=3)\n",
    "\n",
    "# Set up random bot\n",
    "random_bot = RandomBot(game, player_id=0, rng=random_state)\n",
    "\n",
    "# Run the experiment\n",
    "run_gops_experiment(game, [random_bot, alpha_beta_bot], num_episodes=100, rng=random_state)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 100/100 [26:38<00:00, 15.99s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 1: 6.46\n",
      "Player 2: 10.81\n",
      "Player 1 winrate: 0.21\n",
      "Player 2 winrate: 0.79\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "(6.46, 10.81, 0.21, 0.79)"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# custom SMMiniMaxBot vs alpha beta bot\n",
    "\n",
    "# Load the gooftspiel game. remember to load the turn based version\n",
    "game = pyspiel.load_game_as_turn_based(\"goofspiel\", {\"num_cards\": 6})\n",
    "\n",
    "# Create random state\n",
    "random_state = np.random.RandomState(6)\n",
    "\n",
    "# Set up SMMiniMaxBot\n",
    "sm_minimax_bot = SMMinimaxCustomBot(player_id=0, rng=random_state, num_rollouts=10)\n",
    "\n",
    "# Set up alpha beta bot\n",
    "alpha_beta_bot = AlphaBetaBot(game, player_id=1, rng=random_state, depth=4, num_rollouts=10)\n",
    "\n",
    "# Run the experiment\n",
    "run_gops_experiment(game, [sm_minimax_bot, alpha_beta_bot], num_episodes=100, rng=random_state)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "  0%|          | 0/10 [00:00<?, ?it/s]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 0 takes action 5 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 6 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: []\n",
      "Player 2 cards: []\n",
      "Possible actions:  [1, 2, 3, 4, 5, 6]\n",
      "Player 1 takes action 5 at state Partial joint action: 5 \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 6 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [6]\n",
      "Player 2 cards: [6]\n",
      "Player 0 takes action 2 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 5 \n",
      "P1 hand: 1 2 3 4 5 \n",
      "Point card sequence: 6 3 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [6]\n",
      "Player 2 cards: [6]\n",
      "Possible actions:  [1, 2, 3, 4, 5]\n",
      "Player 1 takes action 4 at state Partial joint action: 2 \n",
      "P0 hand: 1 2 3 4 5 \n",
      "P1 hand: 1 2 3 4 5 \n",
      "Point card sequence: 6 3 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [6, 3]\n",
      "Player 2 cards: [6, 5]\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "OpenSpiel exception: /Users/runner/work/open_spiel/open_spiel/open_spiel/games/goofspiel/goofspiel.cc:435 CHECK_TRUE(player_hands_[p][action])\n",
      "  0%|          | 0/10 [00:09<?, ?it/s]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 0 takes action 0 at state Partial joint action: \n",
      "P0 hand: 1 2 4 5 \n",
      "P1 hand: 1 2 3 4 \n",
      "Point card sequence: 6 3 2 \n",
      "Points: 0 3 \n",
      "\n",
      "Player 1 cards: [6, 3]\n",
      "Player 2 cards: [6, 5]\n",
      "Possible actions:  [1, 2, 4, 5]\n",
      "Player 1 takes action 1 at state Partial joint action: 0 \n",
      "P0 hand: 1 2 4 5 \n",
      "P1 hand: 1 2 3 4 \n",
      "Point card sequence: 6 3 2 \n",
      "Points: 0 3 \n",
      "\n",
      "Player 1 cards: [6, 3, 1]\n",
      "Player 2 cards: [6, 5, 2]\n",
      "Player 0 takes action 1 at state Partial joint action: \n",
      "P0 hand: 2 4 5 \n",
      "P1 hand: 1 3 4 \n",
      "Point card sequence: 6 3 2 4 \n",
      "Points: 0 5 \n",
      "\n",
      "Player 1 cards: [6, 3, 1]\n",
      "Player 2 cards: [6, 5, 2]\n",
      "Possible actions:  [2, 4, 5]\n",
      "Player 1 takes action 3 at state Partial joint action: 1 \n",
      "P0 hand: 2 4 5 \n",
      "P1 hand: 1 3 4 \n",
      "Point card sequence: 6 3 2 4 \n",
      "Points: 0 5 \n",
      "\n",
      "Player 1 cards: [6, 3, 1, 2]\n",
      "Player 2 cards: [6, 5, 2, 4]\n",
      "Player 0 takes action 3 at state Partial joint action: \n",
      "P0 hand: 4 5 \n",
      "P1 hand: 1 3 \n",
      "Point card sequence: 6 3 2 4 1 \n",
      "Points: 0 9 \n",
      "\n",
      "Player 1 cards: [6, 3, 1, 2]\n",
      "Player 2 cards: [6, 5, 2, 4]\n",
      "Possible actions:  [4, 5]\n",
      "Player 1 takes action 3 at state Partial joint action: 3 \n",
      "P0 hand: 4 5 \n",
      "P1 hand: 1 3 \n",
      "Point card sequence: 6 3 2 4 1 \n",
      "Points: 0 9 \n",
      "\n",
      "Player 1 cards: [6, 3, 1, 2, 4]\n",
      "Player 2 cards: [6, 5, 2, 4, 4]\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    },
    {
     "ename": "SpielError",
     "evalue": "/Users/runner/work/open_spiel/open_spiel/open_spiel/games/goofspiel/goofspiel.cc:435 CHECK_TRUE(player_hands_[p][action])",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mSpielError\u001b[0m                                Traceback (most recent call last)",
      "\u001b[1;32m/Users/doctorduality/github-repos/generativeCommunication/gops_experiment.ipynb Cell 11\u001b[0m line \u001b[0;36m1\n\u001b[1;32m     <a href='vscode-notebook-cell:/Users/doctorduality/github-repos/generativeCommunication/gops_experiment.ipynb#X20sZmlsZQ%3D%3D?line=12'>13</a>\u001b[0m alpha_beta_bot \u001b[39m=\u001b[39m AlphaBetaBot(game, player_id\u001b[39m=\u001b[39m\u001b[39m0\u001b[39m, rng\u001b[39m=\u001b[39mrandom_state, depth\u001b[39m=\u001b[39m\u001b[39m4\u001b[39m, num_rollouts\u001b[39m=\u001b[39m\u001b[39m10\u001b[39m)\n\u001b[1;32m     <a href='vscode-notebook-cell:/Users/doctorduality/github-repos/generativeCommunication/gops_experiment.ipynb#X20sZmlsZQ%3D%3D?line=14'>15</a>\u001b[0m \u001b[39m# Run the experiment\u001b[39;00m\n\u001b[0;32m---> <a href='vscode-notebook-cell:/Users/doctorduality/github-repos/generativeCommunication/gops_experiment.ipynb#X20sZmlsZQ%3D%3D?line=15'>16</a>\u001b[0m run_gops_experiment(game, [alpha_beta_bot, sm_minimax_bot], num_episodes\u001b[39m=\u001b[39;49m\u001b[39m10\u001b[39;49m, rng\u001b[39m=\u001b[39;49mrandom_state)\n",
      "File \u001b[0;32m~/github-repos/generativeCommunication/open_spiel_integration/experiment.py:80\u001b[0m, in \u001b[0;36mrun_gops_experiment\u001b[0;34m(game, bots, num_episodes, rng)\u001b[0m\n\u001b[1;32m     77\u001b[0m         \u001b[39mprint\u001b[39m(\u001b[39m\"\u001b[39m\u001b[39mPlayer 1 cards: \u001b[39m\u001b[39m{}\u001b[39;00m\u001b[39m\"\u001b[39m\u001b[39m.\u001b[39mformat(player_cards))\n\u001b[1;32m     78\u001b[0m         \u001b[39mprint\u001b[39m(\u001b[39m\"\u001b[39m\u001b[39mPlayer 2 cards: \u001b[39m\u001b[39m{}\u001b[39;00m\u001b[39m\"\u001b[39m\u001b[39m.\u001b[39mformat(opponent_cards))\n\u001b[0;32m---> 80\u001b[0m         state\u001b[39m.\u001b[39;49mapply_action(action)\n\u001b[1;32m     82\u001b[0m gops_state \u001b[39m=\u001b[39m GOPSState(\u001b[39m'\u001b[39m\u001b[39mdummy\u001b[39m\u001b[39m'\u001b[39m, prize_cards, player_cards, opponent_cards, num_cards, \u001b[39mTrue\u001b[39;00m)\n\u001b[1;32m     84\u001b[0m \u001b[39m# Episode is over, update return\u001b[39;00m\n\u001b[1;32m     85\u001b[0m \u001b[39m# returns = state.returns()\u001b[39;00m\n",
      "\u001b[0;31mSpielError\u001b[0m: /Users/runner/work/open_spiel/open_spiel/open_spiel/games/goofspiel/goofspiel.cc:435 CHECK_TRUE(player_hands_[p][action])"
     ]
    }
   ],
   "source": [
    "# custom SMMiniMaxBot vs alpha beta bot\n",
    "\n",
    "# Load the gooftspiel game. remember to load the turn based version\n",
    "game = pyspiel.load_game_as_turn_based(\"goofspiel\", {\"num_cards\": 6})\n",
    "\n",
    "# Create random state\n",
    "random_state = np.random.RandomState(6)\n",
    "\n",
    "# Set up SMMiniMaxBot\n",
    "sm_minimax_bot = SMMinimaxCustomBot(player_id=1, rng=random_state, num_rollouts=10)\n",
    "\n",
    "# Set up alpha beta bot\n",
    "alpha_beta_bot = AlphaBetaBot(game, player_id=0, rng=random_state, depth=4, num_rollouts=10)\n",
    "\n",
    "# Run the experiment\n",
    "run_gops_experiment(game, [alpha_beta_bot, sm_minimax_bot], num_episodes=10, rng=random_state)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "  0%|          | 0/10 [00:00<?, ?it/s]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 0 takes action 5 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 6 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: []\n",
      "Player 2 cards: []\n",
      "Possible actions:  [1, 2, 3, 4, 5, 6]\n",
      "Player 1 takes action 5 at state Partial joint action: 5 \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 6 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [6]\n",
      "Player 2 cards: [6]\n",
      "Player 0 takes action 2 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 5 \n",
      "P1 hand: 1 2 3 4 5 \n",
      "Point card sequence: 6 3 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [6]\n",
      "Player 2 cards: [6]\n",
      "Possible actions:  [1, 2, 3, 4, 5]\n",
      "Player 1 takes action 4 at state Partial joint action: 2 \n",
      "P0 hand: 1 2 3 4 5 \n",
      "P1 hand: 1 2 3 4 5 \n",
      "Point card sequence: 6 3 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [6, 3]\n",
      "Player 2 cards: [6, 5]\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 10%|█         | 1/10 [00:09<01:21,  9.04s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 0 takes action 0 at state Partial joint action: \n",
      "P0 hand: 1 2 4 5 \n",
      "P1 hand: 1 2 3 4 \n",
      "Point card sequence: 6 3 2 \n",
      "Points: 0 3 \n",
      "\n",
      "Player 1 cards: [6, 3]\n",
      "Player 2 cards: [6, 5]\n",
      "Possible actions:  [1, 2, 3, 4]\n",
      "Player 1 takes action 2 at state Partial joint action: 0 \n",
      "P0 hand: 1 2 4 5 \n",
      "P1 hand: 1 2 3 4 \n",
      "Point card sequence: 6 3 2 \n",
      "Points: 0 3 \n",
      "\n",
      "Player 1 cards: [6, 3, 1]\n",
      "Player 2 cards: [6, 5, 3]\n",
      "Player 0 takes action 3 at state Partial joint action: \n",
      "P0 hand: 2 4 5 \n",
      "P1 hand: 1 2 4 \n",
      "Point card sequence: 6 3 2 4 \n",
      "Points: 0 5 \n",
      "\n",
      "Player 1 cards: [6, 3, 1]\n",
      "Player 2 cards: [6, 5, 3]\n",
      "Possible actions:  [1, 2, 4]\n",
      "Player 1 takes action 0 at state Partial joint action: 3 \n",
      "P0 hand: 2 4 5 \n",
      "P1 hand: 1 2 4 \n",
      "Point card sequence: 6 3 2 4 \n",
      "Points: 0 5 \n",
      "\n",
      "Player 1 cards: [6, 3, 1, 4]\n",
      "Player 2 cards: [6, 5, 3, 1]\n",
      "Player 0 takes action 1 at state Partial joint action: \n",
      "P0 hand: 2 5 \n",
      "P1 hand: 2 4 \n",
      "Point card sequence: 6 3 2 4 1 \n",
      "Points: 4 5 \n",
      "\n",
      "Player 1 cards: [6, 3, 1, 4]\n",
      "Player 2 cards: [6, 5, 3, 1]\n",
      "Possible actions:  [2, 4]\n",
      "Player 1 takes action 3 at state Partial joint action: 1 \n",
      "P0 hand: 2 5 \n",
      "P1 hand: 2 4 \n",
      "Point card sequence: 6 3 2 4 1 \n",
      "Points: 4 5 \n",
      "\n",
      "Player 1 cards: [6, 3, 1, 4, 2]\n",
      "Player 2 cards: [6, 5, 3, 1, 4]\n",
      "Player 0 takes action 2 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 2 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: []\n",
      "Player 2 cards: []\n",
      "Possible actions:  [1, 2, 3, 4, 5, 6]\n",
      "Player 1 takes action 1 at state Partial joint action: 2 \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 2 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [3]\n",
      "Player 2 cards: [2]\n",
      "Player 0 takes action 1 at state Partial joint action: \n",
      "P0 hand: 1 2 4 5 6 \n",
      "P1 hand: 1 3 4 5 6 \n",
      "Point card sequence: 2 1 \n",
      "Points: 2 0 \n",
      "\n",
      "Player 1 cards: [3]\n",
      "Player 2 cards: [2]\n",
      "Possible actions:  [1, 3, 4, 5, 6]\n",
      "Player 1 takes action 0 at state Partial joint action: 1 \n",
      "P0 hand: 1 2 4 5 6 \n",
      "P1 hand: 1 3 4 5 6 \n",
      "Point card sequence: 2 1 \n",
      "Points: 2 0 \n",
      "\n",
      "Player 1 cards: [3, 2]\n",
      "Player 2 cards: [2, 1]\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 20%|██        | 2/10 [00:18<01:13,  9.23s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 0 takes action 3 at state Partial joint action: \n",
      "P0 hand: 1 4 5 6 \n",
      "P1 hand: 3 4 5 6 \n",
      "Point card sequence: 2 1 4 \n",
      "Points: 3 0 \n",
      "\n",
      "Player 1 cards: [3, 2]\n",
      "Player 2 cards: [2, 1]\n",
      "Possible actions:  [3, 4, 5, 6]\n",
      "Player 1 takes action 3 at state Partial joint action: 3 \n",
      "P0 hand: 1 4 5 6 \n",
      "P1 hand: 3 4 5 6 \n",
      "Point card sequence: 2 1 4 \n",
      "Points: 3 0 \n",
      "\n",
      "Player 1 cards: [3, 2, 4]\n",
      "Player 2 cards: [2, 1, 4]\n",
      "Player 0 takes action 5 at state Partial joint action: \n",
      "P0 hand: 1 5 6 \n",
      "P1 hand: 3 5 6 \n",
      "Point card sequence: 2 1 4 6 \n",
      "Points: 3 0 \n",
      "\n",
      "Player 1 cards: [3, 2, 4]\n",
      "Player 2 cards: [2, 1, 4]\n",
      "Possible actions:  [3, 5, 6]\n",
      "Player 1 takes action 5 at state Partial joint action: 5 \n",
      "P0 hand: 1 5 6 \n",
      "P1 hand: 3 5 6 \n",
      "Point card sequence: 2 1 4 6 \n",
      "Points: 3 0 \n",
      "\n",
      "Player 1 cards: [3, 2, 4, 6]\n",
      "Player 2 cards: [2, 1, 4, 6]\n",
      "Player 0 takes action 4 at state Partial joint action: \n",
      "P0 hand: 1 5 \n",
      "P1 hand: 3 5 \n",
      "Point card sequence: 2 1 4 6 5 \n",
      "Points: 3 0 \n",
      "\n",
      "Player 1 cards: [3, 2, 4, 6]\n",
      "Player 2 cards: [2, 1, 4, 6]\n",
      "Possible actions:  [3, 5]\n",
      "Player 1 takes action 4 at state Partial joint action: 4 \n",
      "P0 hand: 1 5 \n",
      "P1 hand: 3 5 \n",
      "Point card sequence: 2 1 4 6 5 \n",
      "Points: 3 0 \n",
      "\n",
      "Player 1 cards: [3, 2, 4, 6, 5]\n",
      "Player 2 cards: [2, 1, 4, 6, 5]\n",
      "Player 0 takes action 0 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 2 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: []\n",
      "Player 2 cards: []\n",
      "Possible actions:  [1, 2, 3, 4, 5, 6]\n",
      "Player 1 takes action 2 at state Partial joint action: 0 \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 2 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [1]\n",
      "Player 2 cards: [3]\n",
      "Player 0 takes action 5 at state Partial joint action: \n",
      "P0 hand: 2 3 4 5 6 \n",
      "P1 hand: 1 2 4 5 6 \n",
      "Point card sequence: 2 5 \n",
      "Points: 0 2 \n",
      "\n",
      "Player 1 cards: [1]\n",
      "Player 2 cards: [3]\n",
      "Possible actions:  [1, 2, 4, 5, 6]\n",
      "Player 1 takes action 0 at state Partial joint action: 5 \n",
      "P0 hand: 2 3 4 5 6 \n",
      "P1 hand: 1 2 4 5 6 \n",
      "Point card sequence: 2 5 \n",
      "Points: 0 2 \n",
      "\n",
      "Player 1 cards: [1, 6]\n",
      "Player 2 cards: [3, 1]\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 30%|███       | 3/10 [00:27<01:04,  9.25s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 0 takes action 1 at state Partial joint action: \n",
      "P0 hand: 2 3 4 5 \n",
      "P1 hand: 2 4 5 6 \n",
      "Point card sequence: 2 5 1 \n",
      "Points: 5 2 \n",
      "\n",
      "Player 1 cards: [1, 6]\n",
      "Player 2 cards: [3, 1]\n",
      "Possible actions:  [2, 4, 5, 6]\n",
      "Player 1 takes action 1 at state Partial joint action: 1 \n",
      "P0 hand: 2 3 4 5 \n",
      "P1 hand: 2 4 5 6 \n",
      "Point card sequence: 2 5 1 \n",
      "Points: 5 2 \n",
      "\n",
      "Player 1 cards: [1, 6, 2]\n",
      "Player 2 cards: [3, 1, 2]\n",
      "Player 0 takes action 2 at state Partial joint action: \n",
      "P0 hand: 3 4 5 \n",
      "P1 hand: 4 5 6 \n",
      "Point card sequence: 2 5 1 6 \n",
      "Points: 5 2 \n",
      "\n",
      "Player 1 cards: [1, 6, 2]\n",
      "Player 2 cards: [3, 1, 2]\n",
      "Possible actions:  [4, 5, 6]\n",
      "Player 1 takes action 4 at state Partial joint action: 2 \n",
      "P0 hand: 3 4 5 \n",
      "P1 hand: 4 5 6 \n",
      "Point card sequence: 2 5 1 6 \n",
      "Points: 5 2 \n",
      "\n",
      "Player 1 cards: [1, 6, 2, 3]\n",
      "Player 2 cards: [3, 1, 2, 5]\n",
      "Player 0 takes action 3 at state Partial joint action: \n",
      "P0 hand: 4 5 \n",
      "P1 hand: 4 6 \n",
      "Point card sequence: 2 5 1 6 4 \n",
      "Points: 5 8 \n",
      "\n",
      "Player 1 cards: [1, 6, 2, 3]\n",
      "Player 2 cards: [3, 1, 2, 5]\n",
      "Possible actions:  [4, 6]\n",
      "Player 1 takes action 5 at state Partial joint action: 3 \n",
      "P0 hand: 4 5 \n",
      "P1 hand: 4 6 \n",
      "Point card sequence: 2 5 1 6 4 \n",
      "Points: 5 8 \n",
      "\n",
      "Player 1 cards: [1, 6, 2, 3, 4]\n",
      "Player 2 cards: [3, 1, 2, 5, 6]\n",
      "Player 0 takes action 1 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 2 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: []\n",
      "Player 2 cards: []\n",
      "Possible actions:  [1, 2, 3, 4, 5, 6]\n",
      "Player 1 takes action 2 at state Partial joint action: 1 \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 2 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [2]\n",
      "Player 2 cards: [3]\n",
      "Player 0 takes action 3 at state Partial joint action: \n",
      "P0 hand: 1 3 4 5 6 \n",
      "P1 hand: 1 2 4 5 6 \n",
      "Point card sequence: 2 3 \n",
      "Points: 0 2 \n",
      "\n",
      "Player 1 cards: [2]\n",
      "Player 2 cards: [3]\n",
      "Possible actions:  [1, 2, 4, 5, 6]\n",
      "Player 1 takes action 0 at state Partial joint action: 3 \n",
      "P0 hand: 1 3 4 5 6 \n",
      "P1 hand: 1 2 4 5 6 \n",
      "Point card sequence: 2 3 \n",
      "Points: 0 2 \n",
      "\n",
      "Player 1 cards: [2, 4]\n",
      "Player 2 cards: [3, 1]\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 40%|████      | 4/10 [00:37<00:55,  9.31s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 0 takes action 2 at state Partial joint action: \n",
      "P0 hand: 1 3 5 6 \n",
      "P1 hand: 2 4 5 6 \n",
      "Point card sequence: 2 3 1 \n",
      "Points: 3 2 \n",
      "\n",
      "Player 1 cards: [2, 4]\n",
      "Player 2 cards: [3, 1]\n",
      "Possible actions:  [2, 4, 5, 6]\n",
      "Player 1 takes action 1 at state Partial joint action: 2 \n",
      "P0 hand: 1 3 5 6 \n",
      "P1 hand: 2 4 5 6 \n",
      "Point card sequence: 2 3 1 \n",
      "Points: 3 2 \n",
      "\n",
      "Player 1 cards: [2, 4, 3]\n",
      "Player 2 cards: [3, 1, 2]\n",
      "Player 0 takes action 0 at state Partial joint action: \n",
      "P0 hand: 1 5 6 \n",
      "P1 hand: 4 5 6 \n",
      "Point card sequence: 2 3 1 4 \n",
      "Points: 4 2 \n",
      "\n",
      "Player 1 cards: [2, 4, 3]\n",
      "Player 2 cards: [3, 1, 2]\n",
      "Possible actions:  [4, 5, 6]\n",
      "Player 1 takes action 3 at state Partial joint action: 0 \n",
      "P0 hand: 1 5 6 \n",
      "P1 hand: 4 5 6 \n",
      "Point card sequence: 2 3 1 4 \n",
      "Points: 4 2 \n",
      "\n",
      "Player 1 cards: [2, 4, 3, 1]\n",
      "Player 2 cards: [3, 1, 2, 4]\n",
      "Player 0 takes action 4 at state Partial joint action: \n",
      "P0 hand: 5 6 \n",
      "P1 hand: 5 6 \n",
      "Point card sequence: 2 3 1 4 6 \n",
      "Points: 4 6 \n",
      "\n",
      "Player 1 cards: [2, 4, 3, 1]\n",
      "Player 2 cards: [3, 1, 2, 4]\n",
      "Possible actions:  [5, 6]\n",
      "Player 1 takes action 5 at state Partial joint action: 4 \n",
      "P0 hand: 5 6 \n",
      "P1 hand: 5 6 \n",
      "Point card sequence: 2 3 1 4 6 \n",
      "Points: 4 6 \n",
      "\n",
      "Player 1 cards: [2, 4, 3, 1, 5]\n",
      "Player 2 cards: [3, 1, 2, 4, 6]\n",
      "Player 0 takes action 1 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 1 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: []\n",
      "Player 2 cards: []\n",
      "Possible actions:  [1, 2, 3, 4, 5, 6]\n",
      "Player 1 takes action 0 at state Partial joint action: 1 \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 1 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [2]\n",
      "Player 2 cards: [1]\n",
      "Player 0 takes action 3 at state Partial joint action: \n",
      "P0 hand: 1 3 4 5 6 \n",
      "P1 hand: 2 3 4 5 6 \n",
      "Point card sequence: 1 3 \n",
      "Points: 1 0 \n",
      "\n",
      "Player 1 cards: [2]\n",
      "Player 2 cards: [1]\n",
      "Possible actions:  [2, 3, 4, 5, 6]\n",
      "Player 1 takes action 2 at state Partial joint action: 3 \n",
      "P0 hand: 1 3 4 5 6 \n",
      "P1 hand: 2 3 4 5 6 \n",
      "Point card sequence: 1 3 \n",
      "Points: 1 0 \n",
      "\n",
      "Player 1 cards: [2, 4]\n",
      "Player 2 cards: [1, 3]\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 50%|█████     | 5/10 [00:46<00:46,  9.37s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 0 takes action 2 at state Partial joint action: \n",
      "P0 hand: 1 3 5 6 \n",
      "P1 hand: 2 4 5 6 \n",
      "Point card sequence: 1 3 2 \n",
      "Points: 4 0 \n",
      "\n",
      "Player 1 cards: [2, 4]\n",
      "Player 2 cards: [1, 3]\n",
      "Possible actions:  [2, 4, 5, 6]\n",
      "Player 1 takes action 4 at state Partial joint action: 2 \n",
      "P0 hand: 1 3 5 6 \n",
      "P1 hand: 2 4 5 6 \n",
      "Point card sequence: 1 3 2 \n",
      "Points: 4 0 \n",
      "\n",
      "Player 1 cards: [2, 4, 3]\n",
      "Player 2 cards: [1, 3, 5]\n",
      "Player 0 takes action 0 at state Partial joint action: \n",
      "P0 hand: 1 5 6 \n",
      "P1 hand: 2 4 6 \n",
      "Point card sequence: 1 3 2 5 \n",
      "Points: 4 2 \n",
      "\n",
      "Player 1 cards: [2, 4, 3]\n",
      "Player 2 cards: [1, 3, 5]\n",
      "Possible actions:  [2, 4, 6]\n",
      "Player 1 takes action 1 at state Partial joint action: 0 \n",
      "P0 hand: 1 5 6 \n",
      "P1 hand: 2 4 6 \n",
      "Point card sequence: 1 3 2 5 \n",
      "Points: 4 2 \n",
      "\n",
      "Player 1 cards: [2, 4, 3, 1]\n",
      "Player 2 cards: [1, 3, 5, 2]\n",
      "Player 0 takes action 4 at state Partial joint action: \n",
      "P0 hand: 5 6 \n",
      "P1 hand: 4 6 \n",
      "Point card sequence: 1 3 2 5 4 \n",
      "Points: 4 7 \n",
      "\n",
      "Player 1 cards: [2, 4, 3, 1]\n",
      "Player 2 cards: [1, 3, 5, 2]\n",
      "Possible actions:  [4, 6]\n",
      "Player 1 takes action 3 at state Partial joint action: 4 \n",
      "P0 hand: 5 6 \n",
      "P1 hand: 4 6 \n",
      "Point card sequence: 1 3 2 5 4 \n",
      "Points: 4 7 \n",
      "\n",
      "Player 1 cards: [2, 4, 3, 1, 5]\n",
      "Player 2 cards: [1, 3, 5, 2, 4]\n",
      "Player 0 takes action 5 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 6 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: []\n",
      "Player 2 cards: []\n",
      "Possible actions:  [1, 2, 3, 4, 5, 6]\n",
      "Player 1 takes action 5 at state Partial joint action: 5 \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 6 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [6]\n",
      "Player 2 cards: [6]\n",
      "Player 0 takes action 4 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 5 \n",
      "P1 hand: 1 2 3 4 5 \n",
      "Point card sequence: 6 4 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [6]\n",
      "Player 2 cards: [6]\n",
      "Possible actions:  [1, 2, 3, 4, 5]\n",
      "Player 1 takes action 4 at state Partial joint action: 4 \n",
      "P0 hand: 1 2 3 4 5 \n",
      "P1 hand: 1 2 3 4 5 \n",
      "Point card sequence: 6 4 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [6, 5]\n",
      "Player 2 cards: [6, 5]\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 60%|██████    | 6/10 [00:55<00:37,  9.34s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 0 takes action 0 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 \n",
      "P1 hand: 1 2 3 4 \n",
      "Point card sequence: 6 4 1 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [6, 5]\n",
      "Player 2 cards: [6, 5]\n",
      "Possible actions:  [1, 2, 3, 4]\n",
      "Player 1 takes action 3 at state Partial joint action: 0 \n",
      "P0 hand: 1 2 3 4 \n",
      "P1 hand: 1 2 3 4 \n",
      "Point card sequence: 6 4 1 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [6, 5, 1]\n",
      "Player 2 cards: [6, 5, 4]\n",
      "Player 0 takes action 2 at state Partial joint action: \n",
      "P0 hand: 2 3 4 \n",
      "P1 hand: 1 2 3 \n",
      "Point card sequence: 6 4 1 5 \n",
      "Points: 0 1 \n",
      "\n",
      "Player 1 cards: [6, 5, 1]\n",
      "Player 2 cards: [6, 5, 4]\n",
      "Possible actions:  [1, 2, 3]\n",
      "Player 1 takes action 0 at state Partial joint action: 2 \n",
      "P0 hand: 2 3 4 \n",
      "P1 hand: 1 2 3 \n",
      "Point card sequence: 6 4 1 5 \n",
      "Points: 0 1 \n",
      "\n",
      "Player 1 cards: [6, 5, 1, 3]\n",
      "Player 2 cards: [6, 5, 4, 1]\n",
      "Player 0 takes action 1 at state Partial joint action: \n",
      "P0 hand: 2 4 \n",
      "P1 hand: 2 3 \n",
      "Point card sequence: 6 4 1 5 2 \n",
      "Points: 5 1 \n",
      "\n",
      "Player 1 cards: [6, 5, 1, 3]\n",
      "Player 2 cards: [6, 5, 4, 1]\n",
      "Possible actions:  [2, 3]\n",
      "Player 1 takes action 2 at state Partial joint action: 1 \n",
      "P0 hand: 2 4 \n",
      "P1 hand: 2 3 \n",
      "Point card sequence: 6 4 1 5 2 \n",
      "Points: 5 1 \n",
      "\n",
      "Player 1 cards: [6, 5, 1, 3, 2]\n",
      "Player 2 cards: [6, 5, 4, 1, 3]\n",
      "Player 0 takes action 0 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 1 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: []\n",
      "Player 2 cards: []\n",
      "Possible actions:  [1, 2, 3, 4, 5, 6]\n",
      "Player 1 takes action 0 at state Partial joint action: 0 \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 1 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [1]\n",
      "Player 2 cards: [1]\n",
      "Player 0 takes action 5 at state Partial joint action: \n",
      "P0 hand: 2 3 4 5 6 \n",
      "P1 hand: 2 3 4 5 6 \n",
      "Point card sequence: 1 5 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [1]\n",
      "Player 2 cards: [1]\n",
      "Possible actions:  [2, 3, 4, 5, 6]\n",
      "Player 1 takes action 5 at state Partial joint action: 5 \n",
      "P0 hand: 2 3 4 5 6 \n",
      "P1 hand: 2 3 4 5 6 \n",
      "Point card sequence: 1 5 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [1, 6]\n",
      "Player 2 cards: [1, 6]\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 70%|███████   | 7/10 [01:05<00:27,  9.29s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 0 takes action 4 at state Partial joint action: \n",
      "P0 hand: 2 3 4 5 \n",
      "P1 hand: 2 3 4 5 \n",
      "Point card sequence: 1 5 6 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [1, 6]\n",
      "Player 2 cards: [1, 6]\n",
      "Possible actions:  [2, 3, 4, 5]\n",
      "Player 1 takes action 4 at state Partial joint action: 4 \n",
      "P0 hand: 2 3 4 5 \n",
      "P1 hand: 2 3 4 5 \n",
      "Point card sequence: 1 5 6 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [1, 6, 5]\n",
      "Player 2 cards: [1, 6, 5]\n",
      "Player 0 takes action 1 at state Partial joint action: \n",
      "P0 hand: 2 3 4 \n",
      "P1 hand: 2 3 4 \n",
      "Point card sequence: 1 5 6 2 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [1, 6, 5]\n",
      "Player 2 cards: [1, 6, 5]\n",
      "Possible actions:  [2, 3, 4]\n",
      "Player 1 takes action 3 at state Partial joint action: 1 \n",
      "P0 hand: 2 3 4 \n",
      "P1 hand: 2 3 4 \n",
      "Point card sequence: 1 5 6 2 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [1, 6, 5, 2]\n",
      "Player 2 cards: [1, 6, 5, 4]\n",
      "Player 0 takes action 2 at state Partial joint action: \n",
      "P0 hand: 3 4 \n",
      "P1 hand: 2 3 \n",
      "Point card sequence: 1 5 6 2 4 \n",
      "Points: 0 2 \n",
      "\n",
      "Player 1 cards: [1, 6, 5, 2]\n",
      "Player 2 cards: [1, 6, 5, 4]\n",
      "Possible actions:  [2, 3]\n",
      "Player 1 takes action 1 at state Partial joint action: 2 \n",
      "P0 hand: 3 4 \n",
      "P1 hand: 2 3 \n",
      "Point card sequence: 1 5 6 2 4 \n",
      "Points: 0 2 \n",
      "\n",
      "Player 1 cards: [1, 6, 5, 2, 3]\n",
      "Player 2 cards: [1, 6, 5, 4, 2]\n",
      "Player 0 takes action 5 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 5 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: []\n",
      "Player 2 cards: []\n",
      "Possible actions:  [1, 2, 3, 4, 5, 6]\n",
      "Player 1 takes action 4 at state Partial joint action: 5 \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 5 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [6]\n",
      "Player 2 cards: [5]\n",
      "Player 0 takes action 4 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 5 \n",
      "P1 hand: 1 2 3 4 6 \n",
      "Point card sequence: 5 3 \n",
      "Points: 5 0 \n",
      "\n",
      "Player 1 cards: [6]\n",
      "Player 2 cards: [5]\n",
      "Possible actions:  [1, 2, 3, 4, 6]\n",
      "Player 1 takes action 1 at state Partial joint action: 4 \n",
      "P0 hand: 1 2 3 4 5 \n",
      "P1 hand: 1 2 3 4 6 \n",
      "Point card sequence: 5 3 \n",
      "Points: 5 0 \n",
      "\n",
      "Player 1 cards: [6, 5]\n",
      "Player 2 cards: [5, 2]\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 80%|████████  | 8/10 [01:14<00:18,  9.27s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 0 takes action 2 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 \n",
      "P1 hand: 1 3 4 6 \n",
      "Point card sequence: 5 3 6 \n",
      "Points: 8 0 \n",
      "\n",
      "Player 1 cards: [6, 5]\n",
      "Player 2 cards: [5, 2]\n",
      "Possible actions:  [1, 3, 4, 6]\n",
      "Player 1 takes action 3 at state Partial joint action: 2 \n",
      "P0 hand: 1 2 3 4 \n",
      "P1 hand: 1 3 4 6 \n",
      "Point card sequence: 5 3 6 \n",
      "Points: 8 0 \n",
      "\n",
      "Player 1 cards: [6, 5, 3]\n",
      "Player 2 cards: [5, 2, 4]\n",
      "Player 0 takes action 0 at state Partial joint action: \n",
      "P0 hand: 1 2 4 \n",
      "P1 hand: 1 3 6 \n",
      "Point card sequence: 5 3 6 1 \n",
      "Points: 8 6 \n",
      "\n",
      "Player 1 cards: [6, 5, 3]\n",
      "Player 2 cards: [5, 2, 4]\n",
      "Possible actions:  [1, 3, 6]\n",
      "Player 1 takes action 0 at state Partial joint action: 0 \n",
      "P0 hand: 1 2 4 \n",
      "P1 hand: 1 3 6 \n",
      "Point card sequence: 5 3 6 1 \n",
      "Points: 8 6 \n",
      "\n",
      "Player 1 cards: [6, 5, 3, 1]\n",
      "Player 2 cards: [5, 2, 4, 1]\n",
      "Player 0 takes action 1 at state Partial joint action: \n",
      "P0 hand: 2 4 \n",
      "P1 hand: 3 6 \n",
      "Point card sequence: 5 3 6 1 2 \n",
      "Points: 8 6 \n",
      "\n",
      "Player 1 cards: [6, 5, 3, 1]\n",
      "Player 2 cards: [5, 2, 4, 1]\n",
      "Possible actions:  [3, 6]\n",
      "Player 1 takes action 2 at state Partial joint action: 1 \n",
      "P0 hand: 2 4 \n",
      "P1 hand: 3 6 \n",
      "Point card sequence: 5 3 6 1 2 \n",
      "Points: 8 6 \n",
      "\n",
      "Player 1 cards: [6, 5, 3, 1, 2]\n",
      "Player 2 cards: [5, 2, 4, 1, 3]\n",
      "Player 0 takes action 3 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 3 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: []\n",
      "Player 2 cards: []\n",
      "Possible actions:  [1, 2, 3, 4, 5, 6]\n",
      "Player 1 takes action 3 at state Partial joint action: 3 \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 3 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [4]\n",
      "Player 2 cards: [4]\n",
      "Player 0 takes action 1 at state Partial joint action: \n",
      "P0 hand: 1 2 3 5 6 \n",
      "P1 hand: 1 2 3 5 6 \n",
      "Point card sequence: 3 2 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [4]\n",
      "Player 2 cards: [4]\n",
      "Possible actions:  [1, 2, 3, 5, 6]\n",
      "Player 1 takes action 1 at state Partial joint action: 1 \n",
      "P0 hand: 1 2 3 5 6 \n",
      "P1 hand: 1 2 3 5 6 \n",
      "Point card sequence: 3 2 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [4, 2]\n",
      "Player 2 cards: [4, 2]\n",
      "Player 0 takes action 5 at state Partial joint action: \n",
      "P0 hand: 1 3 5 6 \n",
      "P1 hand: 1 3 5 6 \n",
      "Point card sequence: 3 2 5 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [4, 2]\n",
      "Player 2 cards: [4, 2]\n",
      "Possible actions:  [1, 3, 5, 6]\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 90%|█████████ | 9/10 [01:23<00:09,  9.30s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 1 takes action 5 at state Partial joint action: 5 \n",
      "P0 hand: 1 3 5 6 \n",
      "P1 hand: 1 3 5 6 \n",
      "Point card sequence: 3 2 5 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [4, 2, 6]\n",
      "Player 2 cards: [4, 2, 6]\n",
      "Player 0 takes action 2 at state Partial joint action: \n",
      "P0 hand: 1 3 5 \n",
      "P1 hand: 1 3 5 \n",
      "Point card sequence: 3 2 5 4 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [4, 2, 6]\n",
      "Player 2 cards: [4, 2, 6]\n",
      "Possible actions:  [1, 3, 5]\n",
      "Player 1 takes action 4 at state Partial joint action: 2 \n",
      "P0 hand: 1 3 5 \n",
      "P1 hand: 1 3 5 \n",
      "Point card sequence: 3 2 5 4 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [4, 2, 6, 3]\n",
      "Player 2 cards: [4, 2, 6, 5]\n",
      "Player 0 takes action 0 at state Partial joint action: \n",
      "P0 hand: 1 5 \n",
      "P1 hand: 1 3 \n",
      "Point card sequence: 3 2 5 4 1 \n",
      "Points: 0 4 \n",
      "\n",
      "Player 1 cards: [4, 2, 6, 3]\n",
      "Player 2 cards: [4, 2, 6, 5]\n",
      "Possible actions:  [1, 3]\n",
      "Player 1 takes action 2 at state Partial joint action: 0 \n",
      "P0 hand: 1 5 \n",
      "P1 hand: 1 3 \n",
      "Point card sequence: 3 2 5 4 1 \n",
      "Points: 0 4 \n",
      "\n",
      "Player 1 cards: [4, 2, 6, 3, 1]\n",
      "Player 2 cards: [4, 2, 6, 5, 3]\n",
      "Player 0 takes action 1 at state Partial joint action: \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 3 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: []\n",
      "Player 2 cards: []\n",
      "Possible actions:  [1, 2, 3, 4, 5, 6]\n",
      "Player 1 takes action 0 at state Partial joint action: 1 \n",
      "P0 hand: 1 2 3 4 5 6 \n",
      "P1 hand: 1 2 3 4 5 6 \n",
      "Point card sequence: 3 \n",
      "Points: 0 0 \n",
      "\n",
      "Player 1 cards: [2]\n",
      "Player 2 cards: [1]\n",
      "Player 0 takes action 5 at state Partial joint action: \n",
      "P0 hand: 1 3 4 5 6 \n",
      "P1 hand: 2 3 4 5 6 \n",
      "Point card sequence: 3 6 \n",
      "Points: 3 0 \n",
      "\n",
      "Player 1 cards: [2]\n",
      "Player 2 cards: [1]\n",
      "Possible actions:  [2, 3, 4, 5, 6]\n",
      "Player 1 takes action 5 at state Partial joint action: 5 \n",
      "P0 hand: 1 3 4 5 6 \n",
      "P1 hand: 2 3 4 5 6 \n",
      "Point card sequence: 3 6 \n",
      "Points: 3 0 \n",
      "\n",
      "Player 1 cards: [2, 6]\n",
      "Player 2 cards: [1, 6]\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 10/10 [01:32<00:00,  9.28s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 0 takes action 4 at state Partial joint action: \n",
      "P0 hand: 1 3 4 5 \n",
      "P1 hand: 2 3 4 5 \n",
      "Point card sequence: 3 6 5 \n",
      "Points: 3 0 \n",
      "\n",
      "Player 1 cards: [2, 6]\n",
      "Player 2 cards: [1, 6]\n",
      "Possible actions:  [2, 3, 4, 5]\n",
      "Player 1 takes action 4 at state Partial joint action: 4 \n",
      "P0 hand: 1 3 4 5 \n",
      "P1 hand: 2 3 4 5 \n",
      "Point card sequence: 3 6 5 \n",
      "Points: 3 0 \n",
      "\n",
      "Player 1 cards: [2, 6, 5]\n",
      "Player 2 cards: [1, 6, 5]\n",
      "Player 0 takes action 0 at state Partial joint action: \n",
      "P0 hand: 1 3 4 \n",
      "P1 hand: 2 3 4 \n",
      "Point card sequence: 3 6 5 1 \n",
      "Points: 3 0 \n",
      "\n",
      "Player 1 cards: [2, 6, 5]\n",
      "Player 2 cards: [1, 6, 5]\n",
      "Possible actions:  [2, 3, 4]\n",
      "Player 1 takes action 3 at state Partial joint action: 0 \n",
      "P0 hand: 1 3 4 \n",
      "P1 hand: 2 3 4 \n",
      "Point card sequence: 3 6 5 1 \n",
      "Points: 3 0 \n",
      "\n",
      "Player 1 cards: [2, 6, 5, 1]\n",
      "Player 2 cards: [1, 6, 5, 4]\n",
      "Player 0 takes action 2 at state Partial joint action: \n",
      "P0 hand: 3 4 \n",
      "P1 hand: 2 3 \n",
      "Point card sequence: 3 6 5 1 2 \n",
      "Points: 3 1 \n",
      "\n",
      "Player 1 cards: [2, 6, 5, 1]\n",
      "Player 2 cards: [1, 6, 5, 4]\n",
      "Possible actions:  [2, 3]\n",
      "Player 1 takes action 1 at state Partial joint action: 2 \n",
      "P0 hand: 3 4 \n",
      "P1 hand: 2 3 \n",
      "Point card sequence: 3 6 5 1 2 \n",
      "Points: 3 1 \n",
      "\n",
      "Player 1 cards: [2, 6, 5, 1, 3]\n",
      "Player 2 cards: [1, 6, 5, 4, 2]\n",
      "Player 1: 4.6\n",
      "Player 2: 10.7\n",
      "Player 1 winrate: 0.2\n",
      "Player 2 winrate: 0.8\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "(4.6, 10.7, 0.2, 0.8)"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# custom SMMiniMaxBot vs alpha beta bot\n",
    "\n",
    "# Load the gooftspiel game. remember to load the turn based version\n",
    "game = pyspiel.load_game_as_turn_based(\"goofspiel\", {\"num_cards\": 6})\n",
    "\n",
    "# Create random state\n",
    "random_state = np.random.RandomState(6)\n",
    "\n",
    "# Set up SMMiniMaxBot\n",
    "sm_minimax_bot = SMMinimaxCustomBot(player_id=1, rng=random_state, num_rollouts=10)\n",
    "\n",
    "# Set up alpha beta bot\n",
    "alpha_beta_bot = AlphaBetaBot(game, player_id=0, rng=random_state, depth=4, num_rollouts=10)\n",
    "\n",
    "# Run the experiment\n",
    "run_gops_experiment(game, [alpha_beta_bot, sm_minimax_bot], num_episodes=10, rng=random_state)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 100/100 [15:14<00:00,  9.15s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 1: 6.32\n",
      "Player 2: 9.59\n",
      "Player 1 winrate: 0.25\n",
      "Player 2 winrate: 0.75\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "(6.32, 9.59, 0.25, 0.75)"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# custom SMMiniMaxBot vs alpha beta bot\n",
    "\n",
    "# Load the gooftspiel game. remember to load the turn based version\n",
    "game = pyspiel.load_game_as_turn_based(\"goofspiel\", {\"num_cards\": 6})\n",
    "\n",
    "# Create random state\n",
    "random_state = np.random.RandomState(6)\n",
    "\n",
    "# Set up SMMiniMaxBot\n",
    "sm_minimax_bot = SMMinimaxCustomBot(player_id=1, rng=random_state, num_rollouts=10)\n",
    "\n",
    "# Set up alpha beta bot\n",
    "alpha_beta_bot = AlphaBetaBot(game, player_id=0, rng=random_state, depth=4, num_rollouts=10)\n",
    "\n",
    "# Run the experiment\n",
    "run_gops_experiment(game, [alpha_beta_bot, sm_minimax_bot], num_episodes=100, rng=random_state)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 100/100 [13:34<00:00,  8.14s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 1: 9.31\n",
      "Player 2: 7.87\n",
      "Player 1 winrate: 0.63\n",
      "Player 2 winrate: 0.37\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "(9.31, 7.87, 0.63, 0.37)"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# custom SMMiniMaxBot vs alpha beta bot\n",
    "\n",
    "# Load the gooftspiel game. remember to load the turn based version\n",
    "game = pyspiel.load_game_as_turn_based(\"goofspiel\", {\"num_cards\": 6})\n",
    "\n",
    "# Create random state\n",
    "random_state = np.random.RandomState(6)\n",
    "\n",
    "# Set up alpha beta bot\n",
    "alpha_beta_bot = AlphaBetaBot(game, player_id=0, rng=random_state, depth=5, num_rollouts=10)\n",
    "\n",
    "# Set up SMMiniMaxBot\n",
    "sm_minimax_bot = SMMinimaxCustomBot(player_id=1, random_state=random_state, num_rollouts=10)\n",
    "\n",
    "# Run the experiment\n",
    "run_gops_experiment(game, [alpha_beta_bot, sm_minimax_bot], num_episodes=100, rng=random_state)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "(0 in frozenset({0, 1})) and (1 in frozenset({0, 1}))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 10/10 [00:00<00:00, 36.02it/s]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Player 1: 0.0\n",
      "Player 2: 1.2\n",
      "Player 1 winrate: 0.0\n",
      "Player 2 winrate: 1.0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "(0.0, 1.2, 0.0, 1.0)"
      ]
     },
     "execution_count": 16,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# custom SMMiniMaxBot vs alpha beta bot\n",
    "\n",
    "# Load the gooftspiel game. remember to load the turn based version\n",
    "game = pyspiel.load_game_as_turn_based(\"goofspiel\", {\"num_cards\": 3})\n",
    "\n",
    "# Create random state\n",
    "random_state = np.random.RandomState(6)\n",
    "\n",
    "# Set up alpha beta bot\n",
    "alpha_beta_bot = AlphaBetaBot(game, player_id=0, rng=random_state, depth=5, num_rollouts=10)\n",
    "\n",
    "# Set up SMMiniMaxBot\n",
    "sm_minimax_bot = SMMinimaxCustomBot(player_id=1, random_state=random_state, num_rollouts=10)\n",
    "\n",
    "# Run the experiment\n",
    "run_gops_experiment(game, [alpha_beta_bot, sm_minimax_bot], num_episodes=10, rng=random_state)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "LLMgames",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
