{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "389837f6",
   "metadata": {},
   "source": [
    "## Getting comparisons on GPQA data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "49fe5dec",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import json\n",
    "events = [name for name in os.listdir('transcript_gpqa/') if '2025' in name]\n",
    "data = []\n",
    "for name in events:\n",
    "    with open(f\"transcript_gpqa/{name}/evaluations.json\", 'r') as file:\n",
    "        data.extend(json.load(file))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9c80729e",
   "metadata": {},
   "outputs": [],
   "source": [
    "models = {\n",
    "    \"Grok 3 Mini\": \"grok-3-mini\",\n",
    "    # \"Gemini 2.5 Flash\": \"gemini-2.5-flash\",\n",
    "    # \"GPT oss 120b\": \"gpt-oss-120b\",\n",
    "    \"Qwen3 235B A22B Instruct 2507\": \"qwen/qwen3-235b-a22b-2507\",\n",
    "    \"Kimi K2 0905\": \"moonshotai/kimi-k2-0905\",\n",
    "    \"Qwen3 Next 80B A3B Instruct\": \"qwen/qwen3-next-80b-a3b-instruct\",\n",
    "    \"Llama 4 Maverick\": \"meta-llama/llama-4-maverick\",\n",
    "    \"DeepSeek V3 0324\": \"deepseek/deepseek-chat-v3-0324\",\n",
    "    \"Gemini 2.5 Flash Lite\": \"gemini-2.5-flash-lite\",\n",
    "    \"Gemini 2.0 Flash\": \"gemini-2.0-flash-001\",\n",
    "    \"Llama 4 Scout\": \"meta-llama/llama-4-scout\",\n",
    "    \"Gemini 2.0 Flash Lite\": \"gemini-2.0-flash-lite-001\",\n",
    "    \"Llama 3.3 70b Instruct\": \"meta-llama/llama-3.3-70b-instruct\",\n",
    "    \"Qwen2.5 72B Instruct\": \"qwen/qwen-2.5-72b-instruct\",\n",
    "    # \"Qwen3 235B A22B\": \"qwen/qwen3-235b-a22b\",\n",
    "    \"Llama 3.1 70B Instruct\": \"meta-llama/llama-3.1-70b-instruct\",\n",
    "    \"GPT 4o mini\": \"gpt-4o-mini-2024-07-18\",\n",
    "    \"GPT 3.5 Turbo\": \"gpt-3.5-turbo\"\n",
    "}\n",
    "\n",
    "model_nicks = list(models.keys())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 50,
   "id": "714c0464",
   "metadata": {},
   "outputs": [],
   "source": [
    "import re\n",
    "\n",
    "data2 = []\n",
    "for scenario_index in range(448):\n",
    "    subset = [i for i in data if i['scenario_index'] == scenario_index][0]\n",
    "\n",
    "    to_append = {\n",
    "        'subdomain': subset['subdomain'],\n",
    "        'question': subset['question'],\n",
    "        'scenario_index': scenario_index,\n",
    "    }\n",
    "\n",
    "    for model in model_nicks:\n",
    "        if subset[model][1] is not None:\n",
    "            to_append[model] = subset[model]\n",
    "        else:\n",
    "            response = subset[model][0]\n",
    "            try:\n",
    "                match = re.search(r'<answer>(.)</answer>', response).group(1)\n",
    "                if match in ['A', 'B', 'C', 'D']:\n",
    "                    to_append[model] = [response, match]\n",
    "                else:\n",
    "                    raise Exception\n",
    "\n",
    "            except:\n",
    "                try:\n",
    "                    match2 = re.search(r'boxed{(.)}', response).group(1)\n",
    "                    if match in ['A', 'B', 'C', 'D']:\n",
    "                        to_append[model] = [response, match2]\n",
    "                    else:\n",
    "                        raise Exception\n",
    "                except:\n",
    "                    to_append[model] = [response, None]\n",
    "    data2.append(to_append)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 65,
   "id": "bf2f7e00",
   "metadata": {},
   "outputs": [],
   "source": [
    "json.dump(data2, open('evaluations_gpqa_parsed.json', 'w'), indent=4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 56,
   "id": "160b9356",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'C', 'C', 'A', 'A', 'A', 'A', 'C']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'A', 'A', 'A', 'A', 'C']\n",
      "15\n",
      "['A', 'B', 'A', None, 'A', 'B', None, 'A', 'C', 'A', 'C', 'C', 'C', 'A', 'A']\n",
      "13\n",
      "['B', None, 'A', None, 'A', 'B', None, 'B', 'B', 'B', 'A', 'B', 'C', 'C', 'B']\n",
      "12\n",
      "['C', None, 'B', None, None, 'A', None, None, None, 'B', 'B', 'C', 'A', 'B', 'D']\n",
      "9\n",
      "['A', None, 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', None, 'A', 'C']\n",
      "12\n",
      "['A', 'A', 'C', None, 'D', 'B', 'A', 'A', 'C', 'B', 'D', 'A', 'B', 'D', 'B']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'B', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "14\n",
      "['C', 'C', 'A', 'A', 'A', 'B', 'B', 'B', 'C', 'B', 'C', 'C', 'C', 'C', 'B']\n",
      "15\n",
      "['C', 'A', 'C', 'A', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'B', 'C', 'C', 'B']\n",
      "15\n",
      "['A', 'B', 'A', 'B', 'A', 'D', None, 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'D']\n",
      "14\n",
      "['B', 'B', 'B', 'B', 'B', 'B', None, 'B', 'B', 'B', 'B', 'B', 'B', 'B', 'A']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'B', 'A', 'B', 'B', 'B', 'D']\n",
      "14\n",
      "['B', 'A', 'A', 'A', 'A', 'A', None, 'A', 'B', 'A', 'A', 'A', 'B', 'B', 'B']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'B', 'B', 'A', 'B']\n",
      "14\n",
      "['A', None, 'A', None, 'A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "12\n",
      "['A', None, 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', None, 'A', 'D', 'C']\n",
      "12\n",
      "['B', 'B', 'D', 'B', 'A', 'A', None, 'B', 'A', 'B', 'A', 'A', 'B', 'A', 'C']\n",
      "14\n",
      "['A', 'A', 'B', 'B', 'A', 'D', 'A', 'D', 'B', 'D', 'A', 'D', 'D', 'D', 'A']\n",
      "15\n",
      "['A', None, 'A', None, 'A', 'A', None, 'A', 'A', 'C', 'A', 'A', 'A', 'A', 'A']\n",
      "12\n",
      "['A', None, 'A', 'C', 'C', 'A', None, None, 'C', 'A', 'B', 'C', 'C', 'B', 'A']\n",
      "12\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'B', 'C']\n",
      "15\n",
      "['A', None, 'A', None, 'A', 'A', None, 'A', 'C', 'D', 'C', 'D', 'A', 'A', 'B']\n",
      "12\n",
      "['D', 'D', 'D', 'C', 'C', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'D']\n",
      "15\n",
      "['B', 'A', 'C', 'A', 'B', 'D', None, 'D', 'B', 'D', 'A', 'D', 'A', 'D', None]\n",
      "13\n",
      "['D', 'D', 'B', 'B', 'A', 'A', None, 'D', 'C', 'B', 'A', 'B', 'A', 'D', 'C']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'D', 'A', 'A', 'D', 'D', 'A', 'A', 'A', 'B', 'D', 'A']\n",
      "15\n",
      "['c', 'A', 'A', 'A', 'C', 'A', None, 'C', 'B', 'A', 'D', 'C', 'C', 'D', 'C']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'C', 'A', 'D', 'A', 'A', 'D', 'C']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'B', 'A', 'A', 'C']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'D', 'A']\n",
      "15\n",
      "['A', 'B', 'A', None, 'B', 'A', None, None, None, 'A', 'A', 'A', 'B', 'A', 'A']\n",
      "11\n",
      "['A', 'A', 'C', 'A', 'C', 'D', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'A']\n",
      "15\n",
      "['C', 'A', 'C', 'A', 'A', 'A', None, 'C', 'C', 'A', 'C', 'B', 'C', 'C', 'A']\n",
      "14\n",
      "['B', 'B', 'B', 'B', 'B', 'B', 'A', 'B', 'B', 'B', 'B', 'B', 'B', 'B', 'C']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'B', 'A']\n",
      "15\n",
      "['D', 'A', 'D', 'A', 'A', 'A', 'A', 'D', 'C', 'D', 'A', None, 'A', 'C', 'A']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'C', 'C', 'C', 'D', 'D', 'D', 'C', 'D', None]\n",
      "14\n",
      "['A', 'B', 'B', 'D', 'A', 'B', 'A', 'B', 'B', 'B', 'A', 'B', 'B', 'B', 'D']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "14\n",
      "['A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'A', 'A', None]\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'B', 'A']\n",
      "14\n",
      "['B', 'B', 'B', 'B', 'B', 'B', 'A', 'B', None, 'B', 'C', 'B', 'A', 'A', 'B']\n",
      "14\n",
      "['B', 'B', 'C', 'B', 'A', 'B', 'B', 'B', 'B', 'B', 'A', 'C', 'C', 'B', 'B']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'C', 'A', 'D', 'C']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'D', 'A', 'A', 'A', 'A', 'A', 'D', 'A', 'D', 'A']\n",
      "15\n",
      "['A', 'D', 'B', None, 'A', 'A', 'A', 'D', 'C', 'D', 'A', 'A', 'A', 'A', 'A']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'B', 'A', 'A', 'A', 'A', 'B', 'A', 'B', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'C', 'D', 'D', 'D', None, 'D', None, 'B', 'A', 'B', 'A', 'C', 'A']\n",
      "13\n",
      "['A', 'A', 'C', 'A', 'A', 'A', 'A', 'A', 'C', 'B', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'B', 'C', 'A', 'A', 'A', 'B', 'B', 'C', 'B', 'B', 'A', 'A', 'D', 'C']\n",
      "15\n",
      "['A', None, 'A', None, 'A', 'B', None, 'A', None, 'B', 'A', 'B', 'A', 'D', 'D']\n",
      "11\n",
      "['A', None, 'A', None, 'A', 'C', None, 'D', None, 'D', 'B', 'B', 'D', 'A', 'A']\n",
      "11\n",
      "['D', 'B', 'B', 'B', 'D', 'D', 'D', 'D', 'B', 'D', 'B', 'A', 'B', 'B', 'C']\n",
      "15\n",
      "['C', None, 'A', None, 'D', 'D', 'D', 'A', 'C', 'C', 'A', 'B', 'C', 'D', 'D']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'C', 'A', 'A', 'C', 'C', 'C', 'C', 'C', 'C', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', None, 'A', 'B', 'A', 'B', 'B', 'B', 'A', 'B', 'C', 'B', 'D', 'A', 'B']\n",
      "14\n",
      "['A', None, 'A', 'A', 'A', 'B', 'A', 'A', 'B', 'B', 'B', 'A', 'A', 'A', 'D']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'D', 'A', 'D', 'A', 'A', 'A', 'A', 'A', 'D', 'D']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D']\n",
      "15\n",
      "['C', 'A', 'A', 'D', 'C', 'C', None, 'C', 'D', 'C', 'C', 'D', 'D', 'D', 'C']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'C', 'C', 'A', 'C', 'C', 'B', 'B']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'C', 'A', 'A', 'A', 'C', 'B']\n",
      "15\n",
      "['A', 'A', 'B', 'A', 'B', 'A', 'C', 'B', 'B', 'A', 'C', 'C', 'C', 'B', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'C', 'A', 'A', 'B', None, 'A', 'C', 'C', 'C', 'A', 'B']\n",
      "14\n",
      "['C', 'C', 'A', 'C', 'A', 'A', 'A', 'B', 'A', 'C', 'B', 'D', 'C', 'A', 'A']\n",
      "15\n",
      "['B', 'B', 'B', 'B', 'B', 'B', 'C', 'B', 'B', 'B', 'C', 'B', 'A', 'D', 'C']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'D', None, 'B', 'D', 'A', 'A', 'B', 'B', 'A', 'B']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'C']\n",
      "15\n",
      "['D', None, 'B', None, 'A', 'A', None, 'A', 'D', 'C', 'A', 'A', 'A', 'B', 'D']\n",
      "12\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', None, 'A', 'A', 'B', 'A', 'A']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'B', None, 'B', None, 'B', 'A', 'B', 'B', 'B', 'B']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B']\n",
      "15\n",
      "['D', 'D', 'D', 'D', 'D', 'D', None, 'D', 'B', 'A', 'A', None, 'A', 'A', 'D']\n",
      "13\n",
      "['A', None, 'C', None, 'C', 'A', None, 'A', 'C', 'C', None, 'C', 'A', 'A', 'A']\n",
      "11\n",
      "['D', None, 'D', 'A', 'C', 'B', 'D', 'D', 'A', 'A', 'A', 'B', 'A', 'A', 'B']\n",
      "14\n",
      "['A', 'A', 'C', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'C', 'B', 'C']\n",
      "14\n",
      "['C', None, 'C', 'A', 'A', 'A', 'A', None, 'C', 'A', 'A', 'A', 'A', 'C', 'C']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'C', 'A', 'A', 'D', 'C', 'D', 'A', 'B', 'C', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', None, 'A', 'A', 'C', 'A', 'A', 'A', 'A', 'B', 'A', 'C', None]\n",
      "13\n",
      "['B', 'B', 'D', 'B', 'D', 'B', 'B', 'D', 'B', 'B', 'B', 'B', 'B', 'D', 'D']\n",
      "15\n",
      "['A', 'D', 'D', 'D', 'A', 'D', 'A', None, 'C', 'C', 'D', 'B', 'C', 'B', 'A']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'D', 'A', 'A', 'A', 'D', 'A', 'D', 'D', 'A', 'D', 'D']\n",
      "15\n",
      "['A', None, 'D', 'A', 'A', 'A', 'D', 'C', 'C', 'D', 'D', 'C', 'C', 'C', 'D']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'C', 'C', 'A', 'D', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', None, 'B', None, None, 'B', 'D', 'C', 'D', 'C', 'D', 'C', 'C']\n",
      "12\n",
      "['D', 'D', 'D', 'D', 'D', 'C', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'A']\n",
      "15\n",
      "['A', None, 'B', 'A', 'B', 'B', 'B', 'B', 'A', 'B', 'A', 'A', 'A', 'A', 'A']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'D', 'D', 'D', 'A', 'C', 'D', 'D', 'D', 'D', 'B']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'C', 'A', 'B', 'A', 'A', None, 'A', 'D']\n",
      "13\n",
      "['A', 'B', 'A', 'D', 'C', 'D', 'D', 'B', 'B', 'A', 'A', 'A', 'D', 'B', 'C']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'A', 'A', 'A', 'D', 'D', 'D', 'A']\n",
      "15\n",
      "['A', None, 'A', 'A', 'A', 'A', None, 'A', 'A', 'D', 'B', 'A', 'A', 'A', 'D']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'B', 'B', 'A', 'A', None, 'B', 'A', 'A', 'A', 'A', 'A']\n",
      "14\n",
      "['A', 'A', 'C', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'B', 'C', 'A']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'A', 'B', 'C']\n",
      "15\n",
      "['A', 'A', 'A', None, 'B', 'A', None, None, None, 'D', 'A', 'A', 'A', 'A', 'B']\n",
      "11\n",
      "['C', None, 'A', None, 'A', 'C', '3', None, 'C', 'C', None, 'A', 'D', 'A', 'A']\n",
      "11\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'A', 'A', None]\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'B', 'C']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'A']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'D']\n",
      "14\n",
      "['A', 'D', 'C', None, 'B', 'B', None, 'A', 'B', 'B', 'A', 'B', 'A', 'B', 'B']\n",
      "13\n",
      "['C', 'A', 'A', 'C', 'A', 'C', 'A', 'C', None, 'C', 'C', 'C', 'A', 'C', 'B']\n",
      "14\n",
      "['A', None, 'A', None, 'A', 'A', None, 'A', 'C', None, 'C', 'A', None, 'B', 'C']\n",
      "10\n",
      "['C', None, 'B', None, 'C', 'C', None, 'C', 'C', 'A', 'C', 'A', 'B', 'C', 'C']\n",
      "12\n",
      "['A', None, 'C', None, 'C', 'C', None, 'D', 'C', 'C', 'A', 'C', 'A', 'B', 'D']\n",
      "12\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D']\n",
      "15\n",
      "['A', 'B', 'A', 'A', 'B', 'B', 'B', 'A', 'A', 'D', 'A', 'A', 'B', 'D', 'B']\n",
      "15\n",
      "['A', None, 'A', None, None, 'B', None, 'A', 'B', 'B', None, 'B', 'B', 'D', 'D']\n",
      "10\n",
      "['A', 'A', 'A', 'D', 'A', 'A', None, 'A', 'A', 'A', 'A', 'B', 'A', 'A', 'D']\n",
      "14\n",
      "['B', 'D', 'D', 'B', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'B']\n",
      "15\n",
      "['A', None, 'B', None, 'A', 'A', None, None, 'B', 'B', 'D', 'A', 'B', 'B', 'B']\n",
      "11\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'A', 'A', 'C', 'A', 'C', 'C', 'C']\n",
      "15\n",
      "['A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', None, 'B', 'A', 'C', 'D', 'B']\n",
      "13\n",
      "['A', 'A', 'A', None, 'A', 'A', 'A', 'D', None, None, 'A', 'C', 'A', None, 'C']\n",
      "11\n",
      "['A', None, 'A', None, 'D', 'D', None, 'D', 'C', 'A', 'A', 'D', 'D', 'C', 'C']\n",
      "12\n",
      "['A', 'C', 'D', None, 'B', 'B', None, 'B', None, 'B', 'A', 'D', 'A', 'B', 'C']\n",
      "12\n",
      "['A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'C', 'D', 'A', 'D', 'A', 'A', 'A', 'A', 'D']\n",
      "15\n",
      "['D', 'B', 'B', 'D', 'A', 'B', 'D', 'B', 'D', 'A', 'D', 'A', 'D', 'D', 'D']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'A', None, 'B', 'A', 'A', 'A', 'A', None]\n",
      "12\n",
      "['C', 'B', 'D', 'B', 'C', 'C', None, 'C', 'C', 'C', 'A', 'D', 'C', 'D', 'B']\n",
      "14\n",
      "['A', None, 'C', None, None, 'A', None, 'A', 'A', 'B', 'C', 'C', 'C', 'A', 'A']\n",
      "11\n",
      "['A', 'A', 'C', None, 'A', None, None, 'C', 'D', 'A', 'B', 'A', 'D', 'D', 'D']\n",
      "12\n",
      "['D', 'A', 'A', 'A', 'C', 'C', None, 'A', 'B', 'C', 'A', 'B', 'C', 'B', 'C']\n",
      "14\n",
      "['A', None, 'D', None, None, 'A', None, None, None, 'B', None, None, 'A', 'D', 'A']\n",
      "7\n",
      "['A', None, None, None, None, None, None, 'D', None, 'D', 'D', 'D', 'D', 'D', 'D']\n",
      "8\n",
      "['A', None, None, None, 'A', 'C', None, 'D', 'C', 'D', 'A', 'A', 'C', 'A', 'A']\n",
      "11\n",
      "['A', 'A', None, 'A', 'C', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "14\n",
      "['A', None, 'A', None, 'A', 'A', None, None, 'B', 'B', 'A', 'B', 'A', 'B', 'A']\n",
      "11\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'B']\n",
      "15\n",
      "['C', 'C', 'C', 'C', 'C', 'C', 'A', 'C', 'C', 'C', 'A', 'C', 'C', 'C', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'B', 'A']\n",
      "14\n",
      "['B', 'B', 'B', 'B', 'B', 'B', 'B', 'B', 'B', 'B', 'B', 'B', 'B', 'B', 'B']\n",
      "15\n",
      "['A', None, 'A', None, 'B', 'C', None, 'A', 'B', 'B', 'B', 'A', 'B', 'A', 'A']\n",
      "12\n",
      "['B', 'B', 'A', 'A', 'A', 'B', 'B', 'A', 'B', 'A', 'A', 'A', 'A', 'B', 'C']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['C', 'C', 'C', 'B', 'C', 'A', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C']\n",
      "15\n",
      "['A', None, 'C', 'C', 'B', 'C', None, 'D', 'C', 'B', 'A', 'C', 'B', 'B', 'B']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C']\n",
      "15\n",
      "['A', 'D', 'A', None, 'D', 'B', 'D', 'A', 'A', 'C', None, 'C', 'A', 'A', 'A']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'D', 'A', 'C', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', None, 'D', 'A', 'B', 'C', 'D']\n",
      "14\n",
      "['A', 'A', 'D', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'C', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', None, 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'C', 'A', 'D', 'D']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'D', 'D', 'C', 'C', 'B', 'D', 'B', 'D', 'D', 'B']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'D', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', None, 'D', None, 'A', 'A', 'A', 'D', None, 'A', 'D', 'D', 'C', 'A', 'D']\n",
      "12\n",
      "['A', 'A', 'A', 'A', 'B', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'B', 'A', 'B']\n",
      "15\n",
      "['B', 'C', 'B', 'D', 'B', 'B', 'D', 'C', 'C', 'B', 'B', 'D', 'B', 'C', 'B']\n",
      "15\n",
      "['C', 'A', 'B', 'A', 'C', 'A', None, 'C', 'C', 'B', None, 'C', 'B', 'C', 'A']\n",
      "13\n",
      "['C', None, 'C', None, 'A', 'A', None, 'C', 'C', 'D', 'D', 'C', 'A', 'B', 'A']\n",
      "12\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'A', 'C', 'A', 'B', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'A', 'D', 'A', 'A', 'D']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'B', 'C', 'D']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', None]\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'D', None, 'A', 'A', 'B', 'B', 'B', 'B', 'C', 'C']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'A']\n",
      "14\n",
      "['C', 'C', 'A', 'C', 'C', 'C', None, 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C']\n",
      "14\n",
      "['A', 'A', 'A', None, 'A', 'A', None, None, 'A', 'A', 'A', 'A', 'A', 'A', 'D']\n",
      "12\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'C']\n",
      "14\n",
      "['A', 'C', 'A', 'A', 'D', 'C', 'D', None, 'A', 'D', 'D', 'D', 'A', 'D', 'A']\n",
      "14\n",
      "['C', None, 'A', 'C', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'C', 'C', 'A']\n",
      "14\n",
      "['C', 'C', 'A', 'C', 'C', 'C', 'A', 'C', 'C', 'A', 'A', 'C', 'A', 'C', 'D']\n",
      "15\n",
      "['A', None, 'B', None, 'D', 'B', None, 'D', 'A', 'D', 'D', 'A', 'D', 'D', 'A']\n",
      "12\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'A', 'A', 'A', 'B', None]\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'B', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'A', 'A', 'A', 'B', 'B', 'D', 'D']\n",
      "15\n",
      "['A', 'A', None, 'D', 'D', 'A', 'A', 'A', 'D', 'A', 'A', 'D', 'D', 'A', 'C']\n",
      "14\n",
      "['A', 'B', 'B', 'B', 'A', 'B', 'B', 'B', 'B', 'B', 'B', 'B', 'B', 'B', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['C', None, 'A', None, 'B', 'A', 'C', 'A', 'C', 'C', 'B', 'A', 'B', 'B', 'C']\n",
      "13\n",
      "['C', None, 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'D', 'A', 'D']\n",
      "14\n",
      "['A', 'D', 'B', 'A', 'A', 'D', 'B', None, 'B', 'C', 'D', 'A', 'D', 'B', 'B']\n",
      "14\n",
      "['A', 'A', 'B', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, None, 'A', 'C', None, 'A', 'C', 'D', 'A']\n",
      "12\n",
      "['D', None, 'C', None, 'D', 'A', None, 'D', 'D', 'D', None, 'D', 'D', 'D', 'A']\n",
      "11\n",
      "['A', None, 'C', None, 'A', 'A', 'D', 'A', None, 'C', 'B', 'D', 'D', 'C', 'B']\n",
      "12\n",
      "['D', None, 'D', None, 'D', 'D', None, 'D', 'D', 'C', 'D', 'D', 'A', 'D', 'D']\n",
      "12\n",
      "['A', 'C', 'A', 'B', 'C', 'B', 'C', 'B', 'D', 'B', 'C', 'C', 'C', 'C', 'C']\n",
      "15\n",
      "['C', None, 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'C', 'C', None, 'C', None, 'A', 'C', 'A', 'C', 'A', 'A']\n",
      "13\n",
      "['A', 'D', 'A', 'A', 'A', 'D', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'B']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'B', 'B', 'A', 'D', 'D', 'D', 'C']\n",
      "15\n",
      "['B', 'A', 'C', 'B', 'A', 'C', 'B', 'C', 'A', 'B', 'C', 'A', 'C', 'B', 'C']\n",
      "15\n",
      "['A', 'A', 'A', None, 'A', 'A', 'A', None, 'A', 'C', 'A', 'A', 'A', 'A', 'A']\n",
      "13\n",
      "['B', 'B', 'B', None, 'A', 'B', 'B', 'D', 'B', 'B', 'B', 'D', 'B', 'B', 'B']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'C', 'B', 'C', 'B', 'A', 'C', 'C', 'B', None]\n",
      "14\n",
      "['A', 'C', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'C', 'B', 'C', 'C']\n",
      "15\n",
      "['A', None, 'A', None, 'B', 'B', None, 'B', 'B', None, 'B', 'D', 'D', 'A', 'D']\n",
      "11\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'D', 'B', None, 'B', 'A', 'B', 'B', 'B', 'B']\n",
      "14\n",
      "['A', None, 'A', 'A', 'A', 'B', 'A', 'C', 'B', 'A', 'A', 'A', 'A', 'A', 'D']\n",
      "14\n",
      "['A', 'A', 'A', None, 'A', 'D', None, None, 'A', 'C', 'A', 'D', 'A', 'C', 'A']\n",
      "12\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'C', 'B', 'C', 'C', 'C', 'B', 'C', 'C', 'B', 'C', 'D', 'C', 'D', 'D']\n",
      "15\n",
      "['A', None, None, None, 'C', 'A', None, 'A', 'A', 'C', 'A', 'D', 'D', 'D', 'C']\n",
      "11\n",
      "['C', None, 'A', None, 'D', 'C', None, 'A', 'D', 'B', 'B', 'C', None, 'C', 'C']\n",
      "11\n",
      "['C', 'A', None, None, 'C', 'A', 'A', 'C', None, 'A', 'A', 'C', 'A', 'A', 'C']\n",
      "12\n",
      "['D', None, None, None, 'C', 'D', None, None, 'D', 'C', 'B', 'C', 'B', 'D', 'D']\n",
      "10\n",
      "['C', 'C', 'C', 'B', 'C', 'B', 'B', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'B']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', None, 'D', 'A', 'B', 'D', None, 'D', 'D', 'A', None, 'D', 'D', 'D', 'B']\n",
      "12\n",
      "['A', None, 'D', None, 'B', 'D', None, 'A', 'D', 'D', 'A', 'D', 'D', 'D', 'B']\n",
      "12\n",
      "['A', None, 'A', 'A', 'B', 'B', 'D', 'B', 'B', 'B', 'A', 'A', 'A', 'C', 'B']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'D', 'C', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'B', 'B', 'B', 'A', 'B', 'B', 'B', 'B', 'B', 'B']\n",
      "15\n",
      "['A', 'A', 'D', 'A', 'C', 'D', None, 'B', 'D', 'D', 'A', 'C', 'D', 'D', 'D']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', None]\n",
      "14\n",
      "['A', 'A', 'B', 'A', 'A', 'B', 'A', 'A', 'A', 'B', 'B', 'A', 'A', 'B', 'D']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'D']\n",
      "15\n",
      "['A', None, 'A', None, 'A', None, None, 'A', 'A', 'D', 'D', 'B', 'D', 'B', 'B']\n",
      "11\n",
      "['C', 'C', 'D', None, 'C', 'D', 'C', 'D', 'C', 'C', 'C', 'C', 'D', 'C', 'C']\n",
      "14\n",
      "['A', None, None, None, 'D', 'A', None, 'D', 'D', 'D', 'D', 'D', 'A', 'C', 'D']\n",
      "11\n",
      "['B', 'B', 'B', 'B', 'B', 'B', 'B', 'B', 'B', 'B', None, 'B', 'B', 'A', None]\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'A', 'C', 'A', 'D', 'A']\n",
      "15\n",
      "['B', None, 'B', None, None, 'B', None, 'B', 'B', 'B', 'B', 'B', 'B', 'B', 'A']\n",
      "11\n",
      "['A', 'A', 'A', 'A', 'A', 'B', None, 'A', 'A', 'A', 'A', 'B', 'A', 'A', 'A']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'C', 'A', 'A', 'A', 'A', 'A', 'D', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'A', 'A', 'B', 'A', 'B']\n",
      "15\n",
      "['B', None, None, None, 'B', 'B', None, 'D', None, 'B', 'A', 'A', 'D', 'D', 'D']\n",
      "10\n",
      "['A', None, 'B', None, None, 'B', None, 'A', None, 'B', 'B', 'B', 'B', 'B', 'C']\n",
      "10\n",
      "['D', None, 'A', 'D', 'D', 'D', None, 'D', None, 'D', 'D', 'D', 'D', 'B', 'C']\n",
      "12\n",
      "['A', 'A', 'A', None, 'A', 'D', None, 'A', 'A', 'A', 'A', 'D', 'A', 'D', 'A']\n",
      "13\n",
      "['A', None, 'B', None, 'B', 'A', None, 'D', None, 'C', 'D', 'A', 'B', 'B', 'A']\n",
      "11\n",
      "['A', None, 'A', None, 'D', 'A', None, 'A', 'D', 'D', 'B', 'C', 'D', 'B', 'C']\n",
      "12\n",
      "['A', None, None, None, 'A', 'A', None, 'C', 'B', 'C', 'A', 'C', 'D', 'D', 'B']\n",
      "11\n",
      "['A', None, 'A', None, 'A', 'B', None, 'A', None, None, None, 'B', 'D', 'D', 'C']\n",
      "9\n",
      "['C', None, 'A', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'B', None]\n",
      "13\n",
      "['A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "14\n",
      "['A', 'D', 'D', 'D', 'B', 'D', 'B', 'D', 'D', 'A', 'D', 'C', 'A', 'D', 'D']\n",
      "15\n",
      "['C', None, None, None, 'C', 'C', None, 'D', 'B', 'B', 'B', 'D', 'B', 'B', 'D']\n",
      "11\n",
      "['A', None, 'C', None, 'A', 'B', None, 'C', 'C', 'B', 'C', 'C', 'C', 'C', 'B']\n",
      "12\n",
      "['A', 'A', 'A', None, 'A', 'A', None, 'C', None, 'A', 'D', 'C', 'C', 'A', 'C']\n",
      "12\n",
      "['A', None, 'A', None, None, None, None, 'A', None, 'B', 'B', 'D', 'D', 'B', 'A']\n",
      "9\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['C', 'C', 'C', None, 'C', 'C', None, 'C', None, 'A', 'C', 'C', 'C', 'C', 'C']\n",
      "12\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', None, 'D', None, 'B', 'B', None, 'B', 'D', 'B', 'D', 'A', 'A', 'C', 'D']\n",
      "12\n",
      "['C', 'A', 'A', 'C', 'C', 'C', 'A', 'C', 'A', 'A', 'C', 'D', 'A', 'D', 'C']\n",
      "15\n",
      "['A', 'B', 'D', 'A', 'C', 'C', 'A', 'B', None, 'C', 'A', 'C', 'B', 'B', 'B']\n",
      "14\n",
      "['D', 'C', 'A', 'D', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'D', 'C', 'C', 'C']\n",
      "15\n",
      "['A', 'A', 'C', 'A', 'A', 'A', None, 'A', 'A', None, 'C', 'D', 'C', 'B', 'D']\n",
      "13\n",
      "['A', 'A', 'C', 'A', 'A', 'B', 'D', 'D', 'B', 'D', 'A', 'D', 'A', 'A', 'D']\n",
      "15\n",
      "['A', None, 'C', None, 'D', 'A', None, None, 'D', 'A', 'A', 'D', 'A', 'D', 'D']\n",
      "11\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'D', 'D', 'B', 'D', 'B', 'D', 'B']\n",
      "15\n",
      "['C', None, 'B', None, 'B', 'A', None, 'A', 'B', 'A', 'A', 'B', 'C', 'D', 'A']\n",
      "12\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['C', 'C', 'C', 'D', 'C', 'C', 'D', 'D', 'C', 'C', 'D', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['C', None, 'A', 'A', 'A', None, 'D', 'D', None, 'D', 'A', 'A', 'A', 'A', 'A']\n",
      "12\n",
      "['D', None, 'D', None, 'A', 'D', None, 'D', 'D', 'C', 'A', 'C', 'C', 'D', 'D']\n",
      "12\n",
      "['D', None, 'C', None, 'D', 'D', 'D', 'D', 'A', 'D', 'D', 'C', 'D', 'A', 'C']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D']\n",
      "15\n",
      "['A', 'B', 'B', 'B', 'A', 'D', 'A', 'C', None, 'C', 'A', 'C', 'B', 'B', 'B']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'A', 'A', 'A', 'B', 'A', 'B', 'A']\n",
      "15\n",
      "['A', 'C', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'B', 'A', 'A', None, 'B', 'A', 'B', 'C', 'A', 'C']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', None, 'B', 'A', 'A', None, 'A', 'A']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'C', 'D', 'D', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'B']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'B', None, 'A', None, 'A', 'B', 'B', 'A', 'A', 'A']\n",
      "13\n",
      "['A', 'D', 'A', 'D', 'D', 'D', 'D', 'D', None, 'D', 'D', 'D', 'D', 'D', 'D']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'C', 'A', 'A', 'D', 'D', 'C']\n",
      "14\n",
      "['C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'A']\n",
      "15\n",
      "['A', None, 'B', None, 'A', 'A', None, None, None, 'B', 'B', 'B', 'B', 'B', 'A']\n",
      "10\n",
      "['D', 'A', 'A', 'A', 'A', 'A', 'D', 'A', None, 'A', 'A', 'A', 'A', 'A', 'B']\n",
      "14\n",
      "['C', None, 'A', None, 'A', 'B', None, 'C', 'A', 'D', 'A', 'D', 'A', 'C', 'B']\n",
      "12\n",
      "['D', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'D', 'D']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'B', 'A', 'A', 'B', 'C', 'C']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'B', 'A', 'B', 'B', 'A', 'B', 'A', 'B', 'C', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'B', None, None, 'B', 'B', None, 'B', 'A', 'D']\n",
      "12\n",
      "['A', 'A', 'B', 'C', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'C', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', None, 'A', None, 'A', 'A', None, 'A', 'A', 'A', 'B', 'A', 'B', 'A', 'D']\n",
      "12\n",
      "['A', 'A', 'B', 'A', 'A', 'B', None, 'A', 'A', 'A', 'B', 'A', 'C', 'C', 'B']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'C']\n",
      "14\n",
      "['A', None, 'B', 'A', 'D', 'C', None, 'B', 'C', 'C', 'C', 'B', 'C', 'C', 'D']\n",
      "13\n",
      "['A', 'C', 'A', None, 'A', 'A', None, 'A', 'A', 'B', 'A', 'B', 'A', 'B', None]\n",
      "12\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'B', 'C', 'C']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "14\n",
      "['A', 'C', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'B', 'D', 'D', 'D', 'D', 'D']\n",
      "15\n",
      "['D', 'A', 'A', 'D', 'A', 'D', 'A', 'A', 'D', 'A', 'A', 'D', 'D', 'A', 'D']\n",
      "15\n",
      "['B', 'A', 'B', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'B', 'A', 'B', 'B']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['D', None, 'B', None, 'A', 'B', 'D', None, 'B', 'D', 'D', 'B', 'A', 'C', 'A']\n",
      "12\n",
      "['B', 'B', 'B', 'B', 'B', 'B', 'B', 'B', None, 'B', 'B', 'B', 'B', 'B', 'A']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A']\n",
      "14\n",
      "['B', 'A', 'A', None, 'B', 'B', None, 'A', 'B', 'A', 'B', 'A', 'A', 'A', 'A']\n",
      "13\n",
      "['C', 'C', 'C', 'C', 'C', 'A', 'C', 'C', 'C', 'A', 'C', 'A', 'C', 'C', 'C']\n",
      "15\n",
      "['A', 'A', 'B', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'B', 'B', 'A', 'C', 'C']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'C', 'A', 'A', 'B', 'A', 'C']\n",
      "15\n",
      "['A', 'A', 'B', 'A', 'C', 'A', None, 'A', None, 'A', 'C', 'C', 'D', 'A', 'A']\n",
      "13\n",
      "['A', None, 'A', None, 'A', 'D', None, None, None, 'D', 'B', 'B', 'B', 'D', 'B']\n",
      "10\n",
      "['C', 'C', 'A', 'A', 'A', 'C', 'C', 'A', 'A', 'C', 'D', 'C', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'D']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, None, 'A', 'D', 'B', 'A', 'D', 'C', 'C']\n",
      "13\n",
      "['A', None, 'A', 'A', 'D', 'D', 'B', 'A', 'A', 'A', 'A', 'B', 'D', 'D', 'B']\n",
      "14\n",
      "['A', 'A', 'B', 'A', 'A', 'A', None, None, None, 'A', 'A', 'A', 'A', 'B', 'D']\n",
      "12\n",
      "['B', None, 'A', 'A', 'B', 'B', None, 'A', None, 'A', 'A', 'A', 'C', 'A', 'A']\n",
      "12\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'D', 'A', 'A', 'D', 'A', 'A', 'D', 'D', 'D']\n",
      "15\n",
      "['A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'B', 'A']\n",
      "14\n",
      "['A', 'C', 'A', None, None, 'C', None, 'A', 'C', 'C', 'C', 'A', 'C', 'C', 'D']\n",
      "12\n",
      "['C', 'A', 'A', 'A', 'A', 'C', 'C', 'A', 'A', 'C', 'A', 'C', 'C', 'D', 'A']\n",
      "15\n",
      "['C', 'A', 'B', 'B', 'A', 'D', 'D', 'C', 'D', 'B', 'B', 'B', 'A', 'D', 'B']\n",
      "15\n",
      "['A', 'A', 'B', None, 'C', 'D', None, 'A', None, None, 'A', 'D', 'D', 'D', 'C']\n",
      "11\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'C', 'C', 'A', 'C', 'C', 'C', 'C', 'C', 'C']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, None, None, 'C', 'C', 'A', 'C', 'B', 'B']\n",
      "12\n",
      "['B', None, 'A', None, 'A', 'C', None, 'A', None, 'A', None, 'B', 'A', 'A', 'A']\n",
      "10\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'D', 'A', 'A', 'D', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'B']\n",
      "15\n",
      "['A', 'C', 'A', 'A', 'A', 'C', 'A', 'C', None, 'C', 'C', 'B', 'C', 'B', 'C']\n",
      "14\n",
      "['D', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C']\n",
      "15\n",
      "['A', 'B', 'C', 'B', 'B', 'B', 'B', 'B', 'B', 'A', 'B', 'A', 'C', 'A', 'B']\n",
      "15\n",
      "['D', 'A', 'A', 'B', 'C', 'C', 'A', 'C', 'A', 'A', 'A', 'A', 'B', 'A', 'A']\n",
      "15\n",
      "['A', 'A', None, 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'D', 'A', 'C', 'B']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'D', 'A', 'C', 'A', 'B']\n",
      "15\n",
      "['D', 'D', 'A', 'A', 'A', 'B', 'D', 'C', 'B', 'D', 'A', 'C', 'B', 'B', 'B']\n",
      "15\n",
      "['A', 'A', 'D', 'A', 'A', 'A', None, 'A', 'A', 'D', 'A', 'D', 'D', 'D', 'B']\n",
      "14\n",
      "['A', 'A', 'B', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'B', 'A', 'D', 'B', 'C']\n",
      "15\n",
      "['A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', None]\n",
      "13\n",
      "['A', 'A', 'D', 'D', 'A', 'A', 'C', 'A', 'A', 'A', 'A', 'C', 'C', 'C', 'C']\n",
      "15\n",
      "['A', None, 'B', None, 'A', 'B', None, 'B', 'B', 'B', None, 'C', 'C', 'A', 'B']\n",
      "11\n",
      "['A', None, 'B', None, None, None, None, None, None, 'C', 'A', 'A', 'C', 'C', 'B']\n",
      "8\n",
      "['C', None, 'C', 'C', 'C', 'D', None, 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C']\n",
      "13\n",
      "['A', None, 'D', None, 'C', 'B', None, 'D', 'A', 'A', 'D', 'C', 'A', 'B', 'D']\n",
      "12\n",
      "['C', 'A', 'A', 'C', 'A', 'A', 'C', 'C', 'A', 'C', 'A', 'C', 'A', 'C', 'C']\n",
      "15\n",
      "['A', None, 'D', None, 'A', 'B', None, 'A', None, 'B', 'B', 'B', 'B', 'B', 'A']\n",
      "11\n",
      "['C', 'A', 'A', 'A', 'C', 'C', 'C', 'C', 'A', 'C', 'A', 'C', 'C', 'C', 'A']\n",
      "15\n",
      "['A', None, 'C', None, None, 'A', None, 'C', 'C', 'C', None, 'C', 'A', 'C', 'C']\n",
      "10\n",
      "['B', None, 'B', None, 'B', 'B', None, 'B', 'B', 'C', 'B', 'D', 'B', 'A', 'C']\n",
      "12\n",
      "['A', 'A', 'B', None, 'B', 'A', None, 'A', 'D', 'B', 'B', 'B', 'B', 'B', 'B']\n",
      "13\n",
      "['A', None, 'C', 'A', 'A', 'C', 'C', 'B', 'C', 'C', 'C', 'C', 'C', 'B', 'C']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'C']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C']\n",
      "14\n",
      "['B', None, 'B', None, None, 'B', None, 'B', 'B', 'D', 'B', 'B', 'B', 'B', 'B']\n",
      "11\n",
      "['A', 'A', 'A', None, None, None, None, None, 'A', 'B', 'B', 'D', 'C', 'A', 'B']\n",
      "10\n",
      "['A', None, 'C', None, 'A', 'A', 'D', 'D', 'C', 'D', 'A', 'D', 'A', 'D', 'C']\n",
      "13\n",
      "['A', 'A', 'A', 'C', 'C', 'A', 'C', 'A', None, 'A', 'A', 'A', 'C', 'B', 'A']\n",
      "14\n",
      "['A', 'B', 'A', None, 'A', 'A', 'B', 'B', None, 'B', 'A', 'A', 'A', 'B', 'B']\n",
      "13\n",
      "['A', None, 'A', None, 'A', 'B', None, 'B', 'A', 'C', 'A', 'A', 'A', 'A', 'B']\n",
      "12\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', None, 'A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'D', 'D']\n",
      "13\n",
      "['A', 'A', 'B', 'A', 'A', 'A', 'A', 'A', None, 'A', 'D', 'A', 'A', 'A', 'C']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'B', 'B', 'B', 'A']\n",
      "14\n",
      "['B', None, 'B', 'B', 'A', 'B', None, 'B', 'B', 'B', 'B', 'B', 'B', 'D', None]\n",
      "12\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'D', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['C', None, 'A', 'A', 'C', 'A', None, 'C', 'C', 'A', 'A', 'A', 'C', 'C', 'B']\n",
      "13\n",
      "['A', 'A', 'D', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'D', 'B', 'B', 'B', 'B']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'C', 'B', 'B']\n",
      "15\n",
      "['A', None, 'C', 'A', 'A', 'A', None, 'C', 'C', 'C', 'A', 'B', 'B', 'B', 'A']\n",
      "13\n",
      "['A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'C', 'A', 'A', 'A', 'D', 'D', 'D']\n",
      "14\n",
      "['A', 'D', 'A', 'A', 'B', 'A', 'B', 'B', 'B', 'B', 'A', 'B', 'B', 'A', 'A']\n",
      "15\n",
      "['A', None, 'A', None, 'A', 'C', 'A', 'A', 'A', 'D', 'A', 'A', 'D', 'A', 'A']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'C', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B']\n",
      "15\n",
      "['B', 'A', 'A', 'A', 'B', 'A', None, 'D', 'B', 'C', 'C', 'D', 'A', 'B', 'A']\n",
      "14\n",
      "['A', 'C', 'D', 'B', 'C', 'C', None, 'C', 'C', 'C', 'B', 'C', 'B', 'C', 'C']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'C', 'A', 'B', 'B']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['C', 'C', 'C', None, 'C', 'D', None, 'D', 'D', 'D', 'C', 'C', 'D', 'C', 'A']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'B', 'A', 'B', 'A', 'B', 'A', 'A', 'A', 'D', 'D']\n",
      "15\n",
      "['C', None, 'B', None, 'B', 'C', None, None, 'B', 'B', 'C', 'B', 'B', 'B', 'B']\n",
      "11\n",
      "['A', 'A', 'A', 'A', 'A', 'D', 'D', 'B', None, 'B', 'A', 'B', 'A', 'D', 'D']\n",
      "14\n",
      "['C', None, 'B', 'A', 'C', 'A', 'A', 'B', 'B', 'A', 'A', 'A', 'B', 'C', None]\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'A']\n",
      "15\n",
      "['C', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'C', 'C', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'D', 'D', 'A', '4', 'A', 'C', 'C', 'C', 'D', 'A', 'A', 'B']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'D', 'C', 'A', 'A', 'C', 'A', 'C', 'A', 'C']\n",
      "15\n",
      "['B', 'A', 'D', 'A', 'B', 'D', 'A', 'C', 'A', 'B', 'A', 'A', 'D', 'B', 'B']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'B', 'A', 'C', 'A', 'A', 'A', 'B', 'A', 'A', 'B']\n",
      "15\n",
      "['A', 'A', 'A', 'B', 'A', 'A', None, 'D', 'A', 'A', 'B', 'B', 'B', 'A', 'A']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'C', None, 'A', 'A', 'A', 'A', 'A', 'C', 'D', 'A']\n",
      "14\n",
      "['D', None, 'C', None, 'B', 'C', None, 'A', 'A', 'C', 'C', 'C', 'C', 'C', 'C']\n",
      "12\n",
      "['A', 'A', 'C', 'A', 'A', 'A', None, 'C', 'A', 'C', 'A', 'C', 'A', 'C', 'A']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'C', 'A', 'C', 'A', 'A', 'A', None]\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'B', 'C', 'A', 'C', 'C', 'A', 'C', 'C', 'C', 'C']\n",
      "15\n",
      "['A', 'A', 'A', None, 'A', 'B', None, 'B', 'A', 'B', 'B', 'B', 'D', 'D', 'B']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'C', 'B']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'D', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'C']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'A']\n",
      "14\n",
      "['A', 'C', 'A', 'C', 'C', 'C', 'C', 'D', 'C', 'A', 'C', 'B', 'B', 'D', 'D']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', None, 'A', None, 'A', 'A', None, 'C', 'A', 'C', 'A', 'A', 'A', 'A', 'A']\n",
      "12\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "14\n",
      "['D', 'A', 'A', 'A', 'D', 'D', 'D', 'D', 'A', 'D', 'D', 'D', 'D', 'D', 'D']\n",
      "15\n",
      "['A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'A', 'A']\n",
      "14\n",
      "['A', None, 'B', None, 'A', 'A', None, None, 'B', 'B', 'A', 'A', 'B', 'B', 'B']\n",
      "11\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B']\n",
      "15\n",
      "['A', 'A', 'D', 'A', 'D', 'A', None, 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "14\n",
      "['A', None, 'B', 'A', 'B', 'A', 'A', None, 'A', 'B', 'C', 'B', 'B', 'A', 'B']\n",
      "13\n",
      "['D', 'C', 'A', None, 'C', 'D', None, 'A', 'A', 'C', 'A', 'D', 'C', 'D', 'A']\n",
      "13\n",
      "['A', 'C', 'C', 'A', 'C', 'C', 'D', 'D', None, 'D', 'D', 'C', 'C', 'C', None]\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'B', 'A', 'B', 'C', 'D', 'C', 'D']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', None, 'A', 'A', 'C', 'D', None, 'B', 'A', 'C', 'B', 'D', 'B', 'C', 'C']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'C', 'A', 'B', 'B', 'A']\n",
      "15\n",
      "['D', 'D', 'A', 'D', 'A', 'D', None, 'A', 'A', 'D', 'A', 'A', 'A', 'C', 'C']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'A', 'C', 'B', 'A', 'B', 'B', 'B', 'A', 'B', 'A', 'B']\n",
      "15\n",
      "['A', 'A', 'B', 'B', 'A', 'A', 'A', 'B', 'A', 'D', 'B', 'D', 'B', 'D', 'A']\n",
      "15\n",
      "['A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'A', 'D', 'A', 'B', 'B', 'D', 'B']\n",
      "15\n",
      "['A', 'B', 'B', 'A', 'A', 'C', None, 'B', 'B', 'B', 'A', 'B', 'B', 'A', 'C']\n",
      "14\n",
      "['B', 'A', 'A', 'C', 'C', 'B', 'D', 'A', None, 'A', 'A', 'A', 'C', 'A', 'A']\n",
      "14\n",
      "['B', 'C', 'C', 'B', 'B', 'C', 'B', 'D', 'B', 'B', 'B', 'D', 'B', 'B', 'D']\n",
      "15\n",
      "['B', None, 'A', None, 'A', 'B', 'B', 'D', 'D', 'B', 'B', 'B', 'B', 'B', 'D']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'D', 'D', 'A', 'A', 'D', 'D', 'D', 'D', 'A', 'D']\n",
      "15\n",
      "['A', 'B', 'B', 'A', 'B', 'A', 'D', 'B', 'B', 'B', 'A', 'A', 'D', 'A', 'A']\n",
      "15\n",
      "['D', 'C', None, 'D', 'D', 'D', 'D', 'D', 'C', 'D', 'D', 'D', 'D', 'D', 'D']\n",
      "14\n",
      "['D', 'D', 'D', 'D', 'D', 'D', None, 'D', 'D', 'D', 'A', 'D', 'D', 'D', 'D']\n",
      "14\n",
      "['A', 'A', 'A', 'A', 'B', 'A', 'B', None, 'B', 'D', 'C', 'A', 'C', 'B', 'B']\n",
      "14\n",
      "['C', None, None, None, 'A', 'A', None, 'D', 'A', 'D', 'A', 'D', 'A', 'B', 'B']\n",
      "11\n",
      "['A', 'A', None, 'A', 'A', 'A', 'A', None, 'A', 'A', 'A', 'A', 'C', 'D', 'A']\n",
      "13\n",
      "['D', 'B', 'D', 'B', 'B', 'D', 'D', 'D', None, 'A', 'D', 'A', 'D', 'A', 'D']\n",
      "14\n",
      "['B', None, 'B', None, 'B', 'B', None, 'C', 'B', 'B', 'D', 'D', 'D', 'B', 'B']\n",
      "12\n",
      "['A', 'A', 'A', 'B', 'A', 'A', 'B', 'A', 'D', 'A', 'D', None, 'B', 'B', 'A']\n",
      "14\n",
      "['A', 'A', 'B', 'A', 'B', 'A', 'A', None, None, 'A', 'B', 'C', 'A', 'D', 'C']\n",
      "13\n",
      "['A', 'A', 'A', 'A', 'A', 'A', None, 'A', None, 'A', 'A', 'A', 'C', 'B', 'B']\n",
      "13\n",
      "['A', 'D', 'D', 'D', 'A', 'A', 'D', 'D', 'B', 'B', 'A', 'D', 'A', 'B', 'C']\n",
      "15\n",
      "['C', 'C', 'B', 'C', 'C', 'C', 'C', 'C', 'C', 'A', 'C', 'C', 'C', 'C', 'C']\n",
      "15\n",
      "['A', None, 'A', 'A', 'C', 'A', None, None, None, None, None, 'B', 'C', None, 'B']\n",
      "8\n",
      "['A', 'A', 'D', 'A', 'A', 'A', None, 'B', 'D', 'A', 'A', 'D', 'A', 'A', 'A']\n",
      "14\n",
      "['C', 'B', 'A', 'B', 'B', 'C', None, 'B', None, 'B', 'B', 'C', 'B', 'A', 'D']\n",
      "13\n",
      "['A', 'A', 'B', 'B', 'B', 'A', 'D', 'A', 'B', 'B', 'D', 'B', 'B', 'D', 'D']\n",
      "15\n",
      "['B', 'B', 'B', 'B', 'B', 'B', None, 'B', 'B', 'B', 'A', 'B', 'C', 'B', 'A']\n",
      "14\n",
      "['A', 'D', 'A', 'D', 'D', 'D', None, 'D', None, 'D', 'A', 'A', 'A', 'D', 'D']\n",
      "13\n"
     ]
    }
   ],
   "source": [
    "for item in data2:\n",
    "    # print(item['scenario_index'])\n",
    "    l = [item[i][1] for i in model_nicks]\n",
    "    print(l)\n",
    "    print(len([i for i in l if i is not None]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7291d179",
   "metadata": {},
   "outputs": [],
   "source": [
    "import itertools\n",
    "\n",
    "count = 0\n",
    "for item in data2:\n",
    "    answer_choices = set([item[i][1].upper() for i in model_nicks if item[i][1] is not None])\n",
    "    print(answer_choices)\n",
    "    combos = list(itertools.combinations(answer_choices, 2))\n",
    "    print(combos)\n",
    "    count += len(combos)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 66,
   "id": "a6cfcf76",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "A D\n"
     ]
    }
   ],
   "source": [
    "for answer1, answer2 in combos:\n",
    "    print(answer1, answer2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 78,
   "id": "4087baa5",
   "metadata": {},
   "outputs": [],
   "source": [
    "evaluation = {}\n",
    "\n",
    "model_nicks = ['a','b','c','d']\n",
    "\n",
    "for i in range(4):\n",
    "    evaluation[model_nicks[i]] = []\n",
    "    for answer1, answer2 in [['a','b'], ['a','c']]:\n",
    "\n",
    "        judge_response = 'hi'\n",
    "\n",
    "        evaluation[model_nicks[i]].append([answer1, answer2, judge_response])\n",
    "\n",
    "        # print(evaluation)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 79,
   "id": "300172d3",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'a': [['a', 'b', 'hi'], ['a', 'c', 'hi']],\n",
       " 'b': [['a', 'b', 'hi'], ['a', 'c', 'hi']],\n",
       " 'c': [['a', 'b', 'hi'], ['a', 'c', 'hi']],\n",
       " 'd': [['a', 'b', 'hi'], ['a', 'c', 'hi']]}"
      ]
     },
     "execution_count": 79,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "evaluation"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 101,
   "id": "dcf0c7c1",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "range(425, 448)"
      ]
     },
     "execution_count": 101,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import numpy as np\n",
    "k = 19\n",
    "r = np.linspace(0,448,21)[k:k+2]\n",
    "range(int(r[0]), int(r[1]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "1e523053",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "id": "c91a0851",
   "metadata": {},
   "source": [
    "## getting GPQA comparisons"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "e67f345b",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import json\n",
    "events = [name for name in os.listdir('transcript_gpqa/') if '2025' in name]\n",
    "data = []\n",
    "for name in events:\n",
    "    with open(f\"transcript_gpqa/{name}/evaluations.json\", 'r') as file:\n",
    "        data.extend(json.load(file))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "812ffebc",
   "metadata": {},
   "outputs": [],
   "source": [
    "data = sorted(data, key=lambda x: x['scenario_index'])\n",
    "json.dump(data, open('gpqa_comparisons.json', 'w'), indent=4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e5a4990f",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a0aaa679",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "id": "3abaaa4f",
   "metadata": {},
   "source": [
    "## forming evaluations"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 98,
   "id": "f2454684",
   "metadata": {},
   "outputs": [],
   "source": [
    "models = {\n",
    "    \"Grok 3 Mini\": \"grok-3-mini\",\n",
    "    # \"Gemini 2.5 Flash\": \"gemini-2.5-flash\",\n",
    "    # \"GPT oss 120b\": \"gpt-oss-120b\",\n",
    "    \"Qwen3 235B A22B Instruct 2507\": \"qwen/qwen3-235b-a22b-2507\",\n",
    "    \"Kimi K2 0905\": \"moonshotai/kimi-k2-0905\",\n",
    "    \"Qwen3 Next 80B A3B Instruct\": \"qwen/qwen3-next-80b-a3b-instruct\",\n",
    "    \"Llama 4 Maverick\": \"meta-llama/llama-4-maverick\",\n",
    "    \"DeepSeek V3 0324\": \"deepseek/deepseek-chat-v3-0324\",\n",
    "    \"Gemini 2.5 Flash Lite\": \"gemini-2.5-flash-lite\",\n",
    "    \"Gemini 2.0 Flash\": \"gemini-2.0-flash-001\",\n",
    "    \"Llama 4 Scout\": \"meta-llama/llama-4-scout\",\n",
    "    \"Gemini 2.0 Flash Lite\": \"gemini-2.0-flash-lite-001\",\n",
    "    \"Llama 3.3 70b Instruct\": \"meta-llama/llama-3.3-70b-instruct\",\n",
    "    \"Qwen2.5 72B Instruct\": \"qwen/qwen-2.5-72b-instruct\",\n",
    "    # \"Qwen3 235B A22B\": \"qwen/qwen3-235b-a22b\",\n",
    "    \"Llama 3.1 70B Instruct\": \"meta-llama/llama-3.1-70b-instruct\",\n",
    "    \"GPT 4o mini\": \"gpt-4o-mini-2024-07-18\",\n",
    "    \"GPT 3.5 Turbo\": \"gpt-3.5-turbo\"\n",
    "}\n",
    "\n",
    "model_nicks = list(models.keys())\n",
    "num_models = len(model_nicks)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 100,
   "id": "ef2107da",
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "import re\n",
    "responses = json.load(open('transcript_gpqa/gpqa_responses.json', 'r'))\n",
    "judgments = json.load(open('transcript_gpqa/gpqa_judgments.json', 'r'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 101,
   "id": "1fc89b6b",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Number of judge comparisons without a choice: 17875\n"
     ]
    }
   ],
   "source": [
    "comparisons = []\n",
    "\n",
    "no_choice_count = 0\n",
    "for scenario in range(448):\n",
    "    responses_dict = [i for i in responses if i['scenario_index'] == scenario][0]\n",
    "    judgments_dict = [i for i in judgments if i['scenario_index'] == scenario][0]\n",
    "    for i in range(num_models):\n",
    "        for j in range(num_models):\n",
    "            for k in range(j+1, num_models):\n",
    "                if j == k: continue\n",
    "\n",
    "                answer_j = responses_dict[model_nicks[j]][1]\n",
    "                answer_k = responses_dict[model_nicks[k]][1]\n",
    "\n",
    "                if answer_j is None or answer_k is None: continue\n",
    "                if answer_j == answer_k: \n",
    "                    # comparisons.append([scenario, i, j, k, 0])\n",
    "                    continue\n",
    "\n",
    "                judgment_i = [None, None, None]\n",
    "                for judgment in judgments_dict[model_nicks[i]]:\n",
    "                    if set(judgment[:2]) == set([answer_j, answer_k]) and judgment[2] is not None:\n",
    "                        judgment_i = judgment\n",
    "                        break\n",
    "                if judgment_i[2] is None: continue\n",
    "                \n",
    "                try:\n",
    "                    m = int(re.search(r'<choice>(.)</choice>', judgment_i[2]).group(1))\n",
    "                    if m in [1,2]:\n",
    "                        # if the judge saw answers in the same order as j,k\n",
    "                        if answer_j == judgment_i[0]:\n",
    "                            comparisons.append([scenario, i, j, k, 2-m]) # map {1,2} to {1,0}, i.e. if it chose answer 1, record win for j\n",
    "                        # if the judge saw answers in the opposite order as j,k\n",
    "                        else:\n",
    "                            comparisons.append([scenario, i, j, k, m-1]) # map {1,2} to {0,1}, i.e. if it chose answer 1, record win for k\n",
    "                except:\n",
    "                    no_choice_count += 1\n",
    "                    pass\n",
    "\n",
    "print(f'Number of judge comparisons without a choice: {no_choice_count}')\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 102,
   "id": "b04425a2",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "239588"
      ]
     },
     "execution_count": 102,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "len(comparisons)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "aabf641c",
   "metadata": {},
   "source": [
    "## Training BT models"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 89,
   "id": "0f61ad02",
   "metadata": {},
   "outputs": [],
   "source": [
    "from BT import *\n",
    "from eigentrust import *\n",
    "import random"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 107,
   "id": "2573a70e",
   "metadata": {},
   "outputs": [],
   "source": [
    "def train_vector_bt(model, dataloader, lr, weight_decay, max_epochs, device, save_path=None, normalize=False, use_btd=False):\n",
    "    model.to(device)\n",
    "    optimizer = torch.optim.Adam(model.parameters(), lr=lr, weight_decay=weight_decay)\n",
    "    \n",
    "    if use_btd:\n",
    "        loss_fn = nn.CrossEntropyLoss()\n",
    "    else:\n",
    "        loss_fn = nn.BCELoss()\n",
    "\n",
    "    loss_history = []\n",
    "\n",
    "    for epoch in range(1, max_epochs+1):\n",
    "        total_loss = 0.0\n",
    "        model.train()\n",
    "\n",
    "        for i, j, k, r in dataloader:\n",
    "            i = i.to(device)\n",
    "            j = j.to(device)\n",
    "            k = k.to(device)\n",
    "            r = r.to(device)\n",
    "\n",
    "            if use_btd:\n",
    "                r = r.long()  # CrossEntropyLoss expects long tensor\n",
    "                logits = model(i, j, k)\n",
    "                loss = loss_fn(logits, r) # CE expects logits, unnormalized, as it has built in softmax\n",
    "            else:\n",
    "                p = model(i, j, k)\n",
    "                loss = loss_fn(p, r)\n",
    "\n",
    "            optimizer.zero_grad()\n",
    "            loss.backward()\n",
    "            optimizer.step()\n",
    "\n",
    "            if normalize:\n",
    "                with torch.no_grad():\n",
    "                    model.v.weight.data = F.normalize(model.v.weight.data, p=2, dim=1)\n",
    "\n",
    "            total_loss += loss.item() * r.size(0)\n",
    "\n",
    "        avg_loss = total_loss / len(dataloader.dataset)\n",
    "        loss_history.append(avg_loss)\n",
    "    \n",
    "        if len(loss_history) >= 3 and  np.average(np.abs(np.diff(loss_history[-3:]))) <= .0001:\n",
    "            print('loss converged, breaking')\n",
    "            break\n",
    "\n",
    "        print(f\"Epoch {epoch:>3d}, Loss = {avg_loss:.4f}\")\n",
    "\n",
    "    return loss_history"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 108,
   "id": "9bfd0682",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch   1, Loss = 0.6709\n",
      "Epoch   2, Loss = 0.6659\n",
      "Epoch   3, Loss = 0.6658\n",
      "loss converged, breaking\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "[0.6709230756461904,\n",
       " 0.6658611887882179,\n",
       " 0.6657772519077895,\n",
       " 0.6657622753334899]"
      ]
     },
     "execution_count": 108,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "num_models = len(set([i[1] for i in comparisons]))\n",
    "\n",
    "d = 2\n",
    "NORMALIZE = False\n",
    "USE_BTD = False\n",
    "\n",
    "lr = 1e-3\n",
    "weight_decay = 0\n",
    "max_epochs = 1000\n",
    "\n",
    "batch_size=32\n",
    "dataloader = DataLoader(dataset = Comparisons(comparisons), batch_size=batch_size, shuffle=True)\n",
    "\n",
    "model = VectorBT(num_models, d)\n",
    "train_vector_bt(\n",
    "    model,\n",
    "    dataloader,\n",
    "    lr=lr,\n",
    "    weight_decay=weight_decay,\n",
    "    max_epochs=max_epochs,\n",
    "    device='cpu',\n",
    "    save_path=None,\n",
    "    normalize=NORMALIZE,\n",
    "    use_btd=USE_BTD\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 109,
   "id": "ac04a9a0",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "  1%|          | 8/1000 [00:00<00:00, 1860.93it/s]\n"
     ]
    }
   ],
   "source": [
    "device = 'cpu'\n",
    "T = compute_trust_matrix(model, device)\n",
    "T = row_normalize(T)\n",
    "t = eigentrust(T, alpha=0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 111,
   "id": "26e334b5",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "tensor([0.0846, 0.0885, 0.0656, 0.0880, 0.0771, 0.0741, 0.0664, 0.0746, 0.0666,\n",
       "        0.0607, 0.0629, 0.0564, 0.0521, 0.0438, 0.0386])"
      ]
     },
     "execution_count": 111,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "t"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 122,
   "id": "9862f3b3",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[1, 3, 0, 4, 7, 5, 8, 6, 2, 10, 9, 11, 12, 13, 14]"
      ]
     },
     "execution_count": 122,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "list(reversed(np.argsort(t.numpy())))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 123,
   "id": "918a327c",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Kendall tau distance: 12\n"
     ]
    }
   ],
   "source": [
    "from itertools import combinations\n",
    "\n",
    "def kendall_tau_distance(rank1, rank2):\n",
    "    \"\"\"\n",
    "    Compute the Kendall tau distance between two rankings.\n",
    "    \n",
    "    rank1, rank2: lists of items representing two permutations of the same set.\n",
    "    Returns: integer distance (number of discordant pairs).\n",
    "    \"\"\"\n",
    "    if set(rank1) != set(rank2):\n",
    "        raise ValueError(\"Rankings must contain the same elements\")\n",
    "\n",
    "    # Map each item in rank2 to its position\n",
    "    pos2 = {item: i for i, item in enumerate(rank2)}\n",
    "\n",
    "    # Count discordant pairs\n",
    "    discordant = 0\n",
    "    for i, j in combinations(range(len(rank1)), 2):\n",
    "        a, b = rank1[i], rank1[j]\n",
    "        # Compare orderings in rank1 and rank2\n",
    "        if (pos2[a] - pos2[b]) * (i - j) < 0:\n",
    "            discordant += 1\n",
    "\n",
    "    return discordant\n",
    "\n",
    "\n",
    "# Example usage:\n",
    "rank1 = [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14]       # ground truth\n",
    "rank2 = [1, 3, 0, 4, 7, 5, 8, 6, 2, 10, 9, 11, 12, 13, 14]      # model ranking\n",
    "print(\"Kendall tau distance:\", kendall_tau_distance(rank1, rank2))\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "tf-metal",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.23"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
