{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "ebd91bf5",
   "metadata": {},
   "source": [
    "### Notebook for Running Full Game of SKATE\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c5c04663",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np \n",
    "import pickle\n",
    "import tqdm\n",
    "\n",
    "from tournament_utils import (get_valid_task_with_options, score_model_on_question)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d6adcac2",
   "metadata": {},
   "outputs": [],
   "source": [
    "new_model = 'insert-new-model-name'\n",
    "# Update this to reflect path to latest game database csv\n",
    "latest_csv = 'skate/workshop-experiments/skate-tournament/game_database.csv'\n",
    "new_csv_name = 'new_game_database.csv'\n",
    "\n",
    "players = [] # make list of players already in game + new one."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "727b8988",
   "metadata": {},
   "outputs": [],
   "source": [
    "archive = []\n",
    "for _ in range(50):\n",
    "    print(f\"Doing Round {_+1}/50\")\n",
    "    archive_copy = archive.copy()\n",
    "    task, gt_answer, options, embedding = get_valid_task_with_options(new_model, archive_copy, _+1)\n",
    "    if task:\n",
    "        score = score_model_on_question(\n",
    "            model=new_model,\n",
    "            problem=task,\n",
    "            ground_truth_answer=gt_answer,\n",
    "            distractor_options=options\n",
    "        )[0]\n",
    "        archive.append((task, score, gt_answer, options, embedding))\n",
    "    \n",
    "    with open(f'archive_{new_model}.pkl', 'wb') as f:\n",
    "        pickle.dump(archive, f)\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "1f6e1c5f",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Add the new questions to the CSV file/ game database.\n",
    "\n",
    "with open(f'archive_{new_model}.pkl', 'rb') as f:\n",
    "    data = pickle.load(f)\n",
    "\n",
    "\n",
    "df = pd.read_csv(latest_csv)\n",
    "\n",
    "\n",
    "if new_model not in df.columns:\n",
    "    df[new_model] = np.nan  # Add a new column for the task setter if it doesn't exist\n",
    "\n",
    "for idx, question in enumerate(data):\n",
    "    q_text, score, gt_answer, options, embedding = question\n",
    "\n",
    "    new_row = {\n",
    "        'round_number': idx+1,\n",
    "        'question': q_text,\n",
    "        'ground_truth_answer': gt_answer,\n",
    "        'distractor_options': options,\n",
    "        'task_setter': new_model,\n",
    "        'gpt-4o': np.nan,\n",
    "        'claude-3-5-sonnet-20241022': np.nan,\n",
    "        'gemini-2.0-flash': np.nan,\n",
    "        new_model: score\n",
    "    }\n",
    "    \n",
    "    df = pd.concat([df, pd.DataFrame([new_row])], ignore_index=True)\n",
    "\n",
    "df.to_csv('questions_added.csv', index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f2001805",
   "metadata": {},
   "outputs": [],
   "source": [
    "df = pd.read_csv('saving_run.csv')\n",
    "\n",
    "\n",
    "for idx, row in tqdm.tqdm(df.iterrows(), total=len(df)):\n",
    "    for player in players:\n",
    "        if pd.isna(row[player]):\n",
    "\n",
    "            p, std = score_model_on_question(\n",
    "                model=player,\n",
    "                problem=row['question'],\n",
    "                ground_truth_answer=row['ground_truth_answer'],\n",
    "                distractor_options=row['distractor_options']\n",
    "            )\n",
    "            df.at[idx, player] = p\n",
    "\n",
    "            df.to_csv('saving_run.csv', index=False)\n",
    "    print(f\"Final row scores for all players: {df.loc[idx][players].to_dict()}\")\n",
    "\n",
    "df.to_csv(new_csv_name, index=False)\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "skate_aaai_env",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.18"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
