{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "218b3baa",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Found 4 JSON files. Processing...\n",
      "  - Successfully processed and cleaned gpt4_evaluation_results.json from 'beaver-7b-v3.0_vs_p-sacpo'\n",
      "  - Successfully processed and cleaned gpt4_evaluation_results.json from 'beaver-7b-v3.0_vs_dpo_naive_42'\n",
      "  - Successfully processed and cleaned gpt4_evaluation_results.json from 'beaver-7b-v3.0_vs_sdpo_10_3_42'\n",
      "  - Successfully processed and cleaned gpt4_evaluation_results.json from 'beaver-7b-v3.0_vs_primal_dual_dpo_3_42_10'\n",
      "\n",
      "Data loading and processing complete!\n",
      "\n",
      "--- Final, Cleaned DataFrame Ready for ELO Calculation ---\n",
      "           model1  score1   model2  score2\n",
      "0  beaver-7b-v3.0    10.0  p-sacpo    10.0\n",
      "1  beaver-7b-v3.0     9.5  p-sacpo     9.0\n",
      "2  beaver-7b-v3.0     7.0  p-sacpo    10.0\n",
      "3  beaver-7b-v3.0    10.0  p-sacpo    10.0\n",
      "4  beaver-7b-v3.0    10.0  p-sacpo    10.0\n",
      "\n",
      "DataFrame Info:\n",
      "<class 'pandas.core.frame.DataFrame'>\n",
      "RangeIndex: 3192 entries, 0 to 3191\n",
      "Data columns (total 4 columns):\n",
      " #   Column  Non-Null Count  Dtype  \n",
      "---  ------  --------------  -----  \n",
      " 0   model1  3192 non-null   object \n",
      " 1   score1  3192 non-null   float64\n",
      " 2   model2  3192 non-null   object \n",
      " 3   score2  3192 non-null   float64\n",
      "dtypes: float64(2), object(2)\n",
      "memory usage: 99.9+ KB\n"
     ]
    }
   ],
   "source": [
    "import random\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "from itertools import combinations\n",
    "\n",
    "import pandas as pd\n",
    "from pathlib import Path\n",
    "import re # <-- Import the regular expression module\n",
    "\n",
    "import pandas as pd\n",
    "from pathlib import Path\n",
    "import re\n",
    "\n",
    "RESULT_DIR = [\"./results/gpt4_tournament/harmlessness\"]\n",
    "reference_model = \"beaver-7b-v3.0\" # <-- CHANGE THIS\n",
    "\n",
    "def load_and_process_results(root_directory: str) -> pd.DataFrame:\n",
    "    \"\"\"\n",
    "    Scans a directory tree for JSON files, intelligently extracts model names and their\n",
    "    corresponding scores based on directory and column naming conventions, and returns\n",
    "    a single, clean DataFrame ready for ELO calculation.\n",
    "    \"\"\"\n",
    "    root_path = Path(root_directory)\n",
    "    if not root_path.is_dir():\n",
    "        print(f\"Error: Directory not found at '{root_directory}'\")\n",
    "        return pd.DataFrame()\n",
    "\n",
    "    all_clean_dfs = []  # A list to hold the clean DataFrames\n",
    "    json_files = list(root_path.rglob('*.json'))\n",
    "    print(f\"Found {len(json_files)} JSON files. Processing...\")\n",
    "\n",
    "    split_pattern = re.compile(r'_vs_', re.IGNORECASE)\n",
    "\n",
    "    for json_path in json_files:\n",
    "        try:\n",
    "            dir_name = json_path.parent.name.strip()\n",
    "            parts = split_pattern.split(dir_name)\n",
    "\n",
    "            if len(parts) != 2:\n",
    "                print(f\"  - WARNING: Skipping directory '{dir_name}'. Could not find a valid '_vs_' separator.\")\n",
    "                continue\n",
    "\n",
    "            model_a, model_b = [part.strip() for part in parts]\n",
    "            \n",
    "            # Read the raw JSON data\n",
    "            temp_df = pd.read_json(json_path, lines=True)\n",
    "\n",
    "            # --- INTELLIGENT RESHAPING LOGIC ---\n",
    "            # Dynamically determine the correct score column names\n",
    "            score_col_a = f\"{model_a}_score\"\n",
    "            score_col_b = f\"{model_b}_score\"\n",
    "\n",
    "            # Check if the expected score columns exist in this file\n",
    "            if score_col_a not in temp_df.columns or score_col_b not in temp_df.columns:\n",
    "                print(f\"  - WARNING: Skipping file '{json_path.name}'. Expected score columns '{score_col_a}' and/or '{score_col_b}' not found.\")\n",
    "                continue\n",
    "\n",
    "            # Create the new, clean DataFrame on the fly\n",
    "            clean_temp_df = pd.DataFrame({\n",
    "                'model1': model_a,\n",
    "                'score1': temp_df[score_col_a],\n",
    "                'model2': model_b,\n",
    "                'score2': temp_df[score_col_b]\n",
    "            })\n",
    "\n",
    "            all_clean_dfs.append(clean_temp_df)\n",
    "            print(f\"  - Successfully processed and cleaned {json_path.name} from '{dir_name}'\")\n",
    "\n",
    "        except Exception as e:\n",
    "            print(f\"  - ERROR: Could not process file {json_path}. Reason: {e}\")\n",
    "\n",
    "    if not all_clean_dfs:\n",
    "        print(\"Processing complete, but no valid data was loaded.\")\n",
    "        return pd.DataFrame()\n",
    "\n",
    "    # Concatenate all the clean DataFrames into the final result\n",
    "    final_df = pd.concat(all_clean_dfs, ignore_index=True)\n",
    "    \n",
    "    # Final check for any rows that might have ended up with missing scores\n",
    "    original_rows = len(final_df)\n",
    "    final_df.dropna(subset=['score1', 'score2'], inplace=True)\n",
    "    if len(final_df) < original_rows:\n",
    "        print(f\"WARNING: Dropped {original_rows - len(final_df)} rows due to missing scores after final assembly.\")\n",
    "    \n",
    "    print(\"\\nData loading and processing complete!\")\n",
    "    return final_df\n",
    "\n",
    "# --- How to use the new all-in-one function ---\n",
    "elo_battles_df = load_and_process_results(RESULT_DIR)\n",
    "\n",
    "if not elo_battles_df.empty:\n",
    "    print(\"\\n--- Final, Cleaned DataFrame Ready for ELO Calculation ---\")\n",
    "    print(elo_battles_df.head())\n",
    "    print(\"\\nDataFrame Info:\")\n",
    "    elo_battles_df.info()\n",
    "\n",
    "    # This DataFrame is now ready to be used by the rest of your ELO script\n",
    "    # battles = create_battles_from_pooled_df(cleaned_battles_df)\n",
    "    # ... and so on\n",
    "    \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d11a6adc",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "Found 5 models: ['beaver-7b-v3.0', 'p-sacpo', 'dpo_naive_42', 'sdpo_10_3_42', 'primal_dual_dpo_3_42_10']\n",
      "Total battles to process: 3192\n",
      "Using 'beaver-7b-v3.0' as the normalization anchor (score = 1000).\n",
      "\n",
      "Starting ELO calculation with 50 trials...\n",
      "\n",
      "==============================\n",
      "== FINAL ELO RATING LEADERBOARD ==\n",
      "==============================\n",
      "beaver-7b-v3.0                          : 1000.00 ± 0.00\n",
      "p-sacpo                                 : 859.50 ± 40.14\n",
      "primal_dual_dpo_3_42_10                 : 766.40 ± 36.78\n",
      "dpo_naive_42                            : 752.76 ± 43.47\n",
      "sdpo_10_3_42                            : 692.42 ± 30.81\n"
     ]
    }
   ],
   "source": [
    "INITIAL_ELO = 1200\n",
    "ELO_DIFFERENCE_DIVISOR = 400\n",
    "K_FACTOR = 32\n",
    "CENTER_ELO = 1000\n",
    "ELO_TRIAL = 50\n",
    "ELO_EPOCH = 10\n",
    "\n",
    "def expected_score(rating_a, rating_b):\n",
    "    \"\"\"Calculates the expected score for player A.\"\"\"\n",
    "    return 1 / (1 + 10 ** ((rating_b - rating_a) / ELO_DIFFERENCE_DIVISOR))\n",
    "\n",
    "def update_elo(rating1, rating2, score1, score2):\n",
    "    \"\"\"\n",
    "    Updates the ELO ratings for two models based on their raw scores.\n",
    "    \"\"\"\n",
    "    if score1 > score2: outcome = 1.0\n",
    "    elif score1 < score2: outcome = 0.0\n",
    "    else: outcome = 0.5\n",
    "    \n",
    "    expected1 = expected_score(rating1, rating2)\n",
    "    new_rating_1 = rating1 + K_FACTOR * (outcome - expected1)\n",
    "    new_rating_2 = rating2 + K_FACTOR * ((1 - outcome) - (1 - expected1))\n",
    "    return new_rating_1, new_rating_2\n",
    "\n",
    "def create_battles_from_df(df):\n",
    "    \"\"\"Converts the clean DataFrame into a list of battle dictionaries.\"\"\"\n",
    "    return df.to_dict('records')\n",
    "\n",
    "# ==============================================================================\n",
    "# PART 3: MAIN EXECUTION SCRIPT\n",
    "# ==============================================================================\n",
    "\n",
    "\n",
    "if elo_battles_df.empty:\n",
    "    print(\"No data loaded. Exiting.\")\n",
    "else:\n",
    "    # --- Step 2: Prepare for ELO Calculation ---\n",
    "    battles = create_battles_from_df(elo_battles_df)\n",
    "    model_names = list(pd.unique(elo_battles_df[['model1', 'model2']].values.ravel('K')))\n",
    "    \n",
    "    print(f\"\\nFound {len(model_names)} models: {model_names}\")\n",
    "    print(f\"Total battles to process: {len(battles)}\")\n",
    "\n",
    "    # --- Step 3: CHOOSE YOUR REFERENCE MODEL ---\n",
    "    # This is the most important parameter to set.\n",
    "    # Choose one of your baseline models to anchor the ratings at 1000.\n",
    "    # !!! IMPORTANT: Replace \"your_baseline_model_name\" with an actual model name !!!\n",
    "    \n",
    "    if reference_model not in model_names:\n",
    "        raise ValueError(f\"Reference model '{reference_model}' is not in the list of found models. Please choose one of: {model_names}\")\n",
    "\n",
    "    print(f\"Using '{reference_model}' as the normalization anchor (score = {CENTER_ELO}).\\n\")\n",
    "    print(f\"Starting ELO calculation with {ELO_TRIAL} trials...\")\n",
    "\n",
    "    # --- Step 4: Run the ELO Calculation ---\n",
    "    elo_ratings_over_trials = {model_name: [] for model_name in model_names}\n",
    "\n",
    "    for trial in range(ELO_TRIAL):\n",
    "        current_ratings = {model_name: INITIAL_ELO for model_name in model_names}\n",
    "        \n",
    "        for _ in range(ELO_EPOCH):\n",
    "            random.shuffle(battles)\n",
    "            for battle in battles:\n",
    "                current_ratings[battle['model1']], current_ratings[battle['model2']] = update_elo(\n",
    "                    current_ratings[battle['model1']], current_ratings[battle['model2']],\n",
    "                    battle['score1'], battle['score2']\n",
    "                )\n",
    "        \n",
    "        # Normalize ratings by anchoring the reference model (the paper's method)\n",
    "        norm_factor = CENTER_ELO / current_ratings[reference_model]\n",
    "        for model in model_names:\n",
    "            current_ratings[model] *= norm_factor\n",
    "        \n",
    "        for model in model_names:\n",
    "            elo_ratings_over_trials[model].append(current_ratings[model])\n",
    "\n",
    "    # --- Step 5: Calculate Final Results and Print Leaderboard ---\n",
    "    final_elo_ratings = {\n",
    "        model: (np.mean(ratings), np.std(ratings)) \n",
    "        for model, ratings in elo_ratings_over_trials.items()\n",
    "    }\n",
    "    sorted_models = sorted(final_elo_ratings.items(), key=lambda item: item[1][0], reverse=True)\n",
    "\n",
    "    print(\"\\n\" + \"=\"*30)\n",
    "    print(\"== FINAL ELO RATING LEADERBOARD ==\")\n",
    "    print(\"=\"*30)\n",
    "    for model, (mean_rating, std_rating) in sorted_models:\n",
    "        print(f'{model:40s}: {mean_rating:.2f} ± {std_rating:.2f}')\n",
    "# to_latex? "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b890d598",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "safe-rlhf",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.18"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
