{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 39,
   "id": "5ee41a6b",
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "import time\n",
    "import os\n",
    "\n",
    "from dotenv import load_dotenv\n",
    "from openai import OpenAI\n",
    "from pathlib import Path\n",
    "\n",
    "import anthropic\n",
    "from anthropic.types.message_create_params import MessageCreateParamsNonStreaming\n",
    "from anthropic.types.messages.batch_create_params import Request"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "id": "9090ce24",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 40,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Load .env file from the parent directory\n",
    "env_path = \".env\"\n",
    "load_dotenv(dotenv_path=env_path)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "601013c0",
   "metadata": {},
   "source": [
    "# OPEN AI"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 41,
   "id": "b316c6ec",
   "metadata": {},
   "outputs": [],
   "source": [
    "open_ai_client = OpenAI(\n",
    "    base_url=\"https://api.openai.com/v1/\",\n",
    "    api_key=os.environ.get(\"OPENAI_API_KEY\"),\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 130,
   "id": "ee9f6591",
   "metadata": {},
   "outputs": [],
   "source": [
    "openai_models_list = [\n",
    "    # OpenAI\n",
    "    (4096, \"gpt-5-2025-08-07\"),\n",
    "    # (8192, \"gpt-5-mini-2025-08-07\"),\n",
    "    # (12288, \"gpt-4.1-2025-04-14\"),\n",
    "    # (8192, \"gpt-4.1-mini-2025-04-14\"),\n",
    "    # # reasoning\n",
    "    # (12288, \"openai/gpt-oss-120b\"),\n",
    "    # # (12288, \"deepseek-ai/DeepSeek-R1-0528\"),\n",
    "    # # (8192, \"Qwen/Qwen3-30B-A3B-Thinking-2507\"),\n",
    "    # (8192, \"openai/gpt-oss-20b\"),\n",
    "    # # non\n",
    "    # # (12288, \"moonshotai/Kimi-K2-Instruct\"),\n",
    "    # # (12288, \"Qwen/Qwen3-Coder-480B-A35B-Instruct\"),\n",
    "    # (12288, \"Qwen/Qwen3-235B-A22B-Instruct-2507\"),\n",
    "    # (8192, \"Qwen/Qwen3-30B-A3B-Instruct-2507\"),\n",
    "    # (8192, \"mistralai/Devstral-Small-2505\"),\n",
    "]\n",
    "\n",
    "# datasets = [\"angle\", \"elephant_box\", \"is_object_fit\", \"non_occupied_area\", \"object_movement\", \"specific_area\", \"direct_way\", \"missing_object\", \"shortest_path\", \"pair_distance\"]\n",
    "# datasets = [\"angle\", \"direct_way\", \"object_movement\"]\n",
    "# room_types = [\"bedroom\", \"kitchen\", \"living_room\"]\n",
    "\n",
    "# datasets = [\"is_object_fit\"]\n",
    "# room_types = [\"living_room\", \"kitchen\"]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 131,
   "id": "90c0af6d",
   "metadata": {},
   "outputs": [],
   "source": [
    "# room_types = [\"hssd_data\"]\n",
    "room_types = [\"living_rooms\", \"bedrooms\", \"kitchens\", \"hssd_data_simplified\"]\n",
    "# room_types = [\"kitchens\", \"hssd_data_simplified\"]\n",
    "# room_types = [\"kitchens\", \"hssd_data_simplified\"]\n",
    "# datasets = [\"max_box\", \"free_space\", \"pair_distance\"]\n",
    "datasets = [\n",
    "    \"shortest_path\",\n",
    "    \"obstruction\",\n",
    "    \"view_angle\",\n",
    "    \"max_box\",\n",
    "    # \"free_space\",\n",
    "    # \"pair_distance\", +\n",
    "    # \"placement\",\n",
    "    # \"repositioning\",\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 132,
   "id": "19f86b96",
   "metadata": {},
   "outputs": [],
   "source": [
    "# 5 * 16"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 133,
   "id": "af3d7a2c",
   "metadata": {},
   "outputs": [],
   "source": [
    "openai_batch_requests = []"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f0cba1f8",
   "metadata": {},
   "outputs": [],
   "source": "for max_tokens, model_id in openai_models_list:\n    for dataset in datasets:\n        for room_type in room_types:\n            print(f\"Processing {dataset} {room_type} {model_id}\")\n            model_name = model_id.split(\"/\")[-1]\n            file_jsonl = f\"qa_jsonl/{dataset}/{room_type}/{model_name}_{max_tokens}.jsonl\"\n\n\n            with open(file_jsonl, 'r') as f:\n                data = json.loads(f.readline())\n\n            assert 'openings' in data['body']['messages'][-1]['content']\n\n            batch_request = open_ai_client.files.create(\n                file=open(file_jsonl, \"rb\"),\n                purpose=\"batch\"\n            )\n\n            openai_batch_requests.append(batch_request)"
  },
  {
   "cell_type": "code",
   "execution_count": 135,
   "id": "aa586a3f",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "16"
      ]
     },
     "execution_count": 135,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "len(openai_batch_requests)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 136,
   "id": "045ba356",
   "metadata": {},
   "outputs": [],
   "source": [
    "openai_batches = []\n",
    "for batch_request in openai_batch_requests:\n",
    "    batch = open_ai_client.batches.create(\n",
    "        input_file_id=batch_request.id,\n",
    "        endpoint=\"/v1/chat/completions\",\n",
    "        completion_window=\"24h\",\n",
    "        metadata={\n",
    "            \"description\": \"Asynchronous job\"\n",
    "        }\n",
    "    )\n",
    "    openai_batches.append(batch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 141,
   "id": "0330e7e5",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Batch(id='batch_68d2d53ed6d08190adb8c94ccd89f406', completion_window='24h', created_at=1758647614, endpoint='/v1/chat/completions', input_file_id='file-9Hc1xawp224NAyAKrzbQXq', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758650767, error_file_id='file-7LaxuKRfKBdvpXxhvoPanq', errors=None, expired_at=None, expires_at=1758734014, failed_at=None, finalizing_at=1758650602, in_progress_at=1758647618, metadata={'description': 'Asynchronous job'}, output_file_id='file-FdvsrPWE81GN3EDArNo9Kq', request_counts=BatchRequestCounts(completed=230, failed=370, total=600), model='gpt-5-2025-08-07', usage={'input_tokens': 407380, 'output_tokens': 328225, 'total_tokens': 735605, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2d53f80388190a85708ff6d43e338', completion_window='24h', created_at=1758647615, endpoint='/v1/chat/completions', input_file_id='file-BXXmCUyqYWdmr9YV6GcUn9', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758648354, error_file_id='file-EzGmVyeU6hJT7fp3UwfWof', errors=None, expired_at=None, expires_at=1758734015, failed_at=None, finalizing_at=1758648169, in_progress_at=1758647618, metadata={'description': 'Asynchronous job'}, output_file_id='file-FDZQc91cry9vCUmaefhXSH', request_counts=BatchRequestCounts(completed=458, failed=142, total=600), model='gpt-5-2025-08-07', usage={'input_tokens': 765293, 'output_tokens': 660377, 'total_tokens': 1425670, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 8192}})\n",
      "Batch(id='batch_68d2d541c5d88190b10940ef05a0ddb2', completion_window='24h', created_at=1758647617, endpoint='/v1/chat/completions', input_file_id='file-5DAaP6X4ffLyzDGNkrRf4w', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758650360, error_file_id='file-QqzQRn1uKP6d5gcMbNqxJu', errors=None, expired_at=None, expires_at=1758734017, failed_at=None, finalizing_at=1758650305, in_progress_at=1758647619, metadata={'description': 'Asynchronous job'}, output_file_id='file-T88e3Z1b6HSeA91egJMYFF', request_counts=BatchRequestCounts(completed=490, failed=110, total=600), model='gpt-5-2025-08-07', usage={'input_tokens': 788284, 'output_tokens': 537212, 'total_tokens': 1325496, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2d542a7d48190963f192bf44f0b8d', completion_window='24h', created_at=1758647618, endpoint='/v1/chat/completions', input_file_id='file-FnU5SiQXXcWhy7TWbL718F', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758648252, error_file_id='file-3KkZnnU79DzUYEZ55FeZe3', errors=None, expired_at=None, expires_at=1758734018, failed_at=None, finalizing_at=1758648201, in_progress_at=1758647621, metadata={'description': 'Asynchronous job'}, output_file_id='file-QFJ9MGk7xo239sv37oYkyS', request_counts=BatchRequestCounts(completed=191, failed=9, total=200), model='gpt-5-2025-08-07', usage={'input_tokens': 717556, 'output_tokens': 203191, 'total_tokens': 920747, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2d54329888190bab6ee3c6e5c86f4', completion_window='24h', created_at=1758647619, endpoint='/v1/chat/completions', input_file_id='file-Br3Z1G7TapArvLawr7VK6Z', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758648163, error_file_id='file-C6ThS1HhDyyFNcE7pd4vPn', errors=None, expired_at=None, expires_at=1758734019, failed_at=None, finalizing_at=1758648106, in_progress_at=1758647621, metadata={'description': 'Asynchronous job'}, output_file_id='file-SSnnXXY2k6PQT3pBoVcz1A', request_counts=BatchRequestCounts(completed=596, failed=4, total=600), model='gpt-5-2025-08-07', usage={'input_tokens': 1032214, 'output_tokens': 663871, 'total_tokens': 1696085, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2d543ba008190a1558acf698f9b9b', completion_window='24h', created_at=1758647619, endpoint='/v1/chat/completions', input_file_id='file-6xxHJgosxJMwSwjXea9Bru', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758648766, error_file_id='file-3EDeho63fjUHBRQoGxusWr', errors=None, expired_at=None, expires_at=1758734019, failed_at=None, finalizing_at=1758648703, in_progress_at=1758647622, metadata={'description': 'Asynchronous job'}, output_file_id='file-7TjZ7313f1rQHiEKicTvQg', request_counts=BatchRequestCounts(completed=598, failed=2, total=600), model='gpt-5-2025-08-07', usage={'input_tokens': 986087, 'output_tokens': 652154, 'total_tokens': 1638241, 'input_tokens_details': {'cached_tokens': 1664}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2d544af708190861b4e1219fbd38f', completion_window='24h', created_at=1758647620, endpoint='/v1/chat/completions', input_file_id='file-Anj8Vsd2xEU7eSr4KX459J', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758648164, error_file_id=None, errors=None, expired_at=None, expires_at=1758734020, failed_at=None, finalizing_at=1758648138, in_progress_at=1758647622, metadata={'description': 'Asynchronous job'}, output_file_id='file-CZ7xBCe3eyEyYDUsWGof5U', request_counts=BatchRequestCounts(completed=600, failed=0, total=600), model='gpt-5-2025-08-07', usage={'input_tokens': 947783, 'output_tokens': 557050, 'total_tokens': 1504833, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2d54553b881909046544d58379f73', completion_window='24h', created_at=1758647621, endpoint='/v1/chat/completions', input_file_id='file-EWefzoZQ3nG3FwC1e1PsQD', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758648692, error_file_id='file-Hijxc1ZzHZ2KyvvJHWVTrs', errors=None, expired_at=None, expires_at=1758734021, failed_at=None, finalizing_at=1758648674, in_progress_at=1758647622, metadata={'description': 'Asynchronous job'}, output_file_id='file-MGQRvUq3fPMqP3jtAfMURK', request_counts=BatchRequestCounts(completed=186, failed=14, total=200), model='gpt-5-2025-08-07', usage={'input_tokens': 656128, 'output_tokens': 212599, 'total_tokens': 868727, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2d545de90819086c62282cdd6cc3f', completion_window='24h', created_at=1758647621, endpoint='/v1/chat/completions', input_file_id='file-51GfsGbfxMbiiDE8PVs8h9', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758650666, error_file_id='file-2wc4rRPt7azYCaq3cgJt8h', errors=None, expired_at=None, expires_at=1758734021, failed_at=None, finalizing_at=1758650510, in_progress_at=1758647622, metadata={'description': 'Asynchronous job'}, output_file_id='file-HorfXj7kqjUyVTp3JVffJ7', request_counts=BatchRequestCounts(completed=547, failed=53, total=600), model='gpt-5-2025-08-07', usage={'input_tokens': 952532, 'output_tokens': 262238, 'total_tokens': 1214770, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2d54674308190a62d3db70a19e3b0', completion_window='24h', created_at=1758647622, endpoint='/v1/chat/completions', input_file_id='file-8ndKzo6XcYrPqVMQ7WUQA2', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758648913, error_file_id='file-AYWZnFXikEt4zaZRwNMVSD', errors=None, expired_at=None, expires_at=1758734022, failed_at=None, finalizing_at=1758648854, in_progress_at=1758647626, metadata={'description': 'Asynchronous job'}, output_file_id='file-TzgecneynWp8VgkQ5F4yn3', request_counts=BatchRequestCounts(completed=597, failed=3, total=600), model='gpt-5-2025-08-07', usage={'input_tokens': 989134, 'output_tokens': 293362, 'total_tokens': 1282496, 'input_tokens_details': {'cached_tokens': 1664}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2d546fddc8190b2e3b70ab7f83afa', completion_window='24h', created_at=1758647622, endpoint='/v1/chat/completions', input_file_id='file-RqtgVYDUuqp33qhjsz6WkJ', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758648612, error_file_id=None, errors=None, expired_at=None, expires_at=1758734022, failed_at=None, finalizing_at=1758648552, in_progress_at=1758647625, metadata={'description': 'Asynchronous job'}, output_file_id='file-8Yhrku2Sede5823NZJtULa', request_counts=BatchRequestCounts(completed=600, failed=0, total=600), model='gpt-5-2025-08-07', usage={'input_tokens': 951983, 'output_tokens': 280571, 'total_tokens': 1232554, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2d5478960819086930de76e96f0bc', completion_window='24h', created_at=1758647623, endpoint='/v1/chat/completions', input_file_id='file-PaQniqsBRzWyabuqajThzb', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758649360, error_file_id='file-Wq5kqYEy2LXMHH5xcbskT4', errors=None, expired_at=None, expires_at=1758734023, failed_at=None, finalizing_at=1758649327, in_progress_at=1758647625, metadata={'description': 'Asynchronous job'}, output_file_id='file-BXZ5PEMSTptW4tpWd2MgtN', request_counts=BatchRequestCounts(completed=184, failed=16, total=200), model='gpt-5-2025-08-07', usage={'input_tokens': 670595, 'output_tokens': 204464, 'total_tokens': 875059, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2d5481b4c8190933fec9d80597767', completion_window='24h', created_at=1758647624, endpoint='/v1/chat/completions', input_file_id='file-FACfFi96gyqzsvz7QMREjz', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758650571, error_file_id='file-5VBzfGDAJxcNatbPGNeTZB', errors=None, expired_at=None, expires_at=1758734024, failed_at=None, finalizing_at=1758650510, in_progress_at=1758647685, metadata={'description': 'Asynchronous job'}, output_file_id='file-D8y6xPjf3NkePXXgohFp8q', request_counts=BatchRequestCounts(completed=542, failed=58, total=600), model='gpt-5-2025-08-07', usage={'input_tokens': 970913, 'output_tokens': 721300, 'total_tokens': 1692213, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2d549469481909228adde2fcd8c0e', completion_window='24h', created_at=1758647625, endpoint='/v1/chat/completions', input_file_id='file-AamhW2g1TD4GdW9RDztEUF', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758649582, error_file_id='file-BUuT9TdUnwihTwn4e9wHYB', errors=None, expired_at=None, expires_at=1758734025, failed_at=None, finalizing_at=1758649545, in_progress_at=1758647627, metadata={'description': 'Asynchronous job'}, output_file_id='file-WMEpMRaH3oKxCwjKPW1hJY', request_counts=BatchRequestCounts(completed=522, failed=78, total=600), model='gpt-5-2025-08-07', usage={'input_tokens': 890963, 'output_tokens': 653025, 'total_tokens': 1543988, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2d549f20c8190aa7bcac5672e27b5', completion_window='24h', created_at=1758647625, endpoint='/v1/chat/completions', input_file_id='file-McdZLVnc3PePit7fchEnEM', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758648319, error_file_id='file-Krf7C2Ec1qpth63UNFJydP', errors=None, expired_at=None, expires_at=1758734025, failed_at=None, finalizing_at=1758648136, in_progress_at=1758647627, metadata={'description': 'Asynchronous job'}, output_file_id='file-42bQEYzWebmZwaPcJE37fP', request_counts=BatchRequestCounts(completed=524, failed=76, total=600), model='gpt-5-2025-08-07', usage={'input_tokens': 856383, 'output_tokens': 477570, 'total_tokens': 1333953, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2d54a81e08190a5a51150195f4daa', completion_window='24h', created_at=1758647626, endpoint='/v1/chat/completions', input_file_id='file-HyVcmnNbH2Q27RxSHcPj3G', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758650531, error_file_id='file-FvDE52acn49YfpHLm7ftp8', errors=None, expired_at=None, expires_at=1758734026, failed_at=None, finalizing_at=1758650510, in_progress_at=1758647627, metadata={'description': 'Asynchronous job'}, output_file_id='file-K1KgULSZo1YYLEus7NV7fC', request_counts=BatchRequestCounts(completed=193, failed=7, total=200), model='gpt-5-2025-08-07', usage={'input_tokens': 706250, 'output_tokens': 202480, 'total_tokens': 908730, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n"
     ]
    }
   ],
   "source": [
    "for batch in openai_batches:\n",
    "    batch_id_info = open_ai_client.batches.retrieve(batch.id)\n",
    "    print(batch_id_info)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 92,
   "id": "f16fe2ce",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Batch(id='batch_68d18ac7d0b481909245621553dc6f1e', completion_window='24h', created_at=1758563015, endpoint='/v1/chat/completions', input_file_id='file-YZRP7TxbfJS1m2YhkvHj3i', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758572422, error_file_id=None, errors=None, expired_at=None, expires_at=1758649415, failed_at=None, finalizing_at=1758572364, in_progress_at=1758563018, metadata={'description': 'Asynchronous job'}, output_file_id='file-Fur1zxj52hJE1E6ByYMGJd', request_counts=BatchRequestCounts(completed=200, failed=0, total=200), model='gpt-5-2025-08-07', usage={'input_tokens': 729538, 'output_tokens': 151919, 'total_tokens': 881457, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n"
     ]
    }
   ],
   "source": [
    "batch_id_info = open_ai_client.batches.retrieve('batch_68d18ac7d0b481909245621553dc6f1e')\n",
    "print(batch_id_info)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "2cc55782",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Batch(id='batch_68cfd65feea881909d0ec55587a1b12c', completion_window='24h', created_at=1758451295, endpoint='/v1/chat/completions', input_file_id='file-7Lo5fx6ELSYDzLusii8kEv', object='batch', status='cancelling', cancelled_at=None, cancelling_at=1758452118, completed_at=None, error_file_id=None, errors=None, expired_at=None, expires_at=1758537695, failed_at=None, finalizing_at=None, in_progress_at=1758451298, metadata={'description': 'Asynchronous job'}, output_file_id=None, request_counts=BatchRequestCounts(completed=0, failed=599, total=600), model='gpt-5-mini-2025-08-07', usage={'input_tokens': 0, 'output_tokens': 0, 'total_tokens': 0, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})"
      ]
     },
     "execution_count": 16,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# open_ai_client.batches.cancel('batch_68cfd65ad5088190b52e8043f63fdaf1')\n",
    "# open_ai_client.batches.cancel('batch_68cfd65c9a7c8190abb032430b676cee')\n",
    "# open_ai_client.batches.cancel('batch_68cfd65d2a90819094478592645618b1')\n",
    "# open_ai_client.batches.cancel('batch_68cfd65e55688190a980415499ac4789')\n",
    "# open_ai_client.batches.cancel('batch_68cfd65feea881909d0ec55587a1b12c')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "df54efa7",
   "metadata": {},
   "outputs": [],
   "source": [
    "# done_set = {\n",
    "#     'batch_68cff25982008190b7e59c338df41030',\n",
    "#     'batch_68cff25b4a308190b08769dd064e07f5',\n",
    "#     'batch_68cff25c48b08190b7789e50d0e2fc9e'\n",
    "# }"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 142,
   "id": "f1cb4c3f",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Processing shortest_path living_rooms gpt-5-2025-08-07\n",
      "Processing shortest_path bedrooms gpt-5-2025-08-07\n",
      "Processing shortest_path kitchens gpt-5-2025-08-07\n",
      "Processing shortest_path hssd_data_simplified gpt-5-2025-08-07\n",
      "Processing obstruction living_rooms gpt-5-2025-08-07\n",
      "Processing obstruction bedrooms gpt-5-2025-08-07\n",
      "Processing obstruction kitchens gpt-5-2025-08-07\n",
      "Processing obstruction hssd_data_simplified gpt-5-2025-08-07\n",
      "Processing view_angle living_rooms gpt-5-2025-08-07\n",
      "Processing view_angle bedrooms gpt-5-2025-08-07\n",
      "Processing view_angle kitchens gpt-5-2025-08-07\n",
      "Processing view_angle hssd_data_simplified gpt-5-2025-08-07\n",
      "Processing max_box living_rooms gpt-5-2025-08-07\n",
      "Processing max_box bedrooms gpt-5-2025-08-07\n",
      "Processing max_box kitchens gpt-5-2025-08-07\n",
      "Processing max_box hssd_data_simplified gpt-5-2025-08-07\n"
     ]
    }
   ],
   "source": [
    "index = 0\n",
    "for max_tokens, model_id in openai_models_list:\n",
    "    for dataset in datasets:\n",
    "        for room_type in room_types:\n",
    "            batch = openai_batches[index]\n",
    "            index += 1\n",
    "            # if batch.id in done_set:\n",
    "                \n",
    "            print(f\"Processing {dataset} {room_type} {model_id}\")\n",
    "            # else:\n",
    "            #     print(f\"Skipping {dataset} {room_type} {model_id}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "379b5a04",
   "metadata": {},
   "outputs": [],
   "source": "index = 0\nfor max_tokens, model_id in openai_models_list:\n    for dataset in datasets:\n        for room_type in room_types:\n            batch = openai_batches[index]\n            index += 1\n            # if batch.id in done_set:\n\n            batch_id_info = open_ai_client.batches.retrieve(batch.id)\n            batch_result = open_ai_client.files.content(batch_id_info.output_file_id)\n\n            model_name = model_id.split(\"/\")[-1]\n\n            output_jsonl = f\"qa_response/{dataset}/{room_type}/{model_name}_{max_tokens}.jsonl\"\n            print('Saving to', output_jsonl)\n            output_jsonl = Path(output_jsonl)\n            output_jsonl.parent.mkdir(parents=True, exist_ok=True)\n\n            with open(output_jsonl, \"w\") as f:\n                for line in batch_result.text.strip().splitlines():\n                    line = json.loads(line)\n                    json.dump(line, f)\n                    f.write(\"\\n\")\n            # raise\n            # index += 1"
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4ea2d24e",
   "metadata": {},
   "outputs": [],
   "source": [
    "from pathlib import Path\n",
    "import json, io\n",
    "\n",
    "def _parse_jsonl(text):\n",
    "    if not text:\n",
    "        return []\n",
    "    return [json.loads(line) for line in io.StringIO(text) if line.strip()]\n",
    "\n",
    "# ---- Rebuild the same iteration order your loop used, to align with openai_batches ----\n",
    "param_grid = []  # [(max_tokens, model_id, dataset, room_type)]\n",
    "for max_tokens, model_id in openai_models_list:\n",
    "    for dataset in datasets:\n",
    "        for room_type in room_types:\n",
    "            param_grid.append((max_tokens, model_id, dataset, room_type))\n",
    "\n",
    "assert len(param_grid) == len(openai_batches), \"param_grid and openai_batches must align 1:1\"\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 150,
   "id": "c9057fc6",
   "metadata": {},
   "outputs": [],
   "source": [
    "openai_retied_batches = []  # same length, index-aligned with openai_batches"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 148,
   "id": "25f596ca",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Retrying 370 rows from batch batch_68d2d53ed6d08190adb8c94ccd89f406...\n",
      "Retrying 142 rows from batch batch_68d2d53f80388190a85708ff6d43e338...\n",
      "Retrying 110 rows from batch batch_68d2d541c5d88190b10940ef05a0ddb2...\n",
      "Retrying 9 rows from batch batch_68d2d542a7d48190963f192bf44f0b8d...\n",
      "Retrying 4 rows from batch batch_68d2d54329888190bab6ee3c6e5c86f4...\n",
      "Retrying 2 rows from batch batch_68d2d543ba008190a1558acf698f9b9b...\n",
      "Retrying 14 rows from batch batch_68d2d54553b881909046544d58379f73...\n",
      "Retrying 53 rows from batch batch_68d2d545de90819086c62282cdd6cc3f...\n",
      "Retrying 3 rows from batch batch_68d2d54674308190a62d3db70a19e3b0...\n",
      "Retrying 16 rows from batch batch_68d2d5478960819086930de76e96f0bc...\n",
      "Retrying 58 rows from batch batch_68d2d5481b4c8190933fec9d80597767...\n",
      "Retrying 78 rows from batch batch_68d2d549469481909228adde2fcd8c0e...\n",
      "Retrying 76 rows from batch batch_68d2d549f20c8190aa7bcac5672e27b5...\n",
      "Retrying 7 rows from batch batch_68d2d54a81e08190a5a51150195f4daa...\n"
     ]
    }
   ],
   "source": [
    "for i, batch in enumerate(openai_batches):\n",
    "    # retrieve batch + its files\n",
    "    b = open_ai_client.batches.retrieve(batch.id)\n",
    "\n",
    "    # pull original input (to reconstruct failed rows exactly)\n",
    "    in_text = open_ai_client.files.content(b.input_file_id).text\n",
    "    input_rows = _parse_jsonl(in_text)\n",
    "    by_custom = {r.get(\"custom_id\"): r for r in input_rows if r.get(\"custom_id\") is not None}\n",
    "    by_id     = {r.get(\"id\"):        r for r in input_rows if r.get(\"id\") is not None}\n",
    "\n",
    "    # read errors for this batch\n",
    "    failed_rows = []\n",
    "    if getattr(b, \"error_file_id\", None):\n",
    "        err_text = open_ai_client.files.content(b.error_file_id).text\n",
    "        for line in _parse_jsonl(err_text):\n",
    "            # keep ALL failures; if you want only transient, filter on line.get(\"status_code\") here\n",
    "            cid = line.get(\"custom_id\")\n",
    "            rid = line.get(\"id\")\n",
    "            src = by_custom.get(cid) if cid in by_custom else by_id.get(rid)\n",
    "            if src:\n",
    "                failed_rows.append(src)\n",
    "\n",
    "    if not failed_rows:\n",
    "        # no retry needed for this slot\n",
    "        openai_retied_batches.append(None)\n",
    "        continue\n",
    "\n",
    "    print(f\"Retrying {len(failed_rows)} rows from batch {batch.id}...\")\n",
    "    # write a retry-only JSONL (one per original batch) and submit a new batch\n",
    "    retry_payload_path = Path(f\"./retry_failed_{i}.jsonl\")\n",
    "    retry_payload_path.parent.mkdir(parents=True, exist_ok=True)\n",
    "    with retry_payload_path.open(\"w\", encoding=\"utf-8\") as f:\n",
    "        for row in failed_rows:\n",
    "            f.write(json.dumps(row, ensure_ascii=False) + \"\\n\")\n",
    "\n",
    "    file_obj = open_ai_client.files.create(file=retry_payload_path.open(\"rb\"), purpose=\"batch\")\n",
    "\n",
    "    retry_batch = open_ai_client.batches.create(\n",
    "        input_file_id=file_obj.id,\n",
    "        endpoint=\"/v1/chat/completions\",\n",
    "        completion_window=\"24h\",\n",
    "        metadata={\n",
    "            \"description\": \"Asynchronous job\",\n",
    "            \"retry_of\": batch.id\n",
    "        }\n",
    "    )\n",
    "\n",
    "    openai_retied_batches.append(retry_batch)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 152,
   "id": "ac27e5dc",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[]"
      ]
     },
     "execution_count": 152,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "openai_retied_batches"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "35902787",
   "metadata": {},
   "outputs": [],
   "source": [
    "openai_retied_batches[2:]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4b35022e",
   "metadata": {},
   "outputs": [],
   "source": [
    "for batch in openai_retied_batches[2:]:\n",
    "    if batch is not None:\n",
    "        batch_id_info = open_ai_client.batches.retrieve(batch.id)\n",
    "        print(batch_id_info)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e113a487",
   "metadata": {},
   "outputs": [],
   "source": "index = 0\nfor max_tokens, model_id in openai_models_list:\n    for dataset in datasets:\n        for room_type in room_types:\n            retry_batch = openai_retied_batches[index]\n            index += 1\n            if retry_batch is None:\n                # nothing to save for this slot\n                continue\n\n            # fresh retrieve (in case status advanced)\n            retry_info = open_ai_client.batches.retrieve(retry_batch.id)\n\n            # if still running, you'll get no output_file_id yet; your original code didn't wait either\n            if not getattr(retry_info, \"output_file_id\", None):\n                print(f\"[warn] retry batch {retry_info.id} not ready (status={retry_info.status}); skipping save for now\")\n                continue\n\n            retry_result = open_ai_client.files.content(retry_info.output_file_id)\n            model_name = model_id.split(\"/\")[-1]\n\n            out_path = f\"qa_response/{dataset}/{room_type}/{model_name}_{max_tokens}_retried.jsonl\"\n            print('Saving retried to', out_path)\n            out_path = Path(out_path)\n            out_path.parent.mkdir(parents=True, exist_ok=True)\n\n            with out_path.open(\"w\", encoding=\"utf-8\") as f:\n                for line in retry_result.text.strip().splitlines():\n                    obj = json.loads(line)\n                    json.dump(obj, f, ensure_ascii=False)\n                    f.write(\"\\n\")"
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "plan_b",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.17"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}