{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "bd1ac517",
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "import time\n",
    "import os\n",
    "\n",
    "from dotenv import load_dotenv\n",
    "from openai import OpenAI\n",
    "from pathlib import Path\n",
    "\n",
    "import anthropic\n",
    "from anthropic.types.message_create_params import MessageCreateParamsNonStreaming\n",
    "from anthropic.types.messages.batch_create_params import Request"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "fdb6913e",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Load .env file from the parent directory\n",
    "env_path = \".env\"\n",
    "load_dotenv(dotenv_path=env_path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "6f79c509",
   "metadata": {},
   "outputs": [],
   "source": [
    "open_ai_client = OpenAI(\n",
    "    base_url=\"https://api.openai.com/v1/\",\n",
    "    api_key=os.environ.get(\"OPENAI_API_KEY\"),\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "8ccab41e",
   "metadata": {},
   "outputs": [],
   "source": [
    "openai_models_list = [\n",
    "    # OpenAI\n",
    "    (12288, \"gpt-4.1-2025-04-14\"),\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "f8075e19",
   "metadata": {},
   "outputs": [],
   "source": [
    "# room_types = [\"hssd_data\"]\n",
    "room_types = [\"living_rooms\", \"bedrooms\", \"kitchens\", \"hssd_data_simplified\"]\n",
    "# room_types = [\"kitchens\", \"hssd_data_simplified\"]\n",
    "# room_types = [\"kitchens\", \"hssd_data_simplified\"]\n",
    "# datasets = [\"max_box\", \"free_space\", \"pair_distance\"]\n",
    "datasets = [\n",
    "    \"shortest_path\",\n",
    "    \"obstruction\",\n",
    "    \"view_angle\",\n",
    "    \"max_box\",\n",
    "    # \"free_space\",\n",
    "    # \"pair_distance\", +\n",
    "    # \"placement\",\n",
    "    # \"repositioning\",\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "316da469",
   "metadata": {},
   "outputs": [],
   "source": [
    "openai_batch_requests = []"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "190358c6",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Processing shortest_path living_rooms gpt-4.1-2025-04-14\n",
      "Processing shortest_path bedrooms gpt-4.1-2025-04-14\n",
      "Processing shortest_path kitchens gpt-4.1-2025-04-14\n",
      "Processing shortest_path hssd_data_simplified gpt-4.1-2025-04-14\n",
      "Processing obstruction living_rooms gpt-4.1-2025-04-14\n",
      "Processing obstruction bedrooms gpt-4.1-2025-04-14\n",
      "Processing obstruction kitchens gpt-4.1-2025-04-14\n",
      "Processing obstruction hssd_data_simplified gpt-4.1-2025-04-14\n",
      "Processing view_angle living_rooms gpt-4.1-2025-04-14\n",
      "Processing view_angle bedrooms gpt-4.1-2025-04-14\n",
      "Processing view_angle kitchens gpt-4.1-2025-04-14\n",
      "Processing view_angle hssd_data_simplified gpt-4.1-2025-04-14\n",
      "Processing max_box living_rooms gpt-4.1-2025-04-14\n",
      "Processing max_box bedrooms gpt-4.1-2025-04-14\n",
      "Processing max_box kitchens gpt-4.1-2025-04-14\n",
      "Processing max_box hssd_data_simplified gpt-4.1-2025-04-14\n"
     ]
    }
   ],
   "source": [
    "for max_tokens, model_id in openai_models_list:\n",
    "    for dataset in datasets:\n",
    "        for room_type in room_types:\n",
    "            print(f\"Processing {dataset} {room_type} {model_id}\")\n",
    "            model_name = model_id.split(\"/\")[-1]\n",
    "            file_jsonl = f\"/home/rodionfa/FloorplanQA/qa_jsonl/{dataset}/{room_type}/{model_name}_{max_tokens}.jsonl\"\n",
    "\n",
    "\n",
    "            with open(file_jsonl, 'r') as f:\n",
    "                data = json.loads(f.readline())\n",
    "\n",
    "            assert 'openings' in data['body']['messages'][-1]['content']\n",
    "\n",
    "            batch_request = open_ai_client.files.create(\n",
    "                file=open(file_jsonl, \"rb\"),\n",
    "                purpose=\"batch\"\n",
    "            )\n",
    "\n",
    "            openai_batch_requests.append(batch_request)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "4b82d474",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "16"
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "len(openai_batch_requests)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "af2c1d19",
   "metadata": {},
   "outputs": [],
   "source": [
    "openai_batches = []\n",
    "for batch_request in openai_batch_requests:\n",
    "    batch = open_ai_client.batches.create(\n",
    "        input_file_id=batch_request.id,\n",
    "        endpoint=\"/v1/chat/completions\",\n",
    "        completion_window=\"24h\",\n",
    "        metadata={\n",
    "            \"description\": \"Asynchronous job\"\n",
    "        }\n",
    "    )\n",
    "    openai_batches.append(batch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "id": "a5099b3b",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Batch(id='batch_68d2ac18717c81909fab2627f96b3c0f', completion_window='24h', created_at=1758637080, endpoint='/v1/chat/completions', input_file_id='file-GS1Lqw6YwyK5LLrTQnspxr', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758645099, error_file_id=None, errors=None, expired_at=None, expires_at=1758723480, failed_at=None, finalizing_at=1758645051, in_progress_at=1758637083, metadata={'description': 'Asynchronous job'}, output_file_id='file-1FyHSDzVipQm5vyzdSXVxH', request_counts=BatchRequestCounts(completed=600, failed=0, total=600), model='gpt-4.1-2025-04-14', usage={'input_tokens': 1055746, 'output_tokens': 667366, 'total_tokens': 1723112, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2ac18f8448190bed1cc2c7faf5127', completion_window='24h', created_at=1758637080, endpoint='/v1/chat/completions', input_file_id='file-ACnUx6qPHJpvumX7TWDuzg', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758645676, error_file_id=None, errors=None, expired_at=None, expires_at=1758723480, failed_at=None, finalizing_at=1758645625, in_progress_at=1758637083, metadata={'description': 'Asynchronous job'}, output_file_id='file-DKzbGFayFT6yA4ywXc2KLZ', request_counts=BatchRequestCounts(completed=600, failed=0, total=600), model='gpt-4.1-2025-04-14', usage={'input_tokens': 1004793, 'output_tokens': 674857, 'total_tokens': 1679650, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2ac19d6b881908fb11780d9c71af8', completion_window='24h', created_at=1758637081, endpoint='/v1/chat/completions', input_file_id='file-AvrA4Z8FL1FDuK5XHeBc4Q', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758647567, error_file_id=None, errors=None, expired_at=None, expires_at=1758723481, failed_at=None, finalizing_at=1758647512, in_progress_at=1758637143, metadata={'description': 'Asynchronous job'}, output_file_id='file-QwmRFsbuf65E8mwGrN5tKu', request_counts=BatchRequestCounts(completed=600, failed=0, total=600), model='gpt-4.1-2025-04-14', usage={'input_tokens': 963362, 'output_tokens': 565986, 'total_tokens': 1529348, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2ac1a9d78819090c0dbb2ed4351fc', completion_window='24h', created_at=1758637082, endpoint='/v1/chat/completions', input_file_id='file-MhAtDQwcWww5y9f4WzWhZU', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758661129, error_file_id=None, errors=None, expired_at=None, expires_at=1758723482, failed_at=None, finalizing_at=1758661092, in_progress_at=1758637083, metadata={'description': 'Asynchronous job'}, output_file_id='file-BGLJAdjV93k73QLWWfMhwm', request_counts=BatchRequestCounts(completed=200, failed=0, total=200), model='gpt-4.1-2025-04-14', usage={'input_tokens': 738396, 'output_tokens': 292848, 'total_tokens': 1031244, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2ac1b30f081909034788f573b97b5', completion_window='24h', created_at=1758637083, endpoint='/v1/chat/completions', input_file_id='file-1jC3BVhnFWNQaXAD6mFp7x', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758662588, error_file_id='file-Fu4g4fu7HhHjZpMyMqdHnc', errors=None, expired_at=None, expires_at=1758723483, failed_at=None, finalizing_at=1758662485, in_progress_at=1758637085, metadata={'description': 'Asynchronous job'}, output_file_id='file-1khyAaz7tFyFWvDw73RMvK', request_counts=BatchRequestCounts(completed=598, failed=2, total=600), model='gpt-4.1-2025-04-14', usage={'input_tokens': 1037161, 'output_tokens': 1151105, 'total_tokens': 2188266, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2ac1becf08190812a8285abe59853', completion_window='24h', created_at=1758637083, endpoint='/v1/chat/completions', input_file_id='file-1k6oLUFpBQJohKgZHjK4xH', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758663082, error_file_id='file-EHJcJgSAYBMmoBGTe2BSzC', errors=None, expired_at=None, expires_at=1758723483, failed_at=None, finalizing_at=1758663035, in_progress_at=1758637145, metadata={'description': 'Asynchronous job'}, output_file_id='file-4kCjMbqpUhDe8AE41yKrZS', request_counts=BatchRequestCounts(completed=599, failed=1, total=600), model='gpt-4.1-2025-04-14', usage={'input_tokens': 987760, 'output_tokens': 1056222, 'total_tokens': 2043982, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2ac1d0ea08190bb009f78d05a3b2b', completion_window='24h', created_at=1758637085, endpoint='/v1/chat/completions', input_file_id='file-6QiyKsn6sNXivNPYx4zLhr', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758656592, error_file_id=None, errors=None, expired_at=None, expires_at=1758723485, failed_at=None, finalizing_at=1758656531, in_progress_at=1758637086, metadata={'description': 'Asynchronous job'}, output_file_id='file-AemF1hu7Qm8bjGTh8tNhvk', request_counts=BatchRequestCounts(completed=600, failed=0, total=600), model='gpt-4.1-2025-04-14', usage={'input_tokens': 948383, 'output_tokens': 1009240, 'total_tokens': 1957623, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2ac1da2348190a53f71f6e61fbcfa', completion_window='24h', created_at=1758637085, endpoint='/v1/chat/completions', input_file_id='file-Sk9dzTwtHfdV5KSuYLMh8V', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758664202, error_file_id='file-JmrpLJByPPnShrT4rZLvWQ', errors=None, expired_at=None, expires_at=1758723485, failed_at=None, finalizing_at=1758664140, in_progress_at=1758637148, metadata={'description': 'Asynchronous job'}, output_file_id='file-8rSafbmdV6THETbxYj7TcZ', request_counts=BatchRequestCounts(completed=197, failed=3, total=200), model='gpt-4.1-2025-04-14', usage={'input_tokens': 724290, 'output_tokens': 437884, 'total_tokens': 1162174, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2ac1eb0508190931837466323d192', completion_window='24h', created_at=1758637086, endpoint='/v1/chat/completions', input_file_id='file-AvwVdwBebW4DWJs6qe1FPc', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758643647, error_file_id=None, errors=None, expired_at=None, expires_at=1758723486, failed_at=None, finalizing_at=1758643562, in_progress_at=1758637088, metadata={'description': 'Asynchronous job'}, output_file_id='file-F1g58vU9MPnML8wxduAkyT', request_counts=BatchRequestCounts(completed=600, failed=0, total=600), model='gpt-4.1-2025-04-14', usage={'input_tokens': 1044839, 'output_tokens': 697090, 'total_tokens': 1741929, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2ac1f2e7c8190af78406f6ba3bf87', completion_window='24h', created_at=1758637087, endpoint='/v1/chat/completions', input_file_id='file-488YKEYJotPCRXPk3dQEXF', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758644845, error_file_id=None, errors=None, expired_at=None, expires_at=1758723487, failed_at=None, finalizing_at=1758644790, in_progress_at=1758637089, metadata={'description': 'Asynchronous job'}, output_file_id='file-FNfCJrTDRoQHhvRXrMPikc', request_counts=BatchRequestCounts(completed=600, failed=0, total=600), model='gpt-4.1-2025-04-14', usage={'input_tokens': 993896, 'output_tokens': 870130, 'total_tokens': 1864026, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2ac1fb0c08190a86afe5acd4b20a1', completion_window='24h', created_at=1758637087, endpoint='/v1/chat/completions', input_file_id='file-EQA77ivoy2VwVPPYKtR1r8', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758664171, error_file_id=None, errors=None, expired_at=None, expires_at=1758723487, failed_at=None, finalizing_at=1758664081, in_progress_at=1758637091, metadata={'description': 'Asynchronous job'}, output_file_id='file-JhZGks3MGeMrBJ1k9hZ3kK', request_counts=BatchRequestCounts(completed=600, failed=0, total=600), model='gpt-4.1-2025-04-14', usage={'input_tokens': 952583, 'output_tokens': 728195, 'total_tokens': 1680778, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2ac2046008190963f900173fe3175', completion_window='24h', created_at=1758637088, endpoint='/v1/chat/completions', input_file_id='file-QQhV3AuhfdcpEDZ4A5CDb8', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758663537, error_file_id='file-HitbzDdf6UrR7ZctV9zWVt', errors=None, expired_at=None, expires_at=1758723488, failed_at=None, finalizing_at=1758663502, in_progress_at=1758637090, metadata={'description': 'Asynchronous job'}, output_file_id='file-UcJzwq5Bo7wS11JmKULwZo', request_counts=BatchRequestCounts(completed=166, failed=34, total=200), model='gpt-4.1-2025-04-14', usage={'input_tokens': 576134, 'output_tokens': 505188, 'total_tokens': 1081322, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2ac20f7d48190a8e9a9504dc1a13a', completion_window='24h', created_at=1758637088, endpoint='/v1/chat/completions', input_file_id='file-5efYKbtDwUc1KuKcBkJTJD', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758663736, error_file_id='file-TJdRReeiRQb6cQCqcKVeDt', errors=None, expired_at=None, expires_at=1758723488, failed_at=None, finalizing_at=1758663545, in_progress_at=1758637091, metadata={'description': 'Asynchronous job'}, output_file_id='file-YDtkb8mi4L5AxecD9JiPey', request_counts=BatchRequestCounts(completed=598, failed=2, total=600), model='gpt-4.1-2025-04-14', usage={'input_tokens': 1071343, 'output_tokens': 828797, 'total_tokens': 1900140, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2ac21a87081909d05e70b4b0c394d', completion_window='24h', created_at=1758637089, endpoint='/v1/chat/completions', input_file_id='file-YTN5KGnge6wVbehUi21DUw', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758651718, error_file_id=None, errors=None, expired_at=None, expires_at=1758723489, failed_at=None, finalizing_at=1758651678, in_progress_at=1758637091, metadata={'description': 'Asynchronous job'}, output_file_id='file-LeTQ3QWJvLFai69Lyi8Vbn', request_counts=BatchRequestCounts(completed=600, failed=0, total=600), model='gpt-4.1-2025-04-14', usage={'input_tokens': 1024375, 'output_tokens': 690563, 'total_tokens': 1714938, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2ac2233388190a2dd1aef72ec1fc7', completion_window='24h', created_at=1758637090, endpoint='/v1/chat/completions', input_file_id='file-LJ5sHv3NPsoUEPcjcqSC34', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758643863, error_file_id=None, errors=None, expired_at=None, expires_at=1758723490, failed_at=None, finalizing_at=1758643762, in_progress_at=1758637091, metadata={'description': 'Asynchronous job'}, output_file_id='file-EPoXRqycQE37YaC6Jdw8cj', request_counts=BatchRequestCounts(completed=600, failed=0, total=600), model='gpt-4.1-2025-04-14', usage={'input_tokens': 982556, 'output_tokens': 479996, 'total_tokens': 1462552, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d2ac22b9e8819083c08e405d20c780', completion_window='24h', created_at=1758637090, endpoint='/v1/chat/completions', input_file_id='file-LKSm1jxPyEePJRAyfoUAr6', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758641144, error_file_id=None, errors=None, expired_at=None, expires_at=1758723490, failed_at=None, finalizing_at=1758641118, in_progress_at=1758637093, metadata={'description': 'Asynchronous job'}, output_file_id='file-2rNygpYusK9KSXKHx13eUn', request_counts=BatchRequestCounts(completed=200, failed=0, total=200), model='gpt-4.1-2025-04-14', usage={'input_tokens': 744933, 'output_tokens': 198943, 'total_tokens': 943876, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n"
     ]
    }
   ],
   "source": [
    "for batch in openai_batches:\n",
    "    batch_id_info = open_ai_client.batches.retrieve(batch.id)\n",
    "    print(batch_id_info)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "id": "45f9f6d1",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Saving to /home/rodionfa/FloorplanQA/qa_response/shortest_path/living_rooms/gpt-4.1-2025-04-14_12288.jsonl\n",
      "Saving to /home/rodionfa/FloorplanQA/qa_response/shortest_path/bedrooms/gpt-4.1-2025-04-14_12288.jsonl\n",
      "Saving to /home/rodionfa/FloorplanQA/qa_response/shortest_path/kitchens/gpt-4.1-2025-04-14_12288.jsonl\n",
      "Saving to /home/rodionfa/FloorplanQA/qa_response/shortest_path/hssd_data_simplified/gpt-4.1-2025-04-14_12288.jsonl\n",
      "Saving to /home/rodionfa/FloorplanQA/qa_response/obstruction/living_rooms/gpt-4.1-2025-04-14_12288.jsonl\n",
      "Saving to /home/rodionfa/FloorplanQA/qa_response/obstruction/bedrooms/gpt-4.1-2025-04-14_12288.jsonl\n",
      "Saving to /home/rodionfa/FloorplanQA/qa_response/obstruction/kitchens/gpt-4.1-2025-04-14_12288.jsonl\n",
      "Saving to /home/rodionfa/FloorplanQA/qa_response/obstruction/hssd_data_simplified/gpt-4.1-2025-04-14_12288.jsonl\n",
      "Saving to /home/rodionfa/FloorplanQA/qa_response/view_angle/living_rooms/gpt-4.1-2025-04-14_12288.jsonl\n",
      "Saving to /home/rodionfa/FloorplanQA/qa_response/view_angle/bedrooms/gpt-4.1-2025-04-14_12288.jsonl\n",
      "Saving to /home/rodionfa/FloorplanQA/qa_response/view_angle/kitchens/gpt-4.1-2025-04-14_12288.jsonl\n",
      "Saving to /home/rodionfa/FloorplanQA/qa_response/view_angle/hssd_data_simplified/gpt-4.1-2025-04-14_12288.jsonl\n",
      "Saving to /home/rodionfa/FloorplanQA/qa_response/max_box/living_rooms/gpt-4.1-2025-04-14_12288.jsonl\n",
      "Saving to /home/rodionfa/FloorplanQA/qa_response/max_box/bedrooms/gpt-4.1-2025-04-14_12288.jsonl\n",
      "Saving to /home/rodionfa/FloorplanQA/qa_response/max_box/kitchens/gpt-4.1-2025-04-14_12288.jsonl\n",
      "Saving to /home/rodionfa/FloorplanQA/qa_response/max_box/hssd_data_simplified/gpt-4.1-2025-04-14_12288.jsonl\n"
     ]
    }
   ],
   "source": [
    "index = 0\n",
    "for max_tokens, model_id in openai_models_list:\n",
    "    for dataset in datasets:\n",
    "        for room_type in room_types:\n",
    "            batch = openai_batches[index]\n",
    "            index += 1\n",
    "            # if batch.id in done_set:\n",
    "\n",
    "            batch_id_info = open_ai_client.batches.retrieve(batch.id)\n",
    "            batch_result = open_ai_client.files.content(batch_id_info.output_file_id)\n",
    "\n",
    "            model_name = model_id.split(\"/\")[-1]\n",
    "\n",
    "            output_jsonl = f\"/home/rodionfa/FloorplanQA/qa_response/{dataset}/{room_type}/{model_name}_{max_tokens}.jsonl\"\n",
    "            print('Saving to', output_jsonl)\n",
    "            output_jsonl = Path(output_jsonl)\n",
    "            output_jsonl.parent.mkdir(parents=True, exist_ok=True)\n",
    "\n",
    "            with open(output_jsonl, \"w\") as f:\n",
    "                for line in batch_result.text.strip().splitlines():\n",
    "                    line = json.loads(line)\n",
    "                    json.dump(line, f)\n",
    "                    f.write(\"\\n\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "feda6a99",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "id": "e4886cf4",
   "metadata": {},
   "outputs": [],
   "source": [
    "from pathlib import Path\n",
    "import json, io\n",
    "\n",
    "def _parse_jsonl(text):\n",
    "    if not text:\n",
    "        return []\n",
    "    return [json.loads(line) for line in io.StringIO(text) if line.strip()]\n",
    "\n",
    "# ---- Rebuild the same iteration order your loop used, to align with openai_batches ----\n",
    "param_grid = []  # [(max_tokens, model_id, dataset, room_type)]\n",
    "for max_tokens, model_id in openai_models_list:\n",
    "    for dataset in datasets:\n",
    "        for room_type in room_types:\n",
    "            param_grid.append((max_tokens, model_id, dataset, room_type))\n",
    "\n",
    "assert len(param_grid) == len(openai_batches), \"param_grid and openai_batches must align 1:1\"\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "id": "74376033",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Retrying 2 rows from batch batch_68d2ac1b30f081909034788f573b97b5...\n",
      "Retrying 1 rows from batch batch_68d2ac1becf08190812a8285abe59853...\n",
      "Retrying 3 rows from batch batch_68d2ac1da2348190a53f71f6e61fbcfa...\n",
      "Retrying 34 rows from batch batch_68d2ac2046008190963f900173fe3175...\n",
      "Retrying 2 rows from batch batch_68d2ac20f7d48190a8e9a9504dc1a13a...\n"
     ]
    }
   ],
   "source": [
    "openai_retied_batches = []  # same length, index-aligned with openai_batches\n",
    "\n",
    "for i, batch in enumerate(openai_batches):\n",
    "    # retrieve batch + its files\n",
    "    b = open_ai_client.batches.retrieve(batch.id)\n",
    "\n",
    "    # pull original input (to reconstruct failed rows exactly)\n",
    "    in_text = open_ai_client.files.content(b.input_file_id).text\n",
    "    input_rows = _parse_jsonl(in_text)\n",
    "    by_custom = {r.get(\"custom_id\"): r for r in input_rows if r.get(\"custom_id\") is not None}\n",
    "    by_id     = {r.get(\"id\"):        r for r in input_rows if r.get(\"id\") is not None}\n",
    "\n",
    "    # read errors for this batch\n",
    "    failed_rows = []\n",
    "    if getattr(b, \"error_file_id\", None):\n",
    "        err_text = open_ai_client.files.content(b.error_file_id).text\n",
    "        for line in _parse_jsonl(err_text):\n",
    "            # keep ALL failures; if you want only transient, filter on line.get(\"status_code\") here\n",
    "            cid = line.get(\"custom_id\")\n",
    "            rid = line.get(\"id\")\n",
    "            src = by_custom.get(cid) if cid in by_custom else by_id.get(rid)\n",
    "            if src:\n",
    "                failed_rows.append(src)\n",
    "\n",
    "    if not failed_rows:\n",
    "        # no retry needed for this slot\n",
    "        openai_retied_batches.append(None)\n",
    "        continue\n",
    "\n",
    "    print(f\"Retrying {len(failed_rows)} rows from batch {batch.id}...\")\n",
    "    # write a retry-only JSONL (one per original batch) and submit a new batch\n",
    "    retry_payload_path = Path(f\"./retry_failed_{i}.jsonl\")\n",
    "    retry_payload_path.parent.mkdir(parents=True, exist_ok=True)\n",
    "    with retry_payload_path.open(\"w\", encoding=\"utf-8\") as f:\n",
    "        for row in failed_rows:\n",
    "            f.write(json.dumps(row, ensure_ascii=False) + \"\\n\")\n",
    "\n",
    "    file_obj = open_ai_client.files.create(file=retry_payload_path.open(\"rb\"), purpose=\"batch\")\n",
    "\n",
    "    retry_batch = open_ai_client.batches.create(\n",
    "        input_file_id=file_obj.id,\n",
    "        endpoint=\"/v1/chat/completions\",\n",
    "        completion_window=\"24h\",\n",
    "        metadata={\n",
    "            \"description\": \"Asynchronous job\",\n",
    "            \"retry_of\": batch.id\n",
    "        }\n",
    "    )\n",
    "\n",
    "    openai_retied_batches.append(retry_batch)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "id": "5169ec35",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Batch(id='batch_68d3975c8a888190828f85750b52e290', completion_window='24h', created_at=1758697308, endpoint='/v1/chat/completions', input_file_id='file-NUg8b5MM4EDrfCjDGYzMu7', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758697447, error_file_id=None, errors=None, expired_at=None, expires_at=1758783708, failed_at=None, finalizing_at=1758697445, in_progress_at=1758697369, metadata={'description': 'Asynchronous job', 'retry_of': 'batch_68d2ac1b30f081909034788f573b97b5'}, output_file_id='file-8L4YHuLT7DNaWK42yG1xyt', request_counts=BatchRequestCounts(completed=2, failed=0, total=2), model='gpt-4.1-2025-04-14', usage={'input_tokens': 3478, 'output_tokens': 3806, 'total_tokens': 7284, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d39761cfb48190819815eea1d5518b', completion_window='24h', created_at=1758697313, endpoint='/v1/chat/completions', input_file_id='file-5BYruQmn4wGy1ayNHQV5Sf', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758697398, error_file_id=None, errors=None, expired_at=None, expires_at=1758783713, failed_at=None, finalizing_at=1758697395, in_progress_at=1758697374, metadata={'description': 'Asynchronous job', 'retry_of': 'batch_68d2ac1becf08190812a8285abe59853'}, output_file_id='file-8Nm3GpX8yhqoAe3hzRAcij', request_counts=BatchRequestCounts(completed=1, failed=0, total=1), model='gpt-4.1-2025-04-14', usage={'input_tokens': 1936, 'output_tokens': 3208, 'total_tokens': 5144, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d3976b3fc4819087362dce8ec9b4c7', completion_window='24h', created_at=1758697323, endpoint='/v1/chat/completions', input_file_id='file-SxjvqjuciQbJrreJFT73b5', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758697536, error_file_id=None, errors=None, expired_at=None, expires_at=1758783723, failed_at=None, finalizing_at=1758697533, in_progress_at=1758697386, metadata={'description': 'Asynchronous job', 'retry_of': 'batch_68d2ac1da2348190a53f71f6e61fbcfa'}, output_file_id='file-6RcmZf4PKcCWXTWS11nH8C', request_counts=BatchRequestCounts(completed=3, failed=0, total=3), model='gpt-4.1-2025-04-14', usage={'input_tokens': 9248, 'output_tokens': 10387, 'total_tokens': 19635, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d3977aa7848190baa8dd662d7aee71', completion_window='24h', created_at=1758697338, endpoint='/v1/chat/completions', input_file_id='file-HGWNcYCnrkoZWYhzbMcz3t', object='batch', status='in_progress', cancelled_at=None, cancelling_at=None, completed_at=None, error_file_id=None, errors=None, expired_at=None, expires_at=1758783738, failed_at=None, finalizing_at=None, in_progress_at=1758697340, metadata={'description': 'Asynchronous job', 'retry_of': 'batch_68d2ac2046008190963f900173fe3175'}, output_file_id=None, request_counts=BatchRequestCounts(completed=16, failed=0, total=34), model='gpt-4.1-2025-04-14', usage={'input_tokens': 0, 'output_tokens': 0, 'total_tokens': 0, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n",
      "Batch(id='batch_68d3977f4ec48190982c3c27f0e56957', completion_window='24h', created_at=1758697343, endpoint='/v1/chat/completions', input_file_id='file-WBXLTwLnUfsKK7gX8mBjh6', object='batch', status='completed', cancelled_at=None, cancelling_at=None, completed_at=1758697369, error_file_id=None, errors=None, expired_at=None, expires_at=1758783743, failed_at=None, finalizing_at=1758697367, in_progress_at=1758697344, metadata={'description': 'Asynchronous job', 'retry_of': 'batch_68d2ac20f7d48190a8e9a9504dc1a13a'}, output_file_id='file-CuSg4rxiSUw1yggqBGbWUV', request_counts=BatchRequestCounts(completed=2, failed=0, total=2), model='gpt-4.1-2025-04-14', usage={'input_tokens': 3718, 'output_tokens': 3393, 'total_tokens': 7111, 'input_tokens_details': {'cached_tokens': 0}, 'output_tokens_details': {'reasoning_tokens': 0}})\n"
     ]
    }
   ],
   "source": [
    "for batch in openai_retied_batches:\n",
    "    if batch is not None:\n",
    "        batch_id_info = open_ai_client.batches.retrieve(batch.id)\n",
    "        print(batch_id_info)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c9569cca",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "plan_b",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.17"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
