{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "executionInfo": {
     "elapsed": 540,
     "status": "ok",
     "timestamp": 1757237857593,
     "user": {
      "displayName": "Nicla Faccioli",
      "userId": "11628056964833727666"
     },
     "user_tz": -120
    },
    "id": "MOeLdKtwkLZ8"
   },
   "outputs": [],
   "source": [
    "import random\n",
    "import csv\n",
    "\n",
    "import math\n",
    "\n",
    "import pandas as pd\n",
    "import matplotlib.pyplot as plt\n",
    "import matplotlib.patches as patches\n",
    "\n",
    "import textwrap\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "executionInfo": {
     "elapsed": 3,
     "status": "ok",
     "timestamp": 1757237857595,
     "user": {
      "displayName": "Nicla Faccioli",
      "userId": "11628056964833727666"
     },
     "user_tz": -120
    },
    "id": "iSwKBb4wkS6D"
   },
   "outputs": [],
   "source": [
    "def parse_bbox(bbox_str):\n",
    "    if pd.isna(bbox_str) or bbox_str == '':\n",
    "        return None\n",
    "    return tuple(map(int, bbox_str.split(',')))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "hH-rVNHgj3et"
   },
   "outputs": [],
   "source": [
    "def visualize_csv_boxes_grid(csv_path, num_samples=35, boxes_per_row=5, random_seed=42):\n",
    "    df = pd.read_csv(csv_path)\n",
    "    sampled_rows = df.sample(n=num_samples, random_state=random_seed)\n",
    "\n",
    "    num_cols = boxes_per_row\n",
    "    num_rows = math.ceil(num_samples / num_cols)\n",
    "\n",
    "    fig, axes = plt.subplots(num_rows, num_cols, figsize=(boxes_per_row * 4, num_rows * 4))\n",
    "    axes = axes.flatten()  # easy indexing even if last row is incomplete\n",
    "\n",
    "    for ax, (idx, row) in zip(axes, sampled_rows.iterrows()):\n",
    "        # Read the boxes\n",
    "        boxes = []\n",
    "        labels = []\n",
    "        for i in range(1, 5):\n",
    "            obj_col = f'obj{i}'\n",
    "            bbox_col = f'bbox{i}'\n",
    "            obj_name = row[obj_col]\n",
    "            bbox = parse_bbox(row[bbox_col])\n",
    "            if obj_name and isinstance(obj_name, str) and bbox:\n",
    "                boxes.append(bbox)\n",
    "                labels.append(obj_name)\n",
    "\n",
    "        # Plot this row\n",
    "        ax.set_xlim(0, 512)\n",
    "        ax.set_ylim(0, 512)\n",
    "        ax.invert_yaxis()\n",
    "\n",
    "        for i, box in enumerate(boxes):\n",
    "            x1, y1, x3, y3 = box\n",
    "            width = x3 - x1\n",
    "            height = y3 - y1\n",
    "            rect = patches.Rectangle((x1, y1), width, height, linewidth=2, edgecolor='r', facecolor='none')\n",
    "            ax.add_patch(rect)\n",
    "\n",
    "            # Label\n",
    "            ax.text(x1 + 3, y1 - 5, labels[i], color='blue', fontsize=8)\n",
    "\n",
    "        ax.set_title(f'ID {row[\"id\"]}\\n{row[\"prompt\"]}\\n{row[\"category\"]}', fontsize=10)\n",
    "        ax.grid(True)\n",
    "\n",
    "    # Hide unused axes (if num_samples is not multiple of boxes_per_row)\n",
    "    for ax in axes[num_samples:]:\n",
    "        ax.axis('off')\n",
    "\n",
    "    plt.tight_layout()\n",
    "    plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 1000
    },
    "executionInfo": {
     "elapsed": 7726,
     "status": "ok",
     "timestamp": 1756503223581,
     "user": {
      "displayName": "Nicla Faccioli",
      "userId": "11628056964833727666"
     },
     "user_tz": -120
    },
    "id": "qwVXHVH7kAgd",
    "outputId": "1d379c33-e6b3-47d9-dfa0-d485de3a32e3"
   },
   "outputs": [],
   "source": [
    "visualize_csv_boxes_grid('openSet.csv', num_samples=35, boxes_per_row=5, random_seed=42)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "Ro-3TTLclxJ2"
   },
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "executionInfo": {
     "elapsed": 18,
     "status": "ok",
     "timestamp": 1757237872200,
     "user": {
      "displayName": "Nicla Faccioli",
      "userId": "11628056964833727666"
     },
     "user_tz": -120
    },
    "id": "vwV8xrXKkYXK"
   },
   "outputs": [],
   "source": [
    "def visualize_csv_boxes_by_ids(csv_path, selected_ids, boxes_per_row=4, output_path=None):\n",
    "    import pandas as pd\n",
    "    import matplotlib.pyplot as plt\n",
    "    import matplotlib.patches as patches\n",
    "    import math\n",
    "\n",
    "    def parse_bbox(bbox_str):\n",
    "        try:\n",
    "            return list(map(int, bbox_str.split(',')))\n",
    "        except:\n",
    "            return None\n",
    "\n",
    "    df = pd.read_csv(csv_path)\n",
    "\n",
    "    padded_ids = [str(id_) for id_ in selected_ids]\n",
    "    selected_rows = df[df['id'].astype(str).isin(padded_ids)]\n",
    "\n",
    "    if selected_rows.empty:\n",
    "        print(\"⚠️ No matching IDs found.\")\n",
    "        return\n",
    "\n",
    "    num_samples = len(selected_rows)\n",
    "    num_cols = boxes_per_row\n",
    "    num_rows = math.ceil(num_samples / num_cols)\n",
    "\n",
    "    fig, axes = plt.subplots(num_rows, num_cols, figsize=(boxes_per_row * 4, num_rows * 4), squeeze=False)\n",
    "    axes = axes.flatten()\n",
    "\n",
    "    for ax, (_, row) in zip(axes, selected_rows.iterrows()):\n",
    "        boxes, labels = [], []\n",
    "        for i in range(1, 5):\n",
    "            obj_col, bbox_col = f'obj{i}', f'bbox{i}'\n",
    "            obj_name = row[obj_col]\n",
    "            bbox = parse_bbox(row[bbox_col])\n",
    "            if obj_name and isinstance(obj_name, str) and bbox:\n",
    "                boxes.append(bbox)\n",
    "                labels.append(obj_name)\n",
    "\n",
    "        ax.set_xlim(0, 512)\n",
    "        ax.set_ylim(0, 512)\n",
    "        ax.invert_yaxis()\n",
    "\n",
    "        for i, box in enumerate(boxes):\n",
    "            x1, y1, x3, y3 = box\n",
    "            rect = patches.Rectangle((x1, y1), x3 - x1, y3 - y1,\n",
    "                                     linewidth=2, edgecolor='r', facecolor='none')\n",
    "            ax.add_patch(rect)\n",
    "            ax.text(x1 + 3, y1 - 5, labels[i], color='blue', fontsize=8)\n",
    "\n",
    "\n",
    "        id_text = f\"ID {row['id']}\"\n",
    "        prompt_text = \"\\n\".join(textwrap.wrap(row[\"prompt\"], width=50))  # adjust width\n",
    "        category_text = row[\"category\"]\n",
    "\n",
    "        title_text = f\"{id_text}\\n{prompt_text}\\n{category_text}\"\n",
    "\n",
    "        ax.set_title(title_text, fontsize=10)\n",
    "        ax.grid(True)\n",
    "\n",
    "    # remove extra axes entirely\n",
    "    for ax in axes[num_samples:]:\n",
    "        fig.delaxes(ax)\n",
    "\n",
    "    plt.tight_layout()\n",
    "\n",
    "    if output_path:\n",
    "        plt.savefig(output_path, bbox_inches='tight')\n",
    "\n",
    "    plt.show()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 407
    },
    "executionInfo": {
     "elapsed": 462,
     "status": "ok",
     "timestamp": 1757170308135,
     "user": {
      "displayName": "Nicla Faccioli",
      "userId": "11628056964833727666"
     },
     "user_tz": -120
    },
    "id": "HWMhhR9OkbsM",
    "outputId": "db580c22-1533-4d68-a21d-4fc37a7adbca"
   },
   "outputs": [],
   "source": [
    "# Visualize specific prompts (e.g., ID 0, 5, 18, and 29)\n",
    "visualize_csv_boxes_by_ids(\"fullNewDataset.csv\", selected_ids=[183], output_path=\"2359.png\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 337
    },
    "executionInfo": {
     "elapsed": 2199,
     "status": "ok",
     "timestamp": 1757170312506,
     "user": {
      "displayName": "Nicla Faccioli",
      "userId": "11628056964833727666"
     },
     "user_tz": -120
    },
    "id": "tY8dWBjeoFTM",
    "outputId": "31c98c5d-10cf-4cc8-a9c5-b13b4549c5e1"
   },
   "outputs": [],
   "source": [
    "visualize_csv_boxes_by_ids(\"fullNewDataset.csv\", selected_ids=[2158,2219,2336,2517], output_path=\"sb_boxes.pdf\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 407
    },
    "executionInfo": {
     "elapsed": 364,
     "status": "ok",
     "timestamp": 1757170314203,
     "user": {
      "displayName": "Nicla Faccioli",
      "userId": "11628056964833727666"
     },
     "user_tz": -120
    },
    "id": "AF5PqumDo2S9",
    "outputId": "d283f53e-012e-4f6a-87cd-d9f6a2ca965a"
   },
   "outputs": [],
   "source": [
    "visualize_csv_boxes_by_ids(\"fullNewDataset.csv\", selected_ids=[2008], output_path=\"over_boxes.pdf\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 407
    },
    "executionInfo": {
     "elapsed": 346,
     "status": "ok",
     "timestamp": 1757170333224,
     "user": {
      "displayName": "Nicla Faccioli",
      "userId": "11628056964833727666"
     },
     "user_tz": -120
    },
    "id": "DvKmE0NGpoBN",
    "outputId": "b2736882-5dfa-4720-9a8b-43b01a6bce53"
   },
   "outputs": [],
   "source": [
    "visualize_csv_boxes_by_ids(\"fullNewDataset.csv\", selected_ids=[783], output_path=\"cb_boxes.pdf\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 382
    },
    "executionInfo": {
     "elapsed": 1325,
     "status": "ok",
     "timestamp": 1756418467517,
     "user": {
      "displayName": "Nicla Faccioli",
      "userId": "11628056964833727666"
     },
     "user_tz": -120
    },
    "id": "s5rCG7AmqAeO",
    "outputId": "cea8cc3d-e11d-401d-8302-b5e58db90ea1"
   },
   "outputs": [],
   "source": [
    "visualize_csv_boxes_by_ids(\"fullNewDataset.csv\", selected_ids=[1058,1254,1303,1454], output_path=\"ab_boxes.pdf\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 407
    },
    "executionInfo": {
     "elapsed": 373,
     "status": "ok",
     "timestamp": 1757170474624,
     "user": {
      "displayName": "Nicla Faccioli",
      "userId": "11628056964833727666"
     },
     "user_tz": -120
    },
    "id": "yk3c2JPbqVN9",
    "outputId": "c77298f9-d344-41d6-be90-32c29a129298"
   },
   "outputs": [],
   "source": [
    "visualize_csv_boxes_by_ids(\"fullNewDataset.csv\", selected_ids=[2731], output_path=\"or_boxes.pdf\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 407
    },
    "executionInfo": {
     "elapsed": 351,
     "status": "ok",
     "timestamp": 1757170359556,
     "user": {
      "displayName": "Nicla Faccioli",
      "userId": "11628056964833727666"
     },
     "user_tz": -120
    },
    "id": "jBci6MGvqln0",
    "outputId": "193a9050-f069-4933-f572-1625d64c4d22"
   },
   "outputs": [],
   "source": [
    "visualize_csv_boxes_by_ids(\"fullNewDataset.csv\", selected_ids=[2951], output_path=\"cc_boxes.pdf\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 0
    },
    "executionInfo": {
     "elapsed": 2291,
     "status": "ok",
     "timestamp": 1757237909890,
     "user": {
      "displayName": "Nicla Faccioli",
      "userId": "11628056964833727666"
     },
     "user_tz": -120
    },
    "id": "_vG2SMTkwFZb",
    "outputId": "ffd300ab-b1c6-40d5-ddb8-dc22c3e0dbd5"
   },
   "outputs": [],
   "source": [
    "visualize_csv_boxes_by_ids(\"openSet.csv\", selected_ids=[4,385,1499,2471,3033,3210,3275,3318], output_path=\"open_boxes.pdf\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "pyvs5kp6vM-6"
   },
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "colab": {
   "authorship_tag": "ABX9TyPhVfzFLNL9qEF0JovlGIOy",
   "provenance": []
  },
  "kernelspec": {
   "display_name": "Python 3",
   "name": "python3"
  },
  "language_info": {
   "name": "python"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 0
}
