{
 "cells": [
  {
   "cell_type": "code",
   "id": "initial_id",
   "metadata": {
    "collapsed": true
   },
   "source": [
    "import os\n",
    "from shutil import copytree\n",
    "\n",
    "import PIL.Image\n",
    "import PIL.ImageDraw2\n",
    "from tqdm import tqdm\n",
    "\n",
    "from src.bongard_problems.rendering import draw_compact_bongard_problem, resize"
   ],
   "outputs": [],
   "execution_count": null
  },
  {
   "cell_type": "code",
   "id": "6bac1f16b0226a47",
   "metadata": {},
   "source": [
    "# Expand \"~\" up front: os.listdir and shutil.copytree treat it as a literal directory name,\n",
    "# so unexpanded paths make every later cell fail with FileNotFoundError.\n",
    "source_dir = os.path.expanduser(\"~/Projects/llm-avr-benchmarks/data/raw/bongard_rwr_splitted\")\n",
    "target_dir = os.path.expanduser(\"~/Projects/llm-avr-benchmarks/data/raw/bongard_rwr\")\n",
    "target_labels_path = os.path.expanduser(\"~/Projects/llm-avr-benchmarks/data/raw/bongard_translated.csv\")"
   ],
   "outputs": [],
   "execution_count": null
  },
  {
   "cell_type": "markdown",
   "id": "57ca8e7bd49efd5e",
   "metadata": {},
   "source": [
    "## Copy images from original dataset directory to processed directory"
   ]
  },
  {
   "cell_type": "code",
   "id": "27696769692c707a",
   "metadata": {},
   "source": [
    "# Copy every problem directory from source_dir into target_dir.\n",
    "for problem_id in tqdm(sorted(os.listdir(source_dir))):\n",
    "    problem_source_dir = f\"{source_dir}/{problem_id}\"\n",
    "    # Skip stray files (e.g. .DS_Store): copytree only accepts directories.\n",
    "    if not os.path.isdir(problem_source_dir):\n",
    "        continue\n",
    "    # dirs_exist_ok=True keeps the cell re-runnable; without it copytree raises\n",
    "    # FileExistsError as soon as a problem directory already exists in target_dir.\n",
    "    copytree(problem_source_dir, f\"{target_dir}/{problem_id}\", dirs_exist_ok=True)"
   ],
   "outputs": [],
   "execution_count": null
  },
  {
   "cell_type": "markdown",
   "id": "f516ef66e1b07174",
   "metadata": {},
   "source": [
    "## Resize each image so that the bigger dimension (height or width) is at most 512px"
   ]
  },
  {
   "cell_type": "code",
   "id": "658e4f58e7e6da89",
   "metadata": {},
   "source": [
    "# Convert every left/right image to RGB, pass it through resize(image, 512) and overwrite the file in place.\n",
    "for problem_id in tqdm(sorted(os.listdir(target_dir))):\n",
    "    for side in [\"left\", \"right\"]:\n",
    "        side_dir = f\"{target_dir}/{problem_id}/{side}\"\n",
    "        for filename in os.listdir(side_dir):\n",
    "            filepath = f\"{side_dir}/{filename}\"\n",
    "            try:\n",
    "                # Image.open is lazy and can keep the file handle open; release it\n",
    "                # before the same path is overwritten by save() below.\n",
    "                with PIL.Image.open(filepath) as source_image:\n",
    "                    image = source_image.convert(\"RGB\")\n",
    "                image = resize(image, 512)\n",
    "                image.save(filepath)\n",
    "            except Exception as e:\n",
    "                # Best effort: report the offending file and continue with the rest.\n",
    "                print(filepath, e)"
   ],
   "outputs": [],
   "execution_count": null
  },
  {
   "cell_type": "markdown",
   "id": "dadd096d62aa704b",
   "metadata": {},
   "source": [
    "## Arrange each problem's images into a single matrix whose area is minimized; resize it to at most 1024px per dimension"
   ]
  },
  {
   "cell_type": "code",
   "id": "1ffe835c0cc81310",
   "metadata": {},
   "source": [
    "# Black-background rendering: the per-side canvases and the combined canvas are saved inside each problem directory.\n",
    "for problem_id in tqdm(sorted(os.listdir(target_dir))):\n",
    "    problem_dir = f\"{target_dir}/{problem_id}\"\n",
    "    # The generator is consumed in order, so the left side is listed and opened before the right.\n",
    "    left_images, right_images = (\n",
    "        [\n",
    "            PIL.Image.open(f\"{problem_dir}/{side_name}/{filename}\")\n",
    "            for filename in sorted(os.listdir(f\"{problem_dir}/{side_name}\"))\n",
    "        ]\n",
    "        for side_name in (\"left\", \"right\")\n",
    "    )\n",
    "    rendering_options = dict(\n",
    "        margin=10,\n",
    "        side_max_size=512,\n",
    "        max_size=1024,\n",
    "        background_color=\"black\",\n",
    "        separator_color=\"white\",\n",
    "    )\n",
    "    left_canvas, right_canvas, canvas = draw_compact_bongard_problem(\n",
    "        left_images, right_images, **rendering_options\n",
    "    )\n",
    "    for stem, rendered in ((\"left\", left_canvas), (\"right\", right_canvas), (\"whole\", canvas)):\n",
    "        rendered.save(f\"{problem_dir}/{stem}.png\")"
   ],
   "outputs": [],
   "execution_count": null
  },
  {
   "cell_type": "markdown",
   "id": "6373668081260067",
   "metadata": {},
   "source": [
    "## Arrange again, this time with a white background and a black separator"
   ]
  },
  {
   "cell_type": "code",
   "id": "320ff65ab55d9242",
   "metadata": {},
   "source": [
    "# White-background variant: only the combined canvas is saved, as whole-white.png.\n",
    "for problem_id in tqdm(sorted(os.listdir(target_dir))):\n",
    "    problem_dir = f\"{target_dir}/{problem_id}\"\n",
    "\n",
    "    left_dir = f\"{problem_dir}/left\"\n",
    "    left_images = []\n",
    "    for filename in sorted(os.listdir(left_dir)):\n",
    "        left_images.append(PIL.Image.open(f\"{left_dir}/{filename}\"))\n",
    "\n",
    "    right_dir = f\"{problem_dir}/right\"\n",
    "    right_images = []\n",
    "    for filename in sorted(os.listdir(right_dir)):\n",
    "        right_images.append(PIL.Image.open(f\"{right_dir}/{filename}\"))\n",
    "\n",
    "    # The per-side canvases are returned as well but are not saved for this variant.\n",
    "    left_canvas, right_canvas, canvas = draw_compact_bongard_problem(\n",
    "        left_images,\n",
    "        right_images,\n",
    "        margin=10,\n",
    "        side_max_size=512,\n",
    "        max_size=1024,\n",
    "        background_color=\"white\",\n",
    "        separator_color=\"black\",\n",
    "    )\n",
    "    canvas.save(f\"{problem_dir}/whole-white.png\")"
   ],
   "outputs": [],
   "execution_count": null
  },
  {
   "cell_type": "code",
   "id": "8bbaa3087b3b8a14",
   "metadata": {},
   "source": [],
   "outputs": [],
   "execution_count": null
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 2
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython2",
   "version": "3.9.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
