{
  "cells": [
    {
      "cell_type": "markdown",
      "metadata": {},
      "source": [
        "# Imports"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 2,
      "metadata": {},
      "outputs": [],
      "source": [
        "import os\n",
        "import shutil\n",
        "import random"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {},
      "source": [
        "# Dataset Spliting\n"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {},
      "outputs": [],
      "source": [
        "random.seed(42)\n",
        "\n",
        "print(\"Current working directory:\", os.getcwd())\n",
        "\n",
        "os.chdir(r\"./Data_files/Cyst_vs_Normal\")\n",
        "# os.chdir(r\"./Data_files/Cyst_vs_Stone\")\n",
        "# os.chdir(r\"./Data_files/Cyst_vs_Tumor\")\n",
        "# os.chdir(r\"./Data_files/Stone_vs_Tumor\")\n",
        "\n",
        "# Define the classes\n",
        "two_classes = [\"Cyst\", \"Normal\"]\n",
        "# two_classes = [\"Cyst\", \"Stone\"]\n",
        "# two_classes = [\"Cyst\", \"Tumor\"]\n",
        "# two_classes = [\"Stone\", \"Tumor\"]\n",
        "\n",
        "\n",
        "shutil.rmtree('Split_ds', ignore_errors=True)\n",
        "os.makedirs(f'Split_ds/training/{two_classes[0]}', exist_ok=True)\n",
        "os.makedirs(f'Split_ds/training/{two_classes[1]}', exist_ok=True)\n",
        "os.makedirs(f'Split_ds/validation/{two_classes[0]}', exist_ok=True)\n",
        "os.makedirs(f'Split_ds/validation/{two_classes[1]}', exist_ok=True)\n",
        "os.makedirs(f'Split_ds/testing/{two_classes[0]}', exist_ok=True)\n",
        "os.makedirs(f'Split_ds/testing/{two_classes[1]}', exist_ok=True)\n",
        "\n",
        "class_1 = []\n",
        "class_2 = []\n",
        "\n",
        "\n",
        "for image in os.listdir(f\"Full_ds/{two_classes[0]}\"):\n",
        "    class_1.append(f\"Full_ds/{two_classes[0]}/{image}\")\n",
        "\n",
        "for image in os.listdir(f\"Full_ds/{two_classes[1]}\"):\n",
        "    class_2.append(f\"Full_ds/{two_classes[1]}/{image}\")\n",
        "\n",
        "images = class_1 + class_2\n",
        "random.shuffle(images)\n",
        "\n",
        "num_images = len(images)\n",
        "train_num = int(0.8 * num_images)\n",
        "val_num = int(0.1 * num_images)\n",
        "print(\"train_num: \", train_num)\n",
        "print(\"val_num: \", val_num)\n",
        "print(\"test_num: \", num_images - train_num - val_num)\n",
        "\n",
        "train = images[0:train_num]\n",
        "val = images[train_num:train_num + val_num]\n",
        "test = images[train_num + val_num:]\n",
        "\n",
        "\n",
        "for image in train:\n",
        "    if image[8] == two_classes[0][0]:\n",
        "        shutil.copy(image, f\"Split_ds/training/{two_classes[0]}\")\n",
        "    if image[8] == two_classes[1][0]:\n",
        "        shutil.copy(image, f\"Split_ds/training/{two_classes[1]}\")\n",
        "\n",
        "for image in val:\n",
        "    if image[8] == two_classes[0][0]:\n",
        "        shutil.copy(image, f\"Split_ds/validation/{two_classes[0]}\")\n",
        "    if image[8] == two_classes[1][0]:\n",
        "        shutil.copy(image, f\"Split_ds/validation/{two_classes[1]}\")\n",
        "\n",
        "for image in test:\n",
        "    if image[8] == two_classes[0][0]:\n",
        "        shutil.copy(image, f\"Split_ds/testing/{two_classes[0]}\")\n",
        "    if image[8] == two_classes[1][0]:\n",
        "        shutil.copy(image, f\"Split_ds/testing/{two_classes[1]}\")"
      ]
    }
  ],
  "metadata": {
    "colab": {
      "authorship_tag": "ABX9TyNN2hYPfQIf1vZ68NUZ4fxu",
      "collapsed_sections": [],
      "include_colab_link": true,
      "mount_file_id": "1ULwSyd2ZI3osiHE79X6KvGrXmE0qTV1S",
      "name": "split_dataset.ipynb",
      "provenance": []
    },
    "kernelspec": {
      "display_name": "Python 3",
      "name": "python3"
    },
    "language_info": {
      "codemirror_mode": {
        "name": "ipython",
        "version": 3
      },
      "file_extension": ".py",
      "mimetype": "text/x-python",
      "name": "python",
      "nbconvert_exporter": "python",
      "pygments_lexer": "ipython3",
      "version": "3.11.5"
    }
  },
  "nbformat": 4,
  "nbformat_minor": 0
}
