{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import sys \n",
    "sys.path.append('../')\n",
    "sys.path.append('./')\n",
    "from  tiny_imagenet  import * "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "data_conf = {'dimension':256, 'data_path':'../../data/tiny-imagenet/tiny-imagenet-200/' }\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "tiny_img_net_ds = TinyImageNet200(data_conf)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "tiny_img_net_ds.build_dataset()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "len(tiny_img_net_ds.ds_std_train),len(tiny_img_net_ds.ds_std_val)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "tiny_img_net_ds.ds_std_train.X[0].shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_model_info(model_ID, device):\n",
    "# Save the model to device\n",
    "\tmodel = CLIPModel.from_pretrained(model_ID).to(device)\n",
    " \t# Get the processor\n",
    "\tprocessor = CLIPProcessor.from_pretrained(model_ID)\n",
    "# Get the tokenizer\n",
    "\ttokenizer = CLIPTokenizer.from_pretrained(model_ID)\n",
    "       # Return model, processor & tokenizer\n",
    "\treturn model, processor, tokenizer\n",
    "# Set the device\n",
    "device = \"cuda\" if torch.cuda.is_available() else \"cpu\"\n",
    "# Define the model ID\n",
    "model_ID = \"openai/clip-vit-base-patch32\"\n",
    "# Get model, processor & tokenizer\n",
    "model, processor, tokenizer = get_model_info(model_ID, device)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_single_image_embedding(my_image):\n",
    "    image = processor( text = None, images = my_image, return_tensors=\"pt\"\n",
    "\t\t)[\"pixel_values\"].to(device)\n",
    "    \n",
    "    embedding = model.get_image_features(image)\n",
    "    # convert the embeddings to numpy array\n",
    "    embedding_as_np = embedding.cpu().detach().numpy()\n",
    "    return embedding_as_np\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch \n",
    "from transformers import CLIPProcessor, CLIPModel, CLIPTokenizer"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "path =''\n",
    "\n",
    "from PIL import Image \n",
    "\n",
    "image = Image.open(path).convert(\"RGB\")\n",
    "lst_images = [image,image,image]\n",
    "v = get_single_image_embedding()\n",
    "v.shape "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "lst_images = [image]*100\n",
    "image_p = processor( text = None, images = lst_images, return_tensors=\"pt\"\n",
    "\t\t)[\"pixel_values\"].to(device)\n",
    "    \n",
    "embedding = model.get_image_features(image_p)\n",
    "# convert the embeddings to numpy array\n",
    "embedding_as_np = embedding.cpu().detach().numpy()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "embedding_as_np.shape "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "np.dot(embedding_as_np[0],embedding_as_np[1])/(np.linalg.norm(embedding_as_np[0])**2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "act-lbl",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.4"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
