{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "502d595c",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "os.sys.path.append(\"..\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "initial_id",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-12-19T06:09:05.039841Z",
     "start_time": "2024-12-19T06:08:15.190757Z"
    },
    "collapsed": true
   },
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/conda/envs/vima/lib/python3.9/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
      "  from .autonotebook import tqdm as notebook_tqdm\n",
      "No CUDA runtime is found, using CUDA_HOME='/usr/local/cuda'\n"
     ]
    },
    {
     "ename": "RuntimeError",
     "evalue": "Found no NVIDIA driver on your system. Please check that you have an NVIDIA GPU and installed a driver from http://www.nvidia.com/Download/index.aspx",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mRuntimeError\u001b[0m                              Traceback (most recent call last)",
      "\u001b[1;32m/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/cunxin/Chameleon-VLA/openvla/notebooks/internvl2.5.ipynb Cell 2\u001b[0m line \u001b[0;36m5\n\u001b[1;32m      <a href='vscode-notebook-cell://nat-notebook-inspire.sii.edu.cn/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/cunxin/Chameleon-VLA/openvla/notebooks/internvl2.5.ipynb#W1sdnNjb2RlLXJlbW90ZQ%3D%3D?line=1'>2</a>\u001b[0m \u001b[39mfrom\u001b[39;00m \u001b[39minternvl\u001b[39;00m\u001b[39m.\u001b[39;00m\u001b[39mextern\u001b[39;00m\u001b[39m.\u001b[39;00m\u001b[39mhf\u001b[39;00m\u001b[39m.\u001b[39;00m\u001b[39mmodeling_internvl\u001b[39;00m \u001b[39mimport\u001b[39;00m InternVLChatModel\n\u001b[1;32m      <a href='vscode-notebook-cell://nat-notebook-inspire.sii.edu.cn/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/cunxin/Chameleon-VLA/openvla/notebooks/internvl2.5.ipynb#W1sdnNjb2RlLXJlbW90ZQ%3D%3D?line=2'>3</a>\u001b[0m \u001b[39mfrom\u001b[39;00m \u001b[39minternvl\u001b[39;00m\u001b[39m.\u001b[39;00m\u001b[39mextern\u001b[39;00m\u001b[39m.\u001b[39;00m\u001b[39mhf\u001b[39;00m\u001b[39m.\u001b[39;00m\u001b[39mtokenization_internlm2\u001b[39;00m \u001b[39mimport\u001b[39;00m InternLM2Tokenizer\n\u001b[0;32m----> <a href='vscode-notebook-cell://nat-notebook-inspire.sii.edu.cn/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/cunxin/Chameleon-VLA/openvla/notebooks/internvl2.5.ipynb#W1sdnNjb2RlLXJlbW90ZQ%3D%3D?line=4'>5</a>\u001b[0m torch\u001b[39m.\u001b[39;49mcuda\u001b[39m.\u001b[39;49mset_device(\u001b[39m3\u001b[39;49m)\n\u001b[1;32m      <a href='vscode-notebook-cell://nat-notebook-inspire.sii.edu.cn/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/cunxin/Chameleon-VLA/openvla/notebooks/internvl2.5.ipynb#W1sdnNjb2RlLXJlbW90ZQ%3D%3D?line=6'>7</a>\u001b[0m model_name_or_path \u001b[39m=\u001b[39m \u001b[39m\"\u001b[39m\u001b[39m/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/cunxin/internvl_checkpoint/2b\u001b[39m\u001b[39m\"\u001b[39m\n\u001b[1;32m      <a href='vscode-notebook-cell://nat-notebook-inspire.sii.edu.cn/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/cunxin/Chameleon-VLA/openvla/notebooks/internvl2.5.ipynb#W1sdnNjb2RlLXJlbW90ZQ%3D%3D?line=8'>9</a>\u001b[0m model \u001b[39m=\u001b[39m InternVLChatModel\u001b[39m.\u001b[39mfrom_pretrained(\n\u001b[1;32m     <a href='vscode-notebook-cell://nat-notebook-inspire.sii.edu.cn/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/cunxin/Chameleon-VLA/openvla/notebooks/internvl2.5.ipynb#W1sdnNjb2RlLXJlbW90ZQ%3D%3D?line=9'>10</a>\u001b[0m     model_name_or_path,\n\u001b[1;32m     <a href='vscode-notebook-cell://nat-notebook-inspire.sii.edu.cn/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/cunxin/Chameleon-VLA/openvla/notebooks/internvl2.5.ipynb#W1sdnNjb2RlLXJlbW90ZQ%3D%3D?line=10'>11</a>\u001b[0m     torch_dtype\u001b[39m=\u001b[39mtorch\u001b[39m.\u001b[39mbfloat16,\n\u001b[0;32m   (...)\u001b[0m\n\u001b[1;32m     <a href='vscode-notebook-cell://nat-notebook-inspire.sii.edu.cn/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/cunxin/Chameleon-VLA/openvla/notebooks/internvl2.5.ipynb#W1sdnNjb2RlLXJlbW90ZQ%3D%3D?line=13'>14</a>\u001b[0m     local_files_only\u001b[39m=\u001b[39m\u001b[39mTrue\u001b[39;00m\n\u001b[1;32m     <a href='vscode-notebook-cell://nat-notebook-inspire.sii.edu.cn/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/cunxin/Chameleon-VLA/openvla/notebooks/internvl2.5.ipynb#W1sdnNjb2RlLXJlbW90ZQ%3D%3D?line=14'>15</a>\u001b[0m )\u001b[39m.\u001b[39meval()\u001b[39m.\u001b[39mcuda()\n",
      "File \u001b[0;32m/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/conda/envs/vima/lib/python3.9/site-packages/torch/cuda/__init__.py:399\u001b[0m, in \u001b[0;36mset_device\u001b[0;34m(device)\u001b[0m\n\u001b[1;32m    397\u001b[0m device \u001b[39m=\u001b[39m _get_device_index(device)\n\u001b[1;32m    398\u001b[0m \u001b[39mif\u001b[39;00m device \u001b[39m>\u001b[39m\u001b[39m=\u001b[39m \u001b[39m0\u001b[39m:\n\u001b[0;32m--> 399\u001b[0m     torch\u001b[39m.\u001b[39;49m_C\u001b[39m.\u001b[39;49m_cuda_setDevice(device)\n",
      "File \u001b[0;32m/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/conda/envs/vima/lib/python3.9/site-packages/torch/cuda/__init__.py:293\u001b[0m, in \u001b[0;36m_lazy_init\u001b[0;34m()\u001b[0m\n\u001b[1;32m    291\u001b[0m \u001b[39mif\u001b[39;00m \u001b[39m\"\u001b[39m\u001b[39mCUDA_MODULE_LOADING\u001b[39m\u001b[39m\"\u001b[39m \u001b[39mnot\u001b[39;00m \u001b[39min\u001b[39;00m os\u001b[39m.\u001b[39menviron:\n\u001b[1;32m    292\u001b[0m     os\u001b[39m.\u001b[39menviron[\u001b[39m\"\u001b[39m\u001b[39mCUDA_MODULE_LOADING\u001b[39m\u001b[39m\"\u001b[39m] \u001b[39m=\u001b[39m \u001b[39m\"\u001b[39m\u001b[39mLAZY\u001b[39m\u001b[39m\"\u001b[39m\n\u001b[0;32m--> 293\u001b[0m torch\u001b[39m.\u001b[39;49m_C\u001b[39m.\u001b[39;49m_cuda_init()\n\u001b[1;32m    294\u001b[0m \u001b[39m# Some of the queued calls may reentrantly call _lazy_init();\u001b[39;00m\n\u001b[1;32m    295\u001b[0m \u001b[39m# we need to just return without initializing in that case.\u001b[39;00m\n\u001b[1;32m    296\u001b[0m \u001b[39m# However, we must not let any *other* threads in!\u001b[39;00m\n\u001b[1;32m    297\u001b[0m _tls\u001b[39m.\u001b[39mis_initializing \u001b[39m=\u001b[39m \u001b[39mTrue\u001b[39;00m\n",
      "\u001b[0;31mRuntimeError\u001b[0m: Found no NVIDIA driver on your system. Please check that you have an NVIDIA GPU and installed a driver from http://www.nvidia.com/Download/index.aspx"
     ]
    }
   ],
   "source": [
    "import torch\n",
    "from internvl.extern.hf.modeling_internvl import InternVLChatModel\n",
    "from internvl.extern.hf.tokenization_internlm2 import InternLM2Tokenizer\n",
    "\n",
    "torch.cuda.set_device(3)\n",
    "\n",
    "model_name_or_path = \"/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/cunxin/internvl_checkpoint/2b\"\n",
    "\n",
    "model = InternVLChatModel.from_pretrained(\n",
    "    model_name_or_path,\n",
    "    torch_dtype=torch.bfloat16,\n",
    "    low_cpu_mem_usage=True,\n",
    "    use_flash_attn=True,\n",
    "    local_files_only=True\n",
    ").eval().cuda()\n",
    "\n",
    "tokenizer = InternLM2Tokenizer.from_pretrained(\n",
    "    model_name_or_path,\n",
    "    local_files_only=True,\n",
    "    use_fast=False\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "446ffcbbe29e3411",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-12-19T06:12:47.077862Z",
     "start_time": "2024-12-19T06:12:32.218740Z"
    }
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Sorry, that's my mistake. What did you see in the image?\n",
      "\n",
      "![My apologies, as expected.](https://i.imgur.com/9q2Wg9M.png)\n"
     ]
    }
   ],
   "source": [
    "%matplotlib inline\n",
    "from internvl.extern.hf.processing_internvl import load_image_from_file, process_image\n",
    "import matplotlib.pyplot as plt\n",
    "from PIL import Image\n",
    "\n",
    "generation_config = dict(max_new_tokens=1024, do_sample=True)\n",
    "\n",
    "image_size = 224\n",
    "\n",
    "# url1 = 'http://images.cocodataset.org/val2017/000000039769.jpg'\n",
    "# url2 = 'http://images.cocodataset.org/val2017/000000009769.jpg'\n",
    "# img1, img2 = requests.get(url1, stream=True).raw, requests.get(url2, stream=True).raw\n",
    "img1, img2 = \"assets/+.jpg\", \"assets/000000039769.jpg\"\n",
    "img1 = Image.open(img1).convert('RGB')\n",
    "img2 = Image.open(img2).convert('RGB')\n",
    "img1 = img1.resize((image_size, image_size))\n",
    "# img2 = img2.resize((image_size, image_size))\n",
    "# plt.imshow(img1)\n",
    "pixel_values = process_image(img1, input_size=image_size).to(torch.bfloat16).cuda()\n",
    "# pixel_values1, pixel_values2 = load_image_from_file(img1).to(torch.bfloat16).cuda(), load_image_from_file(img2).to(torch.bfloat16).cuda()\n",
    "# pixel_values1 = pixel_values1[-1:, ...]\n",
    "# pixel_values2 = pixel_values2[-1:, ...]\n",
    "# pixel_values = torch.cat([pixel_values1, pixel_values2], dim=0)\n",
    "# num_patches_list = [pixel_values1.size(0), pixel_values2.size(0)]\n",
    "num_patches_list = [pixel_values.size(0)]\n",
    "# prompt = f\"What do you see separately in the following two images? Image1: <image>\\nImage2: <image>\"\n",
    "prompt = f\"What do you see separately in the following image? Image: <image>\"\n",
    "response, history = model.chat(tokenizer, pixel_values, prompt, generation_config,\n",
    "                               num_patches_list=num_patches_list,\n",
    "                               history=None, return_history=True)\n",
    "print(response)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a69adc33",
   "metadata": {},
   "outputs": [
    {
     "ename": "",
     "evalue": "",
     "output_type": "error",
     "traceback": [
      "\u001b[1;31mThe Kernel crashed while executing code in the the current cell or a previous cell. Please review the code in the cell(s) to identify a possible cause of the failure. Click <a href='https://aka.ms/vscodeJupyterKernelCrash'>here</a> for more info. View Jupyter <a href='command:jupyter.viewOutput'>log</a> for further details."
     ]
    }
   ],
   "source": [
    "print(model.language_model.get_output_embeddings().weight.data)\n",
    "print(model.language_model.get_input_embeddings().weight.data)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.21"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
