{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ce977b02-580b-41ff-8b79-f3792be87e55",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "from PIL import Image, ImageDraw, ImageFont,ImageColor\n",
    "\n",
    "class SmartwatchGenerator:\n",
    "    def __init__(self, size=(224, 224)):\n",
    "        self.size = size\n",
    "        self.center = (size[0]//2, size[1]//2)\n",
    "        self.radius = int(min(size)*0.4)\n",
    "        self.font = ImageFont.load_default()\n",
    "        self.image=None\n",
    "    def draw_watch_face(self, draw, material_type, \n",
    "                   material_color=(128,128,128),\n",
    "                   grid_spacing=5,\n",
    "                   material_alpha=255):\n",
    "        \"\"\"\n",
    "        绘制智能手表表盘主体，支持完整颜色控制\n",
    "        \n",
    "        参数:\n",
    "        material_type (str): 材质类型('mesh','noise','pure')\n",
    "        face_color (str/tuple): 纯色材质颜色\n",
    "        mesh_color (tuple): 网格线条颜色（RGB）\n",
    "        noise_color (tuple): 噪点基色（RGB）\n",
    "        grid_spacing (int): 网格线间隔像素\n",
    "        material_alpha (int): 整体透明度(0-255)\n",
    "        \"\"\"\n",
    "        # 创建圆形遮罩\n",
    "        mask = Image.new('L', self.size, 0)\n",
    "        mask_draw = ImageDraw.Draw(mask)\n",
    "        mask_draw.ellipse([self.center[0]-self.radius, self.center[1]-self.radius,\n",
    "                          self.center[0]+self.radius, self.center[1]+self.radius], \n",
    "                          fill=255)\n",
    "        \n",
    "        # 生成材质纹理\n",
    "        material = self.create_material(material_type, \n",
    "                                       face_color=material_color,\n",
    "                                       mesh_color=material_color,\n",
    "                                       noise_color=material_color,\n",
    "                                       grid_spacing=grid_spacing)\n",
    "        \n",
    "        # 处理透明度\n",
    "        material = material.convert('RGBA')\n",
    "        material.putalpha(mask)\n",
    "        r, g, b, a = material.split()\n",
    "        new_alpha = a.point( lambda x: int(x * material_alpha/255))\n",
    "        material.putalpha(new_alpha)  # 直接应用新Alpha\n",
    "        return material\n",
    "    \n",
    "    def create_material(self, material_type, **kwargs):\n",
    "        \"\"\"增强版材质生成器，支持颜色参数\"\"\"\n",
    "        if material_type == 'mesh':\n",
    "            # 网格材质实现\n",
    "            grid_color = kwargs.get('mesh_color', (0,0,0))\n",
    "            grid_color = grid_color if isinstance(grid_color, tuple) else ImageColor.getrgb(grid_color)\n",
    "            grid_spacing = kwargs.get('grid_spacing', 5)\n",
    "            \n",
    "            # 创建透明背景\n",
    "            arr = np.ones((self.size[1], self.size[0], 4), dtype=np.uint8)*255\n",
    "            # 绘制水平线\n",
    "            arr[::grid_spacing, :, :3] = grid_color\n",
    "            arr[:, ::grid_spacing, :3] = grid_color\n",
    "            return Image.fromarray(arr)\n",
    "        \n",
    "        elif material_type == 'noise':\n",
    "            # 彩色噪点材质\n",
    "            base_color = kwargs.get('noise_color', (128,128,128))\n",
    "            base_color = base_color if isinstance(base_color, tuple) else ImageColor.getrgb(base_color)\n",
    "            noise = np.ones((self.size[1], self.size[0], 4), dtype=np.uint8)*255\n",
    "            # 生成彩色噪点\n",
    "            noise[:, :, :3] = np.random.randint(0, 20, \n",
    "                                               (self.size[1], self.size[0], 3), \n",
    "                                               dtype=np.uint8) + base_color\n",
    "            return Image.fromarray(noise.clip(0,255))\n",
    "        \n",
    "        else:  # pure\n",
    "            # 纯色材质\n",
    "            color = kwargs.get('face_color', (128,128,128))\n",
    "            color = color if isinstance(color, tuple) else ImageColor.getrgb(color)\n",
    "            \n",
    "            \n",
    "            return Image.new('RGBA', self.size, (*color, 255))\n",
    "\n",
    "    \n",
    "\n",
    "    def add_clock_hands(self, draw, hour, minute, second, colors):\n",
    "        angles = [\n",
    "            (hour % 12 + minute/60) * 30 - 90,  # Hour hand\n",
    "            minute * 6 - 90,                    # Minute hand\n",
    "            second * 6 - 90                     # Second hand\n",
    "        ]\n",
    "        \n",
    "        lengths = [\n",
    "            self.radius * 0.5,\n",
    "            self.radius * 0.7,\n",
    "            self.radius * 0.9\n",
    "        ]\n",
    "        \n",
    "        for i in range(3):\n",
    "            end_x = self.center[0] + lengths[i] * np.cos(np.radians(angles[i]))\n",
    "            end_y = self.center[1] + lengths[i] * np.sin(np.radians(angles[i]))\n",
    "            draw.line([self.center[0], self.center[1], end_x, end_y], \n",
    "                     fill=colors[i], width=6-i*2)\n",
    "\n",
    "   \n",
    "\n",
    "    def add_weather(self, draw, weather, position, icon_size=30):\n",
    "        \"\"\"\n",
    "        使用预渲染的PNG图标显示天气\n",
    "        :param weather: 天气类型（对应文件名，如'sunny'）\n",
    "        :param position: 显示位置（'top-left'等）\n",
    "        :param icon_size: 图标目标尺寸\n",
    "        \"\"\"\n",
    "       \n",
    "        # 加载天气图标（假设与脚本同目录）\n",
    "        icon_path = f\"./{weather}.png\"\n",
    "        weather_icon = Image.open(icon_path)\n",
    "        \n",
    "        # 缩放图标到指定尺寸\n",
    "        weather_icon = weather_icon.resize((icon_size, icon_size))\n",
    "        \n",
    "        # 计算粘贴位置\n",
    "        x, y = self.get_corner_position(position)\n",
    "        # 粘贴到主画布\n",
    "        self.image.paste(weather_icon, (x, y), weather_icon)\n",
    "        \n",
    "                             \n",
    "    def add_battery(self, draw, percentage, position):\n",
    "        x, y = self.get_corner_position(position)\n",
    "        draw.rectangle([x, y, x+25, y+10], outline='black', width=1)\n",
    "        fill_width = int(23 * percentage/100)\n",
    "        draw.rectangle([x+2, y+2, x+2+fill_width, y+8], fill='green')\n",
    "        draw.text((x+30, y), f\"{percentage}%\", fill='black', font=self.font)\n",
    "\n",
    "    def get_corner_position(self, position):\n",
    "        margin = 10\n",
    "        if position == 'top-left':\n",
    "            return (margin, margin)\n",
    "        elif position == 'top-right':\n",
    "            return (self.size[0]-50, margin)\n",
    "        elif position == 'bottom-left':\n",
    "            return (margin, self.size[1]-30)\n",
    "        else:  # bottom-right\n",
    "            return (self.size[0]-50, self.size[1]-30)\n",
    "\n",
    "    def generate(self, hour=12, minute=0, second=0,\n",
    "                hour_color=(0,0,0), minute_color=(100,100,100), second_color=(255,0,0),\n",
    "                material='mesh',material_color='#FFD700',material_alpha=50, weather='sunny', battery=100,\n",
    "                weather_pos='top-left', battery_pos='bottom-right'):\n",
    "        \n",
    "        # Create base image\n",
    "        base = Image.new('RGBA', self.size, (255,255,255,255))\n",
    "        self.image=base\n",
    "        draw = ImageDraw.Draw(base)\n",
    "        \n",
    "        # Draw watch face with material\n",
    "        watch_face = self.draw_watch_face(draw, material, \n",
    "                                 material_color=material_color, \n",
    "                                 material_alpha=material_alpha)\n",
    "        # 明确指定Alpha通道作为掩码\n",
    "        alpha_mask = watch_face.getchannel('A')\n",
    "    \n",
    "        base.paste(watch_face, (0,0), mask=alpha_mask)\n",
    "        \n",
    "        # Draw clock elements\n",
    "        self.add_clock_hands(draw, hour, minute, second, \n",
    "                            [hour_color, minute_color, second_color])\n",
    "        \n",
    "        # Add information displays\n",
    "        self.add_weather(draw, weather, weather_pos)\n",
    "        self.add_battery(draw, battery, battery_pos)\n",
    "        \n",
    "        return base.convert('RGB')\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a8c63304-a68a-48a9-bfe8-500699873894",
   "metadata": {},
   "outputs": [],
   "source": [
    "def quantize_color(rgb):\n",
    "    color_map = {\n",
    "        'R': 'Dark' if rgb[0] < 64 else 'Medium' if rgb[0] < 128 else 'Light' if rgb[0] < 192 else 'Bright',\n",
    "        'G': 'Dark' if rgb[1] < 64 else 'Medium' if rgb[1] < 128 else 'Light' if rgb[1] < 192 else 'Bright',\n",
    "        'B': 'Dark' if rgb[2] < 64 else 'Medium' if rgb[2] < 128 else 'Light' if rgb[2] < 192 else 'Bright'\n",
    "    }\n",
    "    return f\"{color_map['R']}-{color_map['G']}-{color_map['B']}\"\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "56112688-1132-4b92-9aa2-bd91824736b1",
   "metadata": {},
   "outputs": [],
   "source": [
    "import random\n",
    "\n",
    "# What is 模板 (10个/属性)\n",
    "WHAT_TEMPLATES = {\n",
    "    'color': [\n",
    "        \"What is the color of the {}?\",\n",
    "        \"Can you tell the {} color?\",\n",
    "        \"What color is the {}?\",\n",
    "        \"Identify the {} color.\",\n",
    "        \"Describe the {}'s color.\",\n",
    "        \"What hue is used for the {}?\",\n",
    "        \"What shade is the {}?\",\n",
    "        \"What is the {}'s color scheme?\",\n",
    "        \"What color tone does the {} have?\",\n",
    "        \"What is the {} colored?\"\n",
    "    ],\n",
    "    'weather': [\n",
    "        \"What weather condition is shown?\",\n",
    "        \"What is the current weather?\",\n",
    "        \"Describe the weather displayed.\",\n",
    "        \"What climate is indicated?\",\n",
    "        \"What meteorological condition is visible?\",\n",
    "        \"What is the atmospheric condition?\",\n",
    "        \"What type of weather is depicted?\",\n",
    "        \"Identify the weather situation.\",\n",
    "        \"What is the weather forecast showing?\",\n",
    "    ],\n",
    "    'texture': [\n",
    "        \"What material texture is used in the watch face?\",\n",
    "        \"Describe the watch face texture.\",\n",
    "        \"What surface pattern is visible in the watch face?\",\n",
    "        \"What is the texture type of the watch face?\",\n",
    "        \"Identify the material pattern of the watch face.\",\n",
    "        \"What design texture is applied on the watch face?\",\n",
    "        \"What is the watch face surface finish?\",\n",
    "        \"What kind of texture is shown on the watch face?\",\n",
    "        \"What material effect is used on the watch face?\",\n",
    "        \"What is the pattern style on the watch face?\"\n",
    "    ],\n",
    "    'time': [\n",
    "        \"What is the current time?\",\n",
    "        \"What time does the watch show?\",\n",
    "        \"What hour/minute/second is displayed?\",\n",
    "        \"What's the exact time shown?\",\n",
    "        \"What is the time configuration?\",\n",
    "        \"What time is indicated?\",\n",
    "        \"What is the time reading?\",\n",
    "        \"What time is displayed?\",\n",
    "        \"What is the watch showing?\",\n",
    "        \"What's the time value?\"\n",
    "    ],\n",
    "    'battery': [\n",
    "        \"What is the battery percentage?\",\n",
    "        \"What battery level is shown?\",\n",
    "        \"What is the power status?\",\n",
    "        \"What's the remaining battery?\",\n",
    "        \"What is the battery capacity?\",\n",
    "        \"What percentage is displayed?\",\n",
    "        \"What is the battery status?\",\n",
    "        \"How much battery is left?\",\n",
    "        \"What is the charge level?\",\n",
    "        \"What's the battery indicator showing?\"\n",
    "    ]\n",
    "}\n",
    "\n",
    "# Where is 模板 (10个/属性)\n",
    "WHERE_TEMPLATES = {\n",
    "    'battery_pos': [\n",
    "        \"Where is the battery indicator located?\",\n",
    "        \"Where is the battery displayed?\",\n",
    "        \"What corner shows the battery?\",\n",
    "        \"Where is the power status shown?\",\n",
    "        \"Where to find the battery info?\",\n",
    "        \"Where is the charge level visible?\",\n",
    "        \"Where is the battery percentage placed?\",\n",
    "        \"In which corner is the battery?\",\n",
    "        \"Where is the battery positioned?\",\n",
    "        \"Where can you see the battery level?\"\n",
    "    ],\n",
    "    'weather_pos': [\n",
    "        \"Where is the weather displayed?\",\n",
    "        \"Where is the climate info shown?\",\n",
    "        \"What corner has the weather?\",\n",
    "        \"Where is the meteorological data?\",\n",
    "        \"Where to find the weather condition?\",\n",
    "        \"Where is the precipitation info?\",\n",
    "        \"Where is the atmospheric data?\",\n",
    "        \"In which corner is the weather?\",\n",
    "        \"Where is the forecast positioned?\",\n",
    "        \"Where can you see the weather icon?\"\n",
    "    ]\n",
    "}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "92f64e59-ceba-48ff-89e9-af0c2c92d113",
   "metadata": {},
   "outputs": [],
   "source": [
    "class VQAGenerator:\n",
    "    def __init__(self, watch_params):\n",
    "        self.params = watch_params\n",
    "        \n",
    "    def generate_qa_pair(self):\n",
    "        # 随机选择问题类型\n",
    "        question_type = random.choice(['what', 'what', 'what', 'where','where'])\n",
    "        \n",
    "        # 根据类型选择属性\n",
    "        if question_type == 'what':\n",
    "            attribute = random.choice([\n",
    "                'weather', 'time', 'battery'\n",
    "            ])\n",
    "            q_template=random.choice(WHAT_TEMPLATES[attribute])\n",
    "        else:\n",
    "            attribute = random.choice(['battery_pos', 'weather_pos'])\n",
    "            q_template=random.choice(WHERE_TEMPLATES[attribute])\n",
    "        \n",
    "        # 获取属性值\n",
    "        value = self.get_attribute_value(attribute)\n",
    "\n",
    "        # 特殊处理颜色属性\n",
    "        if attribute == 'color':\n",
    "            element = random.choice(['hour hand', 'minute hand', \n",
    "                                    'second hand', 'watch face'])\n",
    "            color = self.get_color_value(element)\n",
    "            answer = quantize_color(color)\n",
    "            q_template = q_template.format(element)\n",
    "        else:\n",
    "            answer = value\n",
    "        \n",
    "        return q_template, answer\n",
    "\n",
    "    def get_attribute_value(self, attribute):\n",
    "        mapping = {\n",
    "            'weather': self.params['weather'],\n",
    "            'texture': self.params['material'],\n",
    "            'time': f\"{self.params['hour']:02}:{self.params['minute']:02}:{self.params['second']:02}\",\n",
    "            'battery': f\"{self.params['battery']}%\",\n",
    "            'weather_pos': self.params['weather_pos'],\n",
    "            'battery_pos': self.params['battery_pos']\n",
    "        }\n",
    "        return mapping.get(attribute, None)\n",
    "    \n",
    "    def get_color_value(self, element):\n",
    "        color_map = {\n",
    "            'hour hand': self.params['hour_color'],\n",
    "            'minute hand': self.params['minute_color'],\n",
    "            'second hand': self.params['second_color'],\n",
    "            'watch face': self.params['material_color']\n",
    "        }\n",
    "        return color_map[element]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "2d1f61be-a964-450b-89ec-48fe668ef428",
   "metadata": {},
   "outputs": [],
   "source": [
    "CAPTION_ATTRIBUTES = {\n",
    "    # 核心属性（必现）\n",
    "    'time': 1,\n",
    "    \n",
    "    # 颜色属性\n",
    "    'hour_color': 0,\n",
    "    'minute_color': 0,\n",
    "    'second_color': 0,\n",
    "    \n",
    "    # 材质属性\n",
    "    'material': 0,\n",
    "    \n",
    "    # 状态属性\n",
    "    'weather': 0.5,\n",
    "    'battery': 0.5,\n",
    "    \n",
    "    # 位置属性\n",
    "    'weather_pos': 0.5,\n",
    "    'battery_pos': 0.5\n",
    "}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "89fb1516-35be-445c-ab64-b3f236552fc7",
   "metadata": {},
   "outputs": [],
   "source": [
    "CAPTION_TEMPLATES = {\n",
    "    # 时间模板\n",
    "    'time': [\n",
    "        \", on which the current time is {}\",\n",
    "        \", displaying {}\",\n",
    "        \", showing the time {}\",\n",
    "        \", on which the time reads {}\"\n",
    "    ],\n",
    "    \n",
    "    # 颜色模板\n",
    "    'hour_color': [\n",
    "        \", with an hour hand colored {}\",\n",
    "        \", featuring {} hour hand\",\n",
    "        \", with hour hand in {}\"\n",
    "    ],\n",
    "    'minute_color': [\n",
    "        \", with minute hand in {}\",\n",
    "        \", with {} minute hand\",\n",
    "        \", featuring {} minute pointer\"\n",
    "    ],\n",
    "    'second_color': [\n",
    "        \", with second hand colored {}\",\n",
    "        \", with a {} second pointer\",\n",
    "        \", featuring {} second hand\"\n",
    "    ],\n",
    "    \n",
    "    # 材质模板\n",
    "    'material': [\n",
    "        \", on a {} watch face\",\n",
    "        \", with {} textured background\",\n",
    "        \", featuring {} surface\"\n",
    "    ],\n",
    "    \n",
    "    # 状态模板\n",
    "    'weather': [\n",
    "        \", showing {} weather\",\n",
    "        \", with {} weather displayed\",\n",
    "        \", indicating {} conditions\"\n",
    "    ],\n",
    "    'battery': [\n",
    "        \", with {}% battery\",\n",
    "        \", showing {}% charge\",\n",
    "        \", displaying {}% power level\"\n",
    "    ],\n",
    "    \n",
    "    # 位置模板\n",
    "    'weather_pos': [\n",
    "        \", with weather displayed at {}\",\n",
    "        \", with weather indicator at {}\",\n",
    "        \", with weather shown in the {} corner\"\n",
    "    ],\n",
    "    'battery_pos': [\n",
    "        \", with battery level at {}\",\n",
    "        \", with battery indicator at {}\",\n",
    "        \", power status displayed in {}\"\n",
    "    ],\n",
    "    'caption_a':[\n",
    "        \"The image shows a smart watch\",\n",
    "        \"There is a watch on the image\",\n",
    "        \"A smart watch is show in the image\"\n",
    "    ],\n",
    "    'generation_q':[\n",
    "        \"Can you generate a image of a smart watch\",\n",
    "        \"Can you draw a smart watch\",\n",
    "        \"Please show a smart watch\"\n",
    "    ],\n",
    "\n",
    "    'caption_q':[\n",
    "        \"<image>\\nWhat are the key components and features of this image?\",\n",
    "        \"<image>\\nCould you outline the primary elements of this watch?\",\n",
    "        \"<image>\\nWhat main features define the appearance of this user interface?\",\n",
    "        \"<image>\\nPlease identify the central elements and characteristics of this watch design.\",\n",
    "        \"<image>\\nHow would you describe the core features of this image's visual layout?\",\n",
    "        \"<image>\\nWhat are the standout elements in this smartwatch interface's design?\",\n",
    "        \"<image>\\nCould you detail the principal components of this watch face's structure?\",\n",
    "        \"<image>\\nWhat visual features are most prominent in this image?\",\n",
    "        \"<image>\\nPlease list the main aspects that make up this user interface.\",\n",
    "        \"<image>\\nHow would you characterize the key elements of this watch's user interface?\"\n",
    "    ],\n",
    "    'generation_a':[\n",
    "        \"Sure, here is the image. \\n<image>\",\n",
    "        \"The image is shown as you wish. \\n<image>\",\n",
    "        \"The image is generated. \\n<image>\"\n",
    "    ]\n",
    "}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "04f61a3e-febd-4d78-b5ee-d22a838b0c90",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "def generate_caption(params,base, attributes=CAPTION_ATTRIBUTES):\n",
    "    selected = []\n",
    "    for key, prob in attributes.items():\n",
    "        if random.random() < prob:\n",
    "            selected.append(key)\n",
    "    # 确保不空\n",
    "    if len(selected)==0:\n",
    "        selected.append('time')\n",
    "    \n",
    "    # 添加其他属性\n",
    "    for attr in selected:\n",
    "        template = random.choice(CAPTION_TEMPLATES[attr])\n",
    "        if attr == 'time':\n",
    "            value=f\"{params['hour']:02}:{params['minute']:02}:{params['second']:02}\"\n",
    "        elif attr == 'hour_color':\n",
    "            value = quantize_color(params['hour_color'])\n",
    "        elif attr == 'minute_color':\n",
    "            value = quantize_color(params['minute_color'])\n",
    "        elif attr == 'second_color':\n",
    "            value = quantize_color(params['second_color'])\n",
    "        elif attr== 'material':\n",
    "            value=quantize_color(params['material_color'])\n",
    "            if random.random() < 0.5:\n",
    "                value+=f\" {params['material']}\"\n",
    "        else:\n",
    "            value = params[attr]\n",
    "        \n",
    "        # 替换占位符\n",
    "        formatted = template.format(value)\n",
    "        base += formatted\n",
    "    \n",
    "    # 优化句子结构\n",
    "    base = base.replace(\"  \", \" \").capitalize()\n",
    "    if base.endswith(','):\n",
    "        base = base[:-1]\n",
    "    return base + '.' if not base.endswith('.') else base\n",
    "\n",
    "def generate_caption_QA(params,mode):\n",
    "    Q=None\n",
    "    A=None\n",
    "    if mode=='caption':\n",
    "        Q=random.choice(CAPTION_TEMPLATES['caption_q'])\n",
    "        A=generate_caption(params,random.choice(CAPTION_TEMPLATES['caption_a']))\n",
    "    elif mode=='generation':\n",
    "        Q=generate_caption(params,random.choice(CAPTION_TEMPLATES['generation_q']))\n",
    "        A=random.choice(CAPTION_TEMPLATES['generation_a'])\n",
    "    return Q, A"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "006a3a64-38c0-483a-b015-4ded275462c2",
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "import os\n",
    "from tqdm import tqdm\n",
    "\n",
    "# set the data path and number of samples here\n",
    "image_folder = '.../smart_watch_image_train'\n",
    "data_file_path= '.../smart_watch_train.json'\n",
    "num_of_samples = 60000\n",
    "\n",
    "os.makedirs(image_folder, exist_ok=True)\n",
    "generator = SmartwatchGenerator()\n",
    "samples=[]\n",
    "for index in tqdm(range(num_of_samples)):\n",
    "    watch_params={}\n",
    "    watch_params['hour'] = random.randint(0, 12)\n",
    "    watch_params['minute'] = random.randint(0, 59)\n",
    "    watch_params['second'] = random.randint(0, 59)\n",
    "    # watch_params['hour_color'] = tuple(random.randint(0, 255) for _ in range(3))\n",
    "    # watch_params['minute_color'] = tuple(random.randint(0, 255) for _ in range(3))\n",
    "    # watch_params['second_color'] = tuple(random.randint(0, 255) for _ in range(3))\n",
    "    #watch_params['material'] = random.choice(['mesh', 'noise', 'pure'])\n",
    "    watch_params['material_color'] = tuple(random.randint(0, 255) for _ in range(3))\n",
    "    watch_params['hour_color'] = (255,255,255)\n",
    "    watch_params['minute_color'] = (255,255,255)\n",
    "    watch_params['second_color'] = (255,255,255)\n",
    "    watch_params['material'] = 'pure'\n",
    "    # watch_params['material_color'] = (0,0,0)\n",
    "    watch_params['weather'] = random.choice(['sunny', 'cloudy', 'raining'])\n",
    "    watch_params['battery'] = random.randint(0, 100)\n",
    "    pos_list= ['top-left', 'top-right', 'bottom-left', 'bottom-right']\n",
    "    pos=random.sample(pos_list,2)\n",
    "    watch_params['weather_pos'] = pos[0]\n",
    "    watch_params['battery_pos'] = pos[1]\n",
    "\n",
    "\n",
    "    # image generation -----------------------------------\n",
    "    vqa_gen = VQAGenerator(watch_params)\n",
    "    image = generator.generate(\n",
    "        hour=watch_params['hour'], minute=watch_params['minute'], second=watch_params['second'],\n",
    "        hour_color=watch_params['hour_color'], minute_color=watch_params['minute_color'], second_color=watch_params['second_color'],\n",
    "        material=watch_params['material'], material_color=watch_params['material_color'], material_alpha=255,\n",
    "        weather=watch_params['weather'], battery=watch_params['battery'],\n",
    "        weather_pos=watch_params['weather_pos'], battery_pos=watch_params['battery_pos']\n",
    "    )\n",
    "    image_file_path=f\"{index}.png\"\n",
    "    full_image_file_path=f\"{image_folder}/{image_file_path}\"\n",
    "    image.save(full_image_file_path,format='PNG')\n",
    "\n",
    "\n",
    "    # generation data generation -----------------------------------\n",
    "    Gen_data={\n",
    "        \"task\": \"generation\",\n",
    "        \"image\": image_file_path,\n",
    "        \"conversations\":[]\n",
    "    }\n",
    "    q,a=generate_caption_QA(watch_params,'generation')\n",
    "    Gen_data['conversations'].append({\"from\": \"human\", \"value\": q})\n",
    "    Gen_data['conversations'].append({\"from\": \"gpt\", \"value\": a})\n",
    "    samples.append(Gen_data)\n",
    "\n",
    "\n",
    "    # vqa data generation -----------------------------------\n",
    "    VQA_data={\n",
    "        \"task\": \"vqa\",\n",
    "        \"image\": image_file_path,\n",
    "        \"conversations\":[]\n",
    "    }\n",
    "    q, a = vqa_gen.generate_qa_pair()\n",
    "    VQA_data['conversations'].append({\"from\": \"human\", \"value\": q})\n",
    "    VQA_data['conversations'].append({\"from\": \"gpt\", \"value\": a})\n",
    "    for i in range(3):\n",
    "        if random.random() < 0.4:\n",
    "            q, a = vqa_gen.generate_qa_pair()\n",
    "            VQA_data['conversations'].append({\"from\": \"human\", \"value\": q})\n",
    "            VQA_data['conversations'].append({\"from\": \"gpt\", \"value\": a})\n",
    "    VQA_data['conversations'][0]['value']='<image>\\n'+VQA_data['conversations'][0]['value']\n",
    "    samples.append(VQA_data)\n",
    "\n",
    "    # caption data generation -----------------------------------\n",
    "    Caption_data={\n",
    "        \"task\": \"caption\",\n",
    "        \"image\": image_file_path,\n",
    "        \"conversations\":[]\n",
    "    }\n",
    "    q,a=generate_caption_QA(watch_params,'caption')\n",
    "    Caption_data['conversations'].append({\"from\": \"human\", \"value\": q})\n",
    "    Caption_data['conversations'].append({\"from\": \"gpt\", \"value\": a})\n",
    "    samples.append(Caption_data)\n",
    "\n",
    "\n",
    "with open(data_file_path, \"w\") as f:\n",
    "    json.dump(samples, f, indent=4)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "multimodal",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.21"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
