{"cells":[{"cell_type":"code","execution_count":5,"metadata":{"executionInfo":{"elapsed":3558,"status":"ok","timestamp":1673232455896,"user":{"displayName":"Yun Cheng","userId":"00325904972559050626"},"user_tz":300},"id":"wbxLvcuuV6tc"},"outputs":[],"source":["from torch import nn\n","import torch\n","import sys\n","import os\n","import numpy as np\n","import pandas as pd\n","from scipy.stats import entropy\n","\n","from sklearn.manifold import TSNE\n","from sklearn.decomposition import PCA\n","from sklearn.preprocessing import normalize\n","from sklearn.cluster import KMeans\n","import matplotlib.pyplot as plt2\n","import pickle"]},{"cell_type":"code","execution_count":3,"metadata":{"executionInfo":{"elapsed":4,"status":"ok","timestamp":1673232456880,"user":{"displayName":"Yun Cheng","userId":"00325904972559050626"},"user_tz":300},"id":"-WUWExmnK_KD"},"outputs":[],"source":["def clustering(X, pca=False, n_clusters=20):\n","  X = np.nan_to_num(X)\n","  if len(X.shape) > 2:\n","    X = X.reshape(X.shape[0],-1)\n","  if pca:\n","    # print(np.any(np.isnan(X)), np.all(np.isfinite(X)))\n","    X = normalize(X)\n","    X = PCA(n_components=5).fit_transform(X)\n","  kmeans = KMeans(n_clusters=n_clusters).fit(X)\n","  return kmeans.labels_"]},{"attachments":{},"cell_type":"markdown","metadata":{"id":"gnJNWCzFSBNx"},"source":["#### MOSI"]},{"cell_type":"code","execution_count":4,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":2290,"status":"ok","timestamp":1673232030387,"user":{"displayName":"Yun Cheng","userId":"00325904972559050626"},"user_tz":300},"id":"EzybOI24I5M3","outputId":"de7e7a8a-4092-46de-f46b-090d32b48275"},"outputs":[{"name":"stdout","output_type":"stream","text":["dict_keys(['train', 'valid', 'test'])\n"]}],"source":["data_dir = '/usr0/home/yuncheng/MultiBench/data/mosi_raw.pkl'\n","dataset = pd.read_pickle(data_dir)\n","print(dataset.keys())\n","print(dataset['train'].keys())"]},{"cell_type":"code","execution_count":22,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":5249,"status":"ok","timestamp":1673232035630,"user":{"displayName":"Yun Cheng","userId":"00325904972559050626"},"user_tz":300},"id":"Vamq88yMOgjF","outputId":"843c5b8a-62cd-4894-d5f5-7f7b895c5352"},"outputs":[{"name":"stderr","output_type":"stream","text":["/usr0/home/yuncheng/miniconda3/envs/multibench/lib/python3.9/site-packages/numpy/core/fromnumeric.py:86: RuntimeWarning: overflow encountered in reduce\n","  return ufunc.reduce(obj, axis, dtype, out, **passkwargs)\n","/usr0/home/yuncheng/miniconda3/envs/multibench/lib/python3.9/site-packages/numpy/core/fromnumeric.py:86: RuntimeWarning: overflow encountered in reduce\n","  return ufunc.reduce(obj, axis, dtype, out, **passkwargs)\n"]}],"source":["data_cluster = dict()\n","for split in dataset:\n","  data_cluster[split] = dict()\n","  data = dataset[split]\n","  data_cluster[split]['vision'] = clustering(data['vision'], pca=True).reshape(-1,1)\n","  data_cluster[split]['audio'] = clustering(data['audio'], pca=True).reshape(-1,1)\n","  data_cluster[split]['text'] = clustering(data['text'], pca=True).reshape(-1,1)\n","  data_cluster[split]['labels'] = (data['labels'][:,:,0]>0)*1\n","  data_cluster[split]['id'] = data['id']\n","with open('/usr0/home/yuncheng/MultiBench/synthetic/bounds/mosi_cluster.pickle', 'wb') as f:\n","    pickle.dump(data_cluster, f)"]},{"cell_type":"code","execution_count":6,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":319,"status":"ok","timestamp":1673231360042,"user":{"displayName":"Yun Cheng","userId":"00325904972559050626"},"user_tz":300},"id":"BU8TVfhTWIpl","outputId":"84b38ee4-0d63-4130-ca00-1a89c341480d"},"outputs":[],"source":["with open('/usr0/home/yuncheng/MultiBench/synthetic/bounds/mosi_cluster.pickle', 'rb') as f:\n","    file = pickle.load(f)\n","for split in file:\n","  data = file[split]\n","  for modality in ['vision', 'audio', 'text']:\n","    X = data[modality]\n","    print(split, modality, np.any(np.isnan(X)), np.all(np.isfinite(X)))\n","    \n","_, counts = np.unique(dataset['test']['labels'], return_counts=True)\n","pk = counts / np.sum(counts)\n","ent = entropy(pk, base=2)\n","file['test']['entropy'] = ent\n","with open('/usr0/home/yuncheng/MultiBench/synthetic/bounds/mosi_cluster.pickle', 'wb') as f:\n","    pickle.dump(file, f)"]},{"attachments":{},"cell_type":"markdown","metadata":{"id":"i8_XHhbvZzmG"},"source":["#### MOSEI"]},{"cell_type":"code","execution_count":8,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":42485,"status":"ok","timestamp":1673232719593,"user":{"displayName":"Yun Cheng","userId":"00325904972559050626"},"user_tz":300},"id":"lgUVrtdGZ0ud","outputId":"db27d01c-6357-4777-9118-635bd823d418"},"outputs":[{"name":"stdout","output_type":"stream","text":["dict_keys(['train', 'valid', 'test'])\n"]}],"source":["data_dir = '/usr0/home/yuncheng/MultiBench/data/mosei_raw.pkl'\n","dataset = pd.read_pickle(data_dir)\n","print(dataset.keys())\n","print(dataset['train'].keys())"]},{"cell_type":"code","execution_count":14,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":77000,"status":"ok","timestamp":1673232796573,"user":{"displayName":"Yun Cheng","userId":"00325904972559050626"},"user_tz":300},"id":"Ob-aM8u8apKP","outputId":"1780751c-5c7f-4d76-d045-703077c42761"},"outputs":[{"name":"stderr","output_type":"stream","text":["/usr0/home/yuncheng/miniconda3/envs/multibench/lib/python3.9/site-packages/numpy/core/fromnumeric.py:86: RuntimeWarning: overflow encountered in reduce\n","  return ufunc.reduce(obj, axis, dtype, out, **passkwargs)\n","/usr0/home/yuncheng/miniconda3/envs/multibench/lib/python3.9/site-packages/numpy/core/fromnumeric.py:86: RuntimeWarning: overflow encountered in reduce\n","  return ufunc.reduce(obj, axis, dtype, out, **passkwargs)\n","/usr0/home/yuncheng/miniconda3/envs/multibench/lib/python3.9/site-packages/numpy/core/fromnumeric.py:86: RuntimeWarning: overflow encountered in reduce\n","  return ufunc.reduce(obj, axis, dtype, out, **passkwargs)\n"]}],"source":["data_cluster = dict()\n","for split in dataset:\n","  data_cluster[split] = dict()\n","  data = dataset[split]\n","  data_cluster[split]['vision'] = clustering(data['vision'], pca=True).reshape(-1,1)\n","  data_cluster[split]['audio'] = clustering(data['audio'], pca=True).reshape(-1,1)\n","  data_cluster[split]['text'] = clustering(data['text'], pca=True).reshape(-1,1)\n","  data_cluster[split]['labels'] = (data['labels'][:,:,0]>0)*1\n","  data_cluster[split]['id'] = data['id']\n","with open('/usr0/home/yuncheng/MultiBench/synthetic/bounds/mosei_cluster.pickle', 'wb') as f:\n","    pickle.dump(data_cluster, f)"]},{"cell_type":"code","execution_count":9,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":223,"status":"ok","timestamp":1673232920983,"user":{"displayName":"Yun Cheng","userId":"00325904972559050626"},"user_tz":300},"id":"QVlGhyqEcy5Q","outputId":"b4d8b50a-eb6d-415f-bec6-d4868cf87e73"},"outputs":[],"source":["with open('/usr0/home/yuncheng/MultiBench/synthetic/bounds/mosei_cluster.pickle', 'rb') as f:\n","    file = pickle.load(f)\n","for split in file:\n","  data = file[split]\n","  for modality in ['vision', 'audio', 'text']:\n","    X = data[modality]\n","    print(split, modality, X.shape, np.any(np.isnan(X)), np.all(np.isfinite(X)))\n","    \n","_, counts = np.unique(dataset['test']['labels'], return_counts=True)\n","pk = counts / np.sum(counts)\n","ent = entropy(pk, base=2)\n","file['test']['entropy'] = ent\n","with open('/usr0/home/yuncheng/MultiBench/synthetic/bounds/mosei_cluster.pickle', 'wb') as f:\n","    pickle.dump(file, f)"]},{"attachments":{},"cell_type":"markdown","metadata":{"id":"TBW1eWwWXoCQ"},"source":["#### sarcasm"]},{"cell_type":"code","execution_count":10,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":615,"status":"ok","timestamp":1673232044706,"user":{"displayName":"Yun Cheng","userId":"00325904972559050626"},"user_tz":300},"id":"KGgrdrG_X9sQ","outputId":"cb03b831-1b6c-4688-d6c9-b8a76672cd4c"},"outputs":[{"name":"stdout","output_type":"stream","text":["dict_keys(['train', 'valid', 'test'])\n"]}],"source":["data_dir = '/usr0/home/yuncheng/MultiBench/data/sarcasm.pkl'\n","dataset = pd.read_pickle(data_dir)\n","print(dataset.keys())"]},{"cell_type":"code","execution_count":null,"metadata":{"executionInfo":{"elapsed":3201,"status":"ok","timestamp":1673232049000,"user":{"displayName":"Yun Cheng","userId":"00325904972559050626"},"user_tz":300},"id":"unGebSTzZg13"},"outputs":[],"source":["data_cluster = dict()\n","for split in dataset:\n","  data_cluster[split] = dict()\n","  data = dataset[split]\n","  data_cluster[split]['vision'] = clustering(data['vision'], pca=True).reshape(-1,1)\n","  data_cluster[split]['audio'] = clustering(data['audio'], pca=True).reshape(-1,1)\n","  data_cluster[split]['text'] = clustering(data['text'], pca=True).reshape(-1,1)\n","  data_cluster[split]['labels'] = data['labels']\n","  data_cluster[split]['id'] = data['id']\n","with open('/usr0/home/yuncheng/MultiBench/synthetic/bounds/sarcasm_cluster.pickle', 'wb') as f:\n","    pickle.dump(data_cluster, f)"]},{"cell_type":"code","execution_count":11,"metadata":{},"outputs":[],"source":["with open('/usr0/home/yuncheng/MultiBench/synthetic/bounds/sarcasm_cluster.pickle', 'rb') as f:\n","    file = pickle.load(f)\n","for split in file:\n","  data = file[split]\n","  for modality in ['vision', 'audio', 'text']:\n","    X = data[modality]\n","    print(split, modality, X.shape, np.any(np.isnan(X)), np.all(np.isfinite(X)))\n","    \n","_, counts = np.unique(dataset['test']['labels'], return_counts=True)\n","pk = counts / np.sum(counts)\n","ent = entropy(pk, base=2)\n","file['test']['entropy'] = ent\n","with open('/usr0/home/yuncheng/MultiBench/synthetic/bounds/sarcasm_cluster.pickle', 'wb') as f:\n","    pickle.dump(file, f)"]},{"attachments":{},"cell_type":"markdown","metadata":{"id":"CtJKIS6AbFcQ"},"source":["### humor"]},{"cell_type":"code","execution_count":12,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":16719,"status":"ok","timestamp":1673232633173,"user":{"displayName":"Yun Cheng","userId":"00325904972559050626"},"user_tz":300},"id":"2PJ-4ptOZkVM","outputId":"ca514e05-c196-4ea8-f3f1-53b3727439ff"},"outputs":[],"source":["data_dir = '/usr0/home/yuncheng/MultiBench/data/humor.pkl'\n","dataset = pd.read_pickle(data_dir)"]},{"cell_type":"code","execution_count":null,"metadata":{"executionInfo":{"elapsed":15156,"status":"ok","timestamp":1673232665372,"user":{"displayName":"Yun Cheng","userId":"00325904972559050626"},"user_tz":300},"id":"4uz95Krfb93s"},"outputs":[],"source":["data_cluster = dict()\n","for split in dataset:\n","  data_cluster[split] = dict()\n","  data = dataset[split]\n","  data_cluster[split]['vision'] = clustering(data['vision'], pca=True).reshape(-1,1)\n","  data_cluster[split]['audio'] = clustering(data['audio'], pca=True).reshape(-1,1)\n","  data_cluster[split]['text'] = clustering(data['text'], pca=True).reshape(-1,1)\n","  data_cluster[split]['labels'] = data['labels']\n","  data_cluster[split]['id'] = data['id']\n","with open('/usr0/home/yuncheng/MultiBench/synthetic/bounds/humor_cluster.pickle', 'wb') as f:\n","    pickle.dump(data_cluster, f)"]},{"cell_type":"code","execution_count":13,"metadata":{},"outputs":[],"source":["with open('/usr0/home/yuncheng/MultiBench/synthetic/bounds/humor_cluster.pickle', 'rb') as f:\n","    file = pickle.load(f)\n","for split in file:\n","  data = file[split]\n","  for modality in ['vision', 'audio', 'text']:\n","    X = data[modality]\n","    print(split, modality, X.shape, np.any(np.isnan(X)), np.all(np.isfinite(X)))\n","    \n","_, counts = np.unique(dataset['test']['labels'], return_counts=True)\n","pk = counts / np.sum(counts)\n","ent = entropy(pk, base=2)\n","file['test']['entropy'] = ent\n","with open('/usr0/home/yuncheng/MultiBench/synthetic/bounds/humor_cluster.pickle', 'wb') as f:\n","    pickle.dump(file, f)"]},{"attachments":{},"cell_type":"markdown","metadata":{},"source":["### avmnist"]},{"cell_type":"code","execution_count":26,"metadata":{},"outputs":[],"source":["audio = np.load('/usr0/home/yuncheng/MultiBench/data/avmnist/audio/test_data.npy')\n","image = np.load('/usr0/home/yuncheng/MultiBench/data/avmnist/image/test_data.npy')\n","labels = np.load('/usr0/home/yuncheng/MultiBench/data/avmnist/test_labels.npy')"]},{"cell_type":"code","execution_count":30,"metadata":{},"outputs":[],"source":["data_cluster = dict()\n","data_cluster['test'] = dict()\n","data_cluster[split]['audio'] = clustering(audio, pca=True).reshape(-1,1)\n","data_cluster[split]['image'] = clustering(image, pca=True).reshape(-1,1)\n","data_cluster[split]['labels'] = labels.reshape(-1,1)\n","with open('/usr0/home/yuncheng/MultiBench/synthetic/bounds/avmnist_cluster.pickle', 'wb') as f:\n","    pickle.dump(data_cluster, f)"]},{"attachments":{},"cell_type":"markdown","metadata":{},"source":["### enrico"]},{"cell_type":"code","execution_count":34,"metadata":{},"outputs":[],"source":["import csv\n","import random\n","from torchvision import transforms\n","from PIL import Image\n","\n","img_dim_x = 128\n","img_dim_y = 256\n","seq_len = 64\n","csv_file = \"/usr0/home/yuncheng/MultiBench/data/dataset/design_topics.csv\"\n","img_dir = \"/usr0/home/yuncheng/MultiBench/data/dataset/screenshots\"\n","wireframe_dir = \"/usr0/home/yuncheng/MultiBench/data/dataset/wireframes\"\n","hierarchy_dir = \"/usr0/home/yuncheng/MultiBench/data/dataset/hierarchies\"\n","with open(csv_file, \"r\") as f:\n","    reader = csv.DictReader(f)\n","    example_list = list(reader)\n","\n","# the wireframe files are corrupted for these files\n","IGNORES = set([\"50105\", \"50109\"])\n","example_list = [e for e in example_list if e['screen_id'] not in IGNORES]\n","keys = list(range(len(example_list)))\n","# shuffle and create splits\n","random.Random(42).shuffle(keys)\n","\n","# test split\n","train_split = 0.65\n","val_split = 0.15\n","start_index = int(len(example_list) * (train_split + val_split))\n","stop_index = len(example_list)\n","keys = keys[start_index:stop_index]\n","\n","img_transforms = [\n","            transforms.Resize((img_dim_y, img_dim_x)),\n","            transforms.ToTensor()\n","        ]\n","img_transforms = transforms.Compose(img_transforms)\n","\n","# make maps\n","topics = set()\n","for e in example_list:\n","    topics.add(e['topic'])\n","topics = sorted(list(topics))\n","idx2Topic = {}\n","topic2Idx = {}\n","for i in range(len(topics)):\n","    idx2Topic[i] = topics[i]\n","    topic2Idx[topics[i]] = i\n","UI_TYPES = [\"Text\", \"Text Button\", \"Icon\", \"Card\", \"Drawer\", \"Web View\", \"List Item\", \"Toolbar\", \"Bottom Navigation\", \"Multi-Tab\", \"List Item\", \"Toolbar\", \"Bottom Navigation\", \"Multi-Tab\",\n","                    \"Background Image\", \"Image\", \"Video\", \"Input\", \"Number Stepper\", \"Checkbox\", \"Radio Button\", \"Pager Indicator\", \"On/Off Switch\", \"Modal\", \"Slider\", \"Advertisement\", \"Date Picker\", \"Map View\"]\n","idx2Label = {}\n","label2Idx = {}\n","for i in range(len(UI_TYPES)):\n","    idx2Label[i] = UI_TYPES[i]\n","    label2Idx[UI_TYPES[i]] = i"]},{"cell_type":"code","execution_count":39,"metadata":{},"outputs":[{"name":"stderr","output_type":"stream","text":["/usr0/home/yuncheng/miniconda3/envs/multibench/lib/python3.9/site-packages/PIL/Image.py:992: UserWarning: Palette images with Transparency expressed in bytes should be converted to RGBA images\n","  warnings.warn(\n"]}],"source":["screenImgs = []\n","screenWireframeImgs = []\n","screenLabels = []\n","for idx in range(len(keys)):\n","    example = example_list[keys[idx]]\n","    screenId = example['screen_id']\n","    # image modality\n","    screenImg = Image.open(os.path.join(img_dir, screenId + \".jpg\")).convert(\"RGB\")\n","    screenImg = img_transforms(screenImg)\n","    # wireframe image modality\n","    screenWireframeImg = Image.open(os.path.join(wireframe_dir, screenId + \".png\")).convert(\"RGB\")\n","    screenWireframeImg = img_transforms(screenWireframeImg)\n","    # label\n","    screenLabel = topic2Idx[example['topic']]\n","    screenImgs.append(screenImg.numpy())\n","    screenWireframeImgs.append(screenWireframeImg.numpy())\n","    screenLabels.append(screenLabel)"]},{"cell_type":"code","execution_count":41,"metadata":{},"outputs":[],"source":["data_cluster = dict()\n","data_cluster['test'] = dict()\n","data_cluster[split]['image'] = clustering(np.array(screenImgs), pca=True).reshape(-1,1)\n","data_cluster[split]['wireframe'] = clustering(np.array(screenWireframeImgs), pca=True).reshape(-1,1)\n","data_cluster[split]['labels'] = np.array(screenLabels).reshape(-1,1)\n","with open('/usr0/home/yuncheng/MultiBench/synthetic/bounds/enrico_cluster.pickle', 'wb') as f:\n","    pickle.dump(data_cluster, f)"]},{"cell_type":"code","execution_count":null,"metadata":{},"outputs":[],"source":[]}],"metadata":{"colab":{"machine_shape":"hm","provenance":[{"file_id":"1qLjxRERCTRpgQgXjF4CNgERBonXWoIQw","timestamp":1673227051889},{"file_id":"https://github.com/pliang279/MultiBench/blob/main/examples/Multibench_Example_Usage_On_Colab_Part_3_MCTN.ipynb","timestamp":1668715594346}]},"gpuClass":"premium","kernelspec":{"display_name":"Python 3","name":"python3"},"language_info":{"codemirror_mode":{"name":"ipython","version":3},"file_extension":".py","mimetype":"text/x-python","name":"python","nbconvert_exporter":"python","pygments_lexer":"ipython3","version":"3.9.6"}},"nbformat":4,"nbformat_minor":0}
